generator_gan.py


import math
import os
from timeit import default_timer as timer

import numpy as np
import tensorflow as tf

from image import ImageVariations
from network import image_decoder, image_encoder, image_output, gan_optimizer

LOG_DIR = 'logs'

class GANetwork():

    def __init__(self, name, setup=True, image_size=64, colors=3, batch_size=64, directory='network', image_manager=None,
                 input_size=64, learning_rate=0.0002, dropout=0.4, generator_convolutions=5, generator_base_width=32,
                 discriminator_convolutions=4, discriminator_base_width=32, classification_depth=1, grid_size=4,
                 log=True, y_offset=0.1, learning_momentum=0.6, learning_momentum2=0.9, learning_pivot=10000,
                 dicriminator_scaling_favor=3):
        """
        Create a GAN for generating images
        Args:
          name: The name of the network
          setup: Initialize the network in the constructor
          image_size: The size of the generated images
          colors: number of color layers (3 is rgb, 1 is grayscale)
          batch_size: images per training batch
          directory: where to save the trained network
          image_manager: a class generating real images for training
          input_size: the number of images fed to the generator when generating an image
          learning_rate: the initial rate of learning
          dropout: improve the discriminator with some dropout
          generator_convolutions: the number of convolutional layers in the generator
          generator_base_width: the base number of convolution kernels per layer in the generator
          discriminator_convolutions: the number of convolutional layers in the discriminator
          discriminator_base_width: the base number of convolution kernels per layer in the discriminator
          classification_depth: the number of fully connected layers in the discriminator
          grid_size: the size of the grid when generating an image grid
          log: should tensorboard logs be created
          y_offset: how much should the "right" answers vary from 1s and 0s
          learning_momentum: the beta1 momentum for ADAM
          learning_momentum2: the beta2 momentum for ADAM
          learning_pivot: the point where the learning rate starts declining
          dicriminator_scaling_favor: how much should the discriminator be favored when selecting the network to train
        """
        self.name = name
        self.image_size = image_size
        self.colors = colors
        self.batch_size = batch_size
        self.grid_size = min(grid_size, int(math.sqrt(batch_size)))
        self.log = log
        self.directory = directory
        os.makedirs(directory, exist_ok=True)
        #Network variables
        self.input_size = input_size
        self._gen_conv = generator_convolutions
        self._gen_width = generator_base_width
        self._dis_conv = discriminator_convolutions
        self._dis_width = discriminator_base_width
        self._class_depth = classification_depth
        self._dropout = dropout
        #Training variables
        self.learning_rate = (learning_rate, learning_momentum, learning_momentum2, learning_pivot)
        self._y_offset = y_offset
        self.current_scale = 1.0
        self._dis_scale = dicriminator_scaling_favor
        #Setup Images
        if image_manager is None:
            self.image_manager = ImageVariations(image_size=image_size, colored=(colors == 3))
        else:
            self.image_manager = image_manager
            self.image_manager.image_size = image_size
            self.image_manager.colored = (colors == 3)
        #Setup Networks
        self.iterations = tf.Variable(0, name="training_iterations", trainable=False)
        with tf.variable_scope('input'):
            self.generator_input = tf.placeholder(tf.float32, [None, self.input_size], name='generator_input')
            self.image_input = tf.placeholder(tf.uint8, shape=[None, image_size, image_size, self.colors], name='image_input')
            self.image_input_scaled = tf.subtract(tf.to_float(self.image_input)/127.5, 1, name='image_scaling')
        self.generator_output = None
        self.image_output = self.image_grid_output = None
        self.generator_solver = self.discriminator_solver = self.scale = None
        if setup:
            self.setup_network()

    def setup_network(self):
        """Initialize the network if it is not done in the constructor"""
        self.generator_output = image_decoder([self.generator_input], 'generator', self.image_size, self._gen_conv, self._gen_width, self.input_size, self.batch_size, self.colors)[0]
        self.image_output, self.image_grid_output = image_output([self.generator_output], 'output', self.image_size, self.grid_size)
        gen_logit, image_logit = image_encoder([self.generator_output, self.image_input_scaled], 'discriminator', self.image_size, self._dis_conv, self._dis_width, self._class_depth, self._dropout, 1)
        gen_var = tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES, scope='generator')
        dis_var = tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES, scope='discriminator')
        self.generator_solver, self.discriminator_solver, self.scale = \
            gan_optimizer('train', gen_var, dis_var, gen_logit, image_logit, 0., 1-self._y_offset,
                          *self.learning_rate, self.iterations, self._dis_scale, summary=self.log)


    def random_input(self):
        """Creates a random input for the generator"""
        return np.random.uniform(0.0, 1.0, size=[self.batch_size, self.input_size])


    def generate(self, session, name, amount=1):
        """Generate a image and save it"""
        def get_arr():
            arr = np.asarray(session.run(
                self.image_output,
                feed_dict={self.generator_input: self.random_input()}
            ), np.uint8)
            arr.shape = self.batch_size, self.image_size, self.image_size, self.colors
            return arr
        if amount == 1:
            self.image_manager.save_image(get_arr()[0], name)
        else:
            images = []
            counter = amount
            while counter > 0:
                images.extend(get_arr())
                counter -= self.batch_size
            for i in range(amount):
                self.image_manager.save_image(images[i], "%s_%02d"%(name, i))

    def generate_grid(self, session, name):
        """Generate a image and save it"""
        grid = session.run(
            self.image_grid_output,
            feed_dict={self.generator_input: self.random_input()}
        )
        self.image_manager.image_size = self.image_grid_output.get_shape()[1]
        self.image_manager.save_image(grid, name)
        self.image_manager.image_size = self.image_size


    def get_session(self):
        saver = tf.train.Saver()
        session = tf.Session()
        session.run(tf.global_variables_initializer())
        try:
            saver.restore(session, os.path.join(self.directory, self.name))
            start_iteration = session.run(self.iterations)
            print("\nLoaded an existing network\n")
        except Exception as e:
            start_iteration = 0
            if self.log:
                print("\nCreated a new network (%s)\n"%repr(e))
        return session, saver, start_iteration


    def __get_feed_dict__(self):
        return {
            self.image_input: self.image_manager.get_batch(self.batch_size),
            self.generator_input: self.random_input()
        }

    def __training_iteration__(self, session, i):
        if i < 500:                     #Initialising iterations
            if i < 50:
                session.run([self.discriminator_solver], feed_dict=self.__get_feed_dict__())
            else:
                session.run([self.discriminator_solver, self.generator_solver], feed_dict=self.__get_feed_dict__())
        elif i%10 == 0:                 #Check the scaling
            _, _, self.current_scale = session.run([self.discriminator_solver, self.generator_solver, self.scale], feed_dict=self.__get_feed_dict__())
        elif self.current_scale > 1.3:  #Train only the worse performing network (do some additional faster iterations)
            session.run(self.generator_solver, feed_dict={self.generator_input: self.random_input()})
            session.run(self.generator_solver, feed_dict={self.generator_input: self.random_input()})
        elif self.current_scale > 0.7:  #Train both networks if within 30% margin
            session.run([self.discriminator_solver, self.generator_solver], feed_dict=self.__get_feed_dict__())
        else:                           #Train only the worse performing network
            session.run([self.discriminator_solver], feed_dict=self.__get_feed_dict__())


    def train(self, batches=100000, print_interval=10):
        """Train the network for a number of batches (continuing if there is an existing model)"""
        start_time = last_time = last_save = timer()
        session, saver, start_iteration = self.get_session()
        if self.log:
            logger = SummaryLogger(self, session, start_iteration)
        try:
            print("Training the GAN on images in the '%s' folder"%self.image_manager.in_directory)
            print("To stop the training early press Ctrl+C (progress will be saved)")
            print('To continue training just run the training again')
            if self.log:
                print("To view the progress run 'python -m tensorflow.tensorboard --logdir %s'"%LOG_DIR)
            print("To generate images using the trained network run 'python generate.py %s'"%self.name)
            print()
            time_per = 10
            for i in range(start_iteration+1, start_iteration+batches+1):
                self.__training_iteration__(session, i)
                session.run(self.iterations.assign(i))
                #Print progress
                if i%print_interval == 0:
                    curr_time = timer()
                    time_per = time_per*0.6 + (curr_time-last_time)/print_interval*0.4
                    time = curr_time - start_time
                    print("\rIteration: %04d    Time: %02d:%02d:%02d  (%02.1fs / iteration)" % \
                        (i, time//3600, time%3600//60, time%60, time_per), end='')
                    last_time = curr_time
                if self.log:
                    logger(i)
                #Save network
                if timer() - last_save > 1800:
                    saver.save(session, os.path.join(self.directory, self.name), self.iterations)
                    last_save = timer()
        except KeyboardInterrupt:
            pass
        finally:
            print()
            if self.log:
                logger.close()
            print("Saving the network")
            saver.save(session, os.path.join(self.directory, self.name))
            session.close()


class SummaryLogger():
    """Log the progress of training to tensorboard (and some progress output to the console)"""
    def __init__(self, network, session, iteration, summary_interval=20, image_interval=500):
        self.session = session
        self.gan = network
        self.image_interval = image_interval
        self.summary_interval = summary_interval
        os.makedirs(LOG_DIR, exist_ok=True)
        if iteration == 0:
            self.writer = tf.summary.FileWriter(os.path.join(LOG_DIR, network.name), session.graph)
        else:
            self.writer = tf.summary.FileWriter(os.path.join(LOG_DIR, network.name))
        self.summary = tf.summary.merge_all()
        self.batch_input = network.random_input()

    def __call__(self, iteration):
        #Save image
        if iteration%self.image_interval == 0:
            #Hack to make tensorboard show multiple images, not just the latest one
            feed_dict = self.gan.__get_feed_dict__()
            feed_dict[self.gan.generator_input] = self.batch_input
            image, summary = self.session.run(
                [tf.summary.image(
                    'training/iteration/%d'%iteration,
                    tf.stack([self.gan.image_grid_output]),
                    max_outputs=1,
                    collections=['generated_images']
                ), self.summary],
                feed_dict=feed_dict
            )
            self.writer.add_summary(image, iteration)
            self.writer.add_summary(summary, iteration)
        elif iteration%self.summary_interval == 0:
            feed_dict = self.gan.__get_feed_dict__()
            #Save summary
            summary = self.session.run(self.summary, feed_dict=feed_dict)
            self.writer.add_summary(summary, iteration)

    def close(self):
        self.writer.close()