# -*- coding: utf-8 -*-
"""
Created on Tue Jun 9 20:20:44 2020
@author: Danish
"""
import tensorflow as tf
from tensorflow.keras.layers import LSTM, Dense, Input, Dropout, BatchNormalization
from tensorflow.keras.layers import LeakyReLU
from tensorflow.keras.models import Model
from tensorflow.keras.utils import plot_model
from tensorflow.python.keras import backend as K
from DataGenerator import BatchGenerator
from utilities import PrintInline, Timer
import os
class GAN:
"""
Parameters
----------
n_features : TYPE
DESCRIPTION.
optimizer : TYPE
DESCRIPTION.
ckpt_path : TYPE
DESCRIPTION.
tb_path : TYPE, optional
DESCRIPTION. The default is None.
dropout : TYPE, optional
DESCRIPTION. The default is 0.2.
alpha : TYPE, optional
DESCRIPTION. The default is 0.2.
gen_loss : TYPE, optional
DESCRIPTION. The default is None.
**kwargs :
label_smoothing:
Label smoothing for discriminator min_max_loss. The amount of smoothing for positive labels.
This technique is taken from `Improved Techniques for Training GANs`
(https://arxiv.org/abs/1606.03498). `0.0` means no smoothing.
loss_collection:
Collection to which this loss will be added. Loss collection for generator and discriminator.
tf.compat.v1.GraphKeys.LOSSES
reduction:
A `tf.losses.Reduction` to apply to loss. e.g: Reduction.SUM_BY_NONZERO_WEIGHTS
Returns
-------
None.
"""
def __init__(self, n_features, optimizer, ckpt_path, tb_path=None, dropout=0.2, alpha=0.2, gen_loss=None, **kwargs):
self.n_features = n_features
self.optimizer = optimizer
self.ckpt_path = ckpt_path
self.tb_path = tb_path
self.dropout = dropout
        self.alpha = alpha
self.gen_loss = gen_loss
self.input_shape = None
self.history_epoch = {'Disc_Loss':[], 'Disc_Acc':[], 'Gen_Loss':[], 'Gen_Acc':[], 'Batch_Data':[]}
self.history_batch = {'Disc_Loss':[], 'Disc_Acc':[], 'Gen_Loss':[], 'Gen_Acc':[], 'Batch_Data':[]}
self.time_remain = 0
self.time_taken = 0
#Callback variables
self.disc_metric=None
self.gen_metric=None
self.writer = None
#Keyword variables
self.gen_summary = kwargs.get('gen_summary', False)
self.disc_summary = kwargs.get('disc_summary', False)
self.compile_gen = kwargs.get('compile_gen', False)
self.label_smoothing = kwargs.get('label_smoothing', 0.25)
self.loss_collection = kwargs.get('loss_collection', tf.compat.v1.GraphKeys.LOSSES)
self.reduction = kwargs.get('reduction', tf.compat.v1.losses.Reduction.SUM_BY_NONZERO_WEIGHTS)
def minimax_discriminator_loss(self, Y_true, Y_pred, real_weights=1.0, gen_weights=1.0, summaries=False):
"""
Original minimax discriminator loss for GANs, with label smoothing. Note that this loos is not
recommended to use. A more practically seful loss is `modified_discriminator_loss`.
L = - real_weights * log(sigmoid(D(x))) - generated_weights * log(1 - sigmoid(D(G(z))))
See `Generative Adversarial Nets <https://arxiv.org/abs/1406.2661>`_ for more details.
Parameters
----------
Y_true : list
A list containing 2 elements. First element Discriminator output on real data, second element
Discriminator output on generated data. e.g [Y_hat_real, Y_hat_fake]
Y_hat_fake : list
A list containing 2 elements. First element Targets for real data, second element targets for
generated/fake data. e.g [Y_real, Y_fake]
real_weights : TYPE, optional
Optional `Tensor` whose rank is either 0, or the same rank as `real_data`, and must be
broadcastable to `real_data` (i.e., all dimensions must be either `1`, or the same as
the corresponding dimension). The default is 1.0.
gen_weights : TYPE, optional
Same as `real_weights`, but for `generated_data`. The default is 1.0.
summaries : bool, optional
Whether or not to add summaries for the loss.. The default is False.
Returns
-------
loss : tensor
A loss Tensor. The shape depends on `reduction`..
"""
Y_hat_real = Y_pred[0]
Y_hat_fake = Y_pred[1]
Y_real = Y_true[0]
Y_fake = Y_true[1]
        label_smoothing = self.label_smoothing
loss_collection = self.loss_collection
reduction = self.reduction
with tf.name_scope('Discriminator_MinMax_Loss') as scope:
            # -log(sigmoid(D(x))) with positive labels smoothed by label_smoothing
loss_on_real = tf.compat.v1.losses.sigmoid_cross_entropy(Y_real, Y_hat_real, real_weights, label_smoothing,
scope, loss_collection=None, reduction=reduction)
            # -log(1 - sigmoid(D(G(z))))
loss_on_generated = tf.compat.v1.losses.sigmoid_cross_entropy(Y_fake, Y_hat_fake, gen_weights, scope=scope,
loss_collection=None, reduction=reduction)
D_loss = loss_on_real + loss_on_generated
tf.compat.v1.losses.add_loss(D_loss, loss_collection)
if summaries:
tf.compat.v1.summary.scalar('discriminator_gen_minimax_loss', loss_on_generated)
tf.compat.v1.summary.scalar('discriminator_real_minimax_loss', loss_on_real)
tf.compat.v1.summary.scalar('discriminator_minimax_loss', D_loss)
return D_loss
def discriminator_loss(self, y_true, y_pred):
"""
Creates a Keras type custom loss function for Discriminator MinMax Loss, to work with model.compile.
Parameters
----------
y_true : tensor
Targets or labels, half of length conatining ones and half of length containing zeros.
y_pred : tensor
Predictions by Discriminator.
Returns
-------
A tensor having the same dimension as the ouptut of model.
"""
with tf.compat.v1.variable_scope('Discriminator_Loss'):
"""
tf.split() split the given tensors into two equal parts, pythonic slicing can't be used
here because the shape of the loss at compile time is dynamic e.g (?, probablity), so the
first axis is not determined and by using pythonic slicing it will generate.
ValueError: slice index 4 of dimension 1 out of bounds. for 'loss_2/dense_34_loss/
Discriminator_Loss/strided_slice_1' (op: 'StridedSlice') with input shapes: [?,1]
Under the hood the thing that is happening can be visualized as:
#Discriminator output on real data
Y_hat_real = y_pred[0:2]
#Discriminator output on fake data
Y_hat_fake = y_pred[2, 4]
"""
            #tf.split splits the tensor and returns a list of two elements:
            #[Targets for real data, Targets for fake data]
Y_true = tf.split(y_true, num_or_size_splits=2, axis=0)
            #tf.split splits the tensor and returns a list of two elements:
            #[Discriminator output on real data, Discriminator output on fake data]
Y_pred = tf.split(y_pred, num_or_size_splits=2, axis=0)
D_loss = self.minimax_discriminator_loss(Y_true, Y_pred, real_weights=1.0, gen_weights=1.0,
summaries=True)
return D_loss
def minmax_generator_loss(self, x_t1, x_t1_hat, Y_hat_gan, lambda1=1.0, lambda2=1.0, summaries=False):
"""
The generator loss G_loss which along with D_loss used to optimize the value function.
Particularly, we combine the Mean Square Error (MSE) with the generator loss of a classical
GAN to constitute the G_loss of our architecture.
G_loss = λ1*g_mse + λ2*g_loss.
The loss function G_loss is composed by g_mse and g_loss with λ1 and λ2, respectively. λ1
and λ2 are hyper-parameters. For more see:
`Stock Market Prediction Based on Generative Adversarial Network <https://doi.org/10.1016/j.procs.2019.01.256>`_
Parameters
----------
x_t1 : TYPE
Real Data at time step t+1.
x_t1_hat : TYPE
Fake data generated by generator at time t+1.
Y_hat_gan : TYPE
Ouput of discrminator which is extracted using gan(combined model), not the discriminator only.
lambda1 : TYPE, optional
Values for hyper paramets lambda 1. For more check equation 10 in the paper. The default is 1.0.
lambda2 : TYPE, optional
Same as lambda1. The default is 1.0.
Returns
-------
None.
"""
loss_collection = self.loss_collection
reduction = self.reduction
with tf.name_scope('Generator_MinMax_Loss') as scope:
            #MSE is usually (labels - predictions)^2, but eq. 8 of the paper writes it as
            #(predictions - labels); that is why the argument order is swapped below
            #(the squared error is symmetric, so the value is unchanged)
g_mse = tf.compat.v1.losses.mean_squared_error(labels=x_t1_hat, predictions=x_t1, scope=scope,
loss_collection=None, reduction=reduction)
g_loss = tf.compat.v1.losses.sigmoid_cross_entropy(tf.ones_like(Y_hat_gan), Y_hat_gan, scope=scope,
loss_collection=None, reduction=reduction)
#GAN loss
G_loss = (lambda1*g_mse) + (lambda2*g_loss)
tf.compat.v1.losses.add_loss(G_loss, loss_collection)
if summaries:
tf.compat.v1.summary.scalar('g_mse_loss', g_mse)
tf.compat.v1.summary.scalar('gan_g_loss', g_loss)
tf.compat.v1.summary.scalar('gan_G_loss', G_loss)
return G_loss
def get_generator(self, name):
"""
Raises
------
TypeError
DESCRIPTION.
Returns
-------
generator : TYPE
DESCRIPTION.
"""
with tf.name_scope('Generator'):
gen_input = Input(self.input_shape)
#LSTM layer
lstm = LSTM(units=50, activation='relu', return_sequences=False, input_shape=self.input_shape)(gen_input)
lstm = Dropout(self.dropout)(lstm)
#Fully connected layer
fc = Dense(units=self.n_features)(lstm)
            fc = LeakyReLU(alpha=self.alpha)(fc)
generator = Model(inputs=gen_input, outputs=fc, name=name)
if self.gen_summary:
print('\n')
generator.summary()
print('\n\n')
if self.compile_gen:
if self.gen_loss is None:
                raise TypeError('gen_loss cannot be None when kwargs["compile_gen"] is True. Provide a valid Keras loss function string.')
generator.compile(loss=self.gen_loss, optimizer=self.optimizer)
return generator
def get_discriminator(self, disc_loss, name):
"""
Creates the discriminator Model as mentioned in `Stock Market Prediction Based on Generative Adversarial Network <https://doi.org/10.1016/j.procs.2019.01.256>`_
Returns
-------
discriminator : object to the Model class.
Keras engine training Model object.
"""
with tf.name_scope('Discriminator'):
#input layer
            disc_input = Input((self.n_features,))
#1st hidden layer
h1 = Dense(units=72)(disc_input)
            h1 = LeakyReLU(alpha=self.alpha)(h1)
#2nd hidden layer
h2 = Dense(units=100)(h1)
            h2 = LeakyReLU(alpha=self.alpha)(h2)
#3rd hidden layer
h3 = Dense(units=10)(h2)
            h3 = LeakyReLU(alpha=self.alpha)(h3)
#output layer
fc = Dense(units=1, activation='sigmoid')(h3)
discriminator = Model(disc_input, fc, name=name)
if self.disc_summary:
discriminator.summary()
print('\n\n')
discriminator.compile(loss=disc_loss, optimizer=self.optimizer, metrics=['accuracy'])
return discriminator
def get_gan_model(self, name):
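        """
        Builds the generator, the discriminator and the combined GAN model in which the
        discriminator is frozen, so that only the generator is updated when the combined
        model is trained.

        Returns
        -------
        (generator, discriminator, gan) : tuple of Model objects.
        """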
generator = self.get_generator(name='Generator')
discriminator = self.get_discriminator(self.discriminator_loss, name='Discriminator')
#Make the discriminator untrainable when we are training the generator.
        #This doesn't affect the discriminator when it is trained on its own
discriminator.trainable = False
#Combine the two models to create the GAN
gan_input = Input(shape=self.input_shape)
fake_data = generator(gan_input)
gan_output = discriminator(fake_data)
gan = Model(gan_input, gan_output, name=name)
#No model compilation because training is done using GradientTape
#gan.compile(loss=gan_loss, optimizer=self.optimizer)
return generator, discriminator, gan
def train_generator(self, generator, gan, X_reshaped, x_t1, X_fake):
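        """
        Runs one generator update: computes G_loss under a GradientTape, records the batch
        loss/accuracy in `history_batch`, and applies the gradients to the trainable
        variables of the combined model (i.e. the generator, since the discriminator is
        frozen inside `gan`).
        """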
with tf.GradientTape() as tape:
#prediction of generator x_t1_hat given x_t
x_t1_hat = generator(X_reshaped)
#For info regarding model.predict(X) and model(X) see: https://stackoverflow.com/questions/60159714/when-to-use-model-predictx-vs-modelx-in-tensorflow
            #Prediction of the GAN as a whole model, where the discriminator is non-trainable.
Y_hat_gan = gan(X_fake)
#Computing G_loss
G_loss = self.minmax_generator_loss(x_t1, x_t1_hat, Y_hat_gan, lambda1=1.0, lambda2=1.0, summaries=True)
            self.history_batch['Gen_Loss'].append(float(G_loss))  #store as a Python float for logging/averaging
#computing the accuracy
acc = tf.keras.metrics.BinaryAccuracy(name='binary_accuracy', threshold=0.5)
_ = acc.update_state(tf.ones_like(Y_hat_gan), Y_hat_gan)
G_acc = acc.result().numpy()
self.history_batch['Gen_Acc'].append(G_acc)
#Reset the states of metrics
acc.reset_states()
        #calculate gradients
gan_gradients = tape.gradient(G_loss, gan.trainable_variables)
#Apply gradients
self.optimizer.apply_gradients(zip(gan_gradients, gan.trainable_variables))
def info_out(self, which, epoch=None, epochs=None, batch=None, steps_per_epoch=None, total_time=None):
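        """
        Prints the running loss/accuracy line for the current batch (`which='batch'`) or
        the summary line for the completed epoch (`which='epoch'`).
        """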
if which.lower()=='batch':
str1 = 'Epoch {0}/{1}, Batch {2}/{3}, - '.format(epoch, epochs, batch, steps_per_epoch-1)
str2 = 'Time Taken By 1 Batch: {0:.2} sec. - Est Time Remaining: {1}, - '.format(self.time_taken, self.time_remain)
str3 = 'Discriminator Loss: {0:.5}, - Discriminator Accuracy: {1:.3} - '.format(self.history_batch['Disc_Loss'][batch-1],
self.history_batch['Disc_Acc'][batch-1])
str4 = 'Generator Loss: {0:.5}, - Generator Accuracy: {1:.3}.'.format(self.history_batch['Gen_Loss'][batch-1],
self.history_batch['Gen_Acc'][batch-1])
PrintInline(str1+str2+str3+str4)
elif which.lower()=='epoch':
str1 = 'Discriminator Loss: {0:.5}, - Discriminator Accuracy: {1:.3} - '.format(self.history_epoch['Disc_Loss'][epoch-1],
self.history_epoch['Disc_Acc'][epoch-1])
str2 = 'Generator Loss: {0:.5}, - Generator Accuracy: {1:.3}.'.format(self.history_epoch['Gen_Loss'][epoch-1],
self.history_epoch['Gen_Acc'][epoch-1])
print('\nEpoch Completed, Total Time Taken: ' + total_time + ', - ' + str1 + str2)
print('\t\t\t________________________________________________________\n')
else:
raise ValueError('Invalid value given to `which`, it can be either `batch` or `epoch`!')
def ckpt_callback(self, epoch, models, metric_disc='loss', metric_gen='loss', save_best_only=True):
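        """
        Saves the models to `ckpt_path` at the end of an epoch. When `save_best_only` is
        True, the discriminator and the generator are only saved when their chosen metric
        (`'loss'` or `'accuracy'`) improves on the best value seen so far.
        """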
path = self.ckpt_path
        if not isinstance(models, list):
            raise TypeError('Invalid value given to `models`; it should be a list containing three models in this order: [generator, discriminator, gan_model]')
os.makedirs(path, exist_ok=True)
def save_disc(models, path):
models[1].save(path+'/Discriminator.h5')
def save_gen(models, path):
models[0].save(path+'/Generator.h5')
models[2].save(path+'/GAN_Model.h5')
        if save_best_only:
            #initializing the best-so-far metric values on the first epoch
            #(a high sentinel for loss, a low one for accuracy)
            if epoch==1:
                self.disc_metric = 1000.0 if metric_disc=='loss' else 0.0
                self.gen_metric = 1000.0 if metric_gen=='loss' else 0.0
            disc_value = self.history_epoch['Disc_Loss' if metric_disc=='loss' else 'Disc_Acc'][epoch-1]
            gen_value = self.history_epoch['Gen_Loss' if metric_gen=='loss' else 'Gen_Acc'][epoch-1]
            #Checking for improvements: lower is better for loss, higher for accuracy.
            #The best value is updated on every save, so models are only written when
            #the metric actually improves.
            if (metric_disc=='loss' and disc_value < self.disc_metric) or \
               (metric_disc=='accuracy' and disc_value > self.disc_metric):
                self.disc_metric = disc_value
                save_disc(models, path)
            if (metric_gen=='loss' and gen_value < self.gen_metric) or \
               (metric_gen=='accuracy' and gen_value > self.gen_metric):
                self.gen_metric = gen_value
                save_gen(models, path)
        else:
            save_disc(models, path)
            save_gen(models, path)
def tensorboard_callback(self, graph=None, models=None):
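        """
        Writes model architecture plots (via `plot_model`) and, optionally, the given
        session graph to `tb_path`.
        """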
os.makedirs(self.tb_path, exist_ok=True)
        if models is not None:
            if not isinstance(models, list):
                raise TypeError('Invalid value given to `models`; it should be a list containing three models in this order: [generator, discriminator, gan_model]')
else:
for i in range(len(models)):
plot_model(models[i], to_file=self.tb_path+'/'+models[i].name+'.png', show_shapes=True, show_layer_names=True)
        if graph is not None:
            #FileWriter lives in the compat.v1 API when TF2 is imported as `tf`
            self.writer = tf.compat.v1.summary.FileWriter(logdir=self.tb_path, graph=graph)
def train_GAN(self, X_train, epochs, batch_size, batch_shape, name, gan_summary=False, tensorboard=True):
"""
Parameters
----------
X_train : TYPE
DESCRIPTION.
epochs : TYPE
DESCRIPTION.
batch_size : TYPE
DESCRIPTION.
batch_shape : TYPE
DESCRIPTION.
name : TYPE
DESCRIPTION.
gan_summary : TYPE, optional
DESCRIPTION. The default is False.
Returns
-------
TYPE
DESCRIPTION.
"""
self.input_shape = (batch_shape[1], batch_shape[2])
generator, discriminator, gan_model = self.get_gan_model(name)
if tensorboard:
            # Get the session's graph (TF1-style; unused in eager execution)
            #graph = K.get_session().graph
self.tensorboard_callback(models=[generator, discriminator, gan_model])
if gan_summary:
gan_model.summary()
            print('Note: In the GAN (combined model) the Discriminator parameters are set to non-trainable, because we do not train the Discriminator while training the Generator!')
steps_per_epoch = len(X_train)//batch_size
chk = input('\n\nStart training y/N: ')
if chk.lower()=='y':
for epoch in range(1, epochs+1):
                #setting up timer class
                time = Timer()
                #fresh batch history for every epoch, so that the epoch averages and the
                #`Batch_Data` entry below cover the current epoch only
                self.history_batch = {'Disc_Loss':[], 'Disc_Acc':[], 'Gen_Loss':[], 'Gen_Acc':[], 'Batch_Data':[]}
                bg = BatchGenerator(X_train, batch_size=batch_size)
for batch in range(1, steps_per_epoch):
#start the timer
time.start()
                    # X_reshaped is the data used to get the output from the generator model.
                    # X is the data in its original dimensions, e.g. [batches, features], while
                    # X_reshaped is the same data reshaped for the LSTM layer, which expects 3D
                    # input, so X_reshaped has dimensions [batches, timesteps, features];
                    # x_t1 is the data at time t+1, i.e. the next batch
X, X_reshaped, x_t1 = bg.get_nextBatch(batch_shape)
                    #Getting the data for discriminator training.
X_disc, Y_disc, X_fake = bg.get_disc_gan_data(generator, X, X_reshaped, x_t1)
""" train discriminator """
metrics = discriminator.train_on_batch(X_disc, Y_disc)
self.history_batch['Disc_Loss'].append(metrics[0])
self.history_batch['Disc_Acc'].append(metrics[1])
#train generator
self.train_generator(generator, gan_model, X_reshaped, x_t1, X_fake)
#Getting total time taken by a batch
self.time_remain, self.time_taken = time.get_time_hhmmss(steps_per_epoch-batch)
self.info_out('batch', epoch, epochs, batch, steps_per_epoch)
                #computing mean loss & accuracy over one epoch
                n_batches = len(self.history_batch['Disc_Loss'])
                self.history_epoch['Disc_Loss'].append(sum(self.history_batch['Disc_Loss'])/n_batches)
                self.history_epoch['Disc_Acc'].append(sum(self.history_batch['Disc_Acc'])/n_batches)
                self.history_epoch['Gen_Loss'].append(sum(self.history_batch['Gen_Loss'])/n_batches)
                self.history_epoch['Gen_Acc'].append(sum(self.history_batch['Gen_Acc'])/n_batches)
self.history_epoch['Batch_Data'].append(self.history_batch)
self.info_out(which='epoch', epoch=epoch, total_time=time.get_total_time())
self.ckpt_callback(epoch, [generator, discriminator, gan_model])
elif chk.lower()=='n':
            raise SystemExit
return self.history_epoch
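

#----------------------------------------------------------------------------
# Minimal usage sketch (not part of the original training pipeline). It shows
# how the pieces above are wired together; the toy data, shapes and
# hyper-parameters below are illustrative assumptions, not values from the
# paper. Real training feeds preprocessed stock features through the same API.
#----------------------------------------------------------------------------
if __name__ == '__main__':
    import numpy as np
    n_features = 5
    batch_size = 32
    #assumed toy data: 1000 samples with `n_features` features each
    X_train = np.random.rand(1000, n_features).astype('float32')
    #[batch, timesteps, features] shape consumed by the LSTM generator
    batch_shape = (batch_size, 1, n_features)
    gan = GAN(n_features=n_features,
              optimizer=tf.keras.optimizers.Adam(1e-4),
              ckpt_path='./checkpoints',
              tb_path='./tb_logs',
              dropout=0.2, alpha=0.2,
              gen_summary=True, disc_summary=True)
    #tensorboard=False avoids the pydot/graphviz dependency of plot_model
    history = gan.train_GAN(X_train, epochs=2, batch_size=batch_size,
                            batch_shape=batch_shape, name='Stock_GAN',
                            gan_summary=True, tensorboard=False)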