import pandas as pd
import tensorflow as tf
import numpy as np
import datetime
import os
import matplotlib.pyplot as plt
from data_preprocessing import preprocess
from sklearn.utils import shuffle


# Parameters
input_dim = 28
hidden_size1 = 100
hidden_size2 = 100
z_dim = 20

batch_size = 100
n_epochs = 1000
learning_rate = 0.001
beta1 = 0.9
results_path = './autoencoders/Results/Standard_AE'
saved_model_path = results_path + '/Saved_models/'

# Placeholders for input data and the targets
x_input = tf.placeholder(dtype=tf.float32, shape=[batch_size, input_dim], name='Input')
x_target = tf.placeholder(dtype=tf.float32, shape=[batch_size, input_dim], name='Target')
decoder_input = tf.placeholder(dtype=tf.float32, shape=[1, z_dim], name='Decoder_input')


def dense(x, n1, n2, name):
    """
    Used to create a dense layer.
    :param x: input tensor to the dense layer
    :param n1: no. of input neurons
    :param n2: no. of output neurons
    :param name: name of the entire dense layer, i.e. the variable scope name.
    :return: tensor with shape [batch_size, n2]
    """
    with tf.variable_scope(name, reuse=None):
        weights = tf.get_variable("weights", shape=[n1, n2],
                                  initializer=tf.random_normal_initializer(mean=0., stddev=0.01))
        bias = tf.get_variable("bias", shape=[n2], initializer=tf.constant_initializer(0.0))
        out = tf.add(tf.matmul(x, weights), bias, name='matmul')
        return out
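
# For example, dense(x_input, input_dim, hidden_size1, 'e_dense_1') maps a
# [batch_size, input_dim] tensor to a [batch_size, hidden_size1] tensor. Because the weights
# live in a variable scope named after the layer, a later call with the same name under a
# reusing scope shares the same weights and bias instead of creating new ones.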


# The Encoder of the network
def encoder(x, reuse=False):
    """
    Encoder part of the autoencoder.
    :param x: input to the autoencoder
    :param reuse: True -> Reuse the encoder variables, False -> Create the encoder variables.
    :return: tensor which is the hidden latent variable of the autoencoder.
    """
    if reuse:
        tf.get_variable_scope().reuse_variables()
    with tf.name_scope('Encoder'):
        e_dense_1 = tf.nn.relu(dense(x, input_dim, hidden_size1, 'e_dense_1'))
        e_dense_2 = tf.nn.relu(dense(e_dense_1, hidden_size1, hidden_size2, 'e_dense_2'))
        latent_variable = dense(e_dense_2, hidden_size2, z_dim, 'e_latent_variable')
        return latent_variable
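
# The latent layer above is left linear (no activation), so the code z can take any real
# value; a common choice for the bottleneck of a plain autoencoder.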


# The Decoder of the network
def decoder(x, reuse=False):
    """
    Decoder part of the autoencoder.
    :param x: input to the decoder
    :param reuse: True -> Reuse the decoder variables, False -> Create the decoder variables.
    :return: tensor which should ideally reconstruct the input that was given to the encoder.
    """
    if reuse:
        tf.get_variable_scope().reuse_variables()
    with tf.name_scope('Decoder'):
        d_dense_1 = tf.nn.relu(dense(x, z_dim, hidden_size2, 'd_dense_1'))
        d_dense_2 = tf.nn.relu(dense(d_dense_1, hidden_size2, hidden_size1, 'd_dense_2'))
        output = tf.nn.sigmoid(dense(d_dense_2, hidden_size1, input_dim, 'd_output'))
        return output
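
# The sigmoid on the output layer constrains reconstructions to (0, 1), which assumes that
# preprocessing scales every input feature into the [0, 1] range.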


def train(train_model=True, train_data=None, test_data=None):
    """
    Used to train the autoencoder by passing in the necessary inputs.
    :param train_model: True -> Train the model, False -> Load the latest trained model and show the reconstructed variables.
    :param train_data: training samples (DataFrame or array) with input_dim columns.
    :param test_data: held-out samples with the same shape as train_data.
    """
    with tf.variable_scope(tf.get_variable_scope()):
        encoder_output = encoder(x_input)
        decoder_output = decoder(encoder_output)

    with tf.variable_scope(tf.get_variable_scope()):
        # Reuse the decoder weights to reconstruct from a single latent vector
        reconstructed_variables = decoder(decoder_input, reuse=True)

    # Loss: mean squared reconstruction error
    loss = tf.reduce_mean(tf.square(x_target - decoder_output))

    # Optimizer
    optimizer = tf.train.AdamOptimizer(learning_rate=learning_rate, beta1=beta1).minimize(loss)
    init = tf.global_variables_initializer()

    # Saving the model
    saver = tf.train.Saver()
    step = 0
    with tf.Session() as sess:
        sess.run(init)
        if train_model:
            # Make sure the checkpoint directory exists before the first save
            if not os.path.exists(saved_model_path):
                os.makedirs(saved_model_path)

            for i in range(n_epochs):
                train_data = shuffle(train_data)
                # Break the train data df into chunks of size batch_size
                train_df = [train_data[x:x + batch_size] for x in range(0, train_data.shape[0], batch_size)]
                count = 0
                for batch in train_df:
                    if batch.shape[0] == batch_size:
                        count += 1
                        sess.run(optimizer, feed_dict={x_input: batch, x_target: batch})

                        if count % 50 == 0:
                            batch_loss = sess.run(loss, feed_dict={x_input: batch, x_target: batch})
                            print("Loss: {}".format(batch_loss))
                            print("Epoch: {}, iteration: {}".format(i, count))
                        step += 1
                saver.save(sess, save_path=saved_model_path, global_step=step)
            print("Model Trained!")

            print("Saved Model Path: {}".format(saved_model_path))
        else:
            # Restore the latest checkpoint written to saved_model_path during training
            saver.restore(sess, save_path=tf.train.latest_checkpoint(saved_model_path))
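

# A minimal usage sketch, assuming preprocess() (imported above from data_preprocessing)
# returns a (train, test) pair of DataFrames with input_dim columns scaled to [0, 1];
# adjust this to the actual return signature of preprocess().
if __name__ == '__main__':
    train_df, test_df = preprocess()  # assumed return signature
    train(train_model=True, train_data=train_df, test_data=test_df)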