Browse files

bit-symbol mapping attempts

Tharmetharan Balendran 4 years ago
parent
commit
7e2c83ee4c
3 changed files with 202 additions and 83 deletions
  1. + 30 - 3
      models/custom_layers.py
  2. + 105 - 78
      models/end_to_end.py
  3. + 67 - 2
      tests/misc_test.py

+ 30 - 3
models/custom_layers.py

@@ -2,6 +2,35 @@ from tensorflow.keras import layers
 import tensorflow as tf
 import math
 import numpy as np
+import itertools
+
+
+class BitsToSymbols(layers.Layer):
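+    """Maps length-n bit vectors to one-hot symbol vectors of size 2**n.
+
+    For example, with cardinality 8 the bits [0, 1, 1] are read as the
+    base-2 integer 0*4 + 1*2 + 1*1 = 3 and one-hot encoded to length 8.
+    """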
+    def __init__(self, cardinality):
+        super(BitsToSymbols, self).__init__()
+
+        self.cardinality = cardinality
+
+        n = int(math.log(self.cardinality, 2))
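+        # Column vector of descending powers of two: [2**(n-1), ..., 2, 1]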
+        self.pows = tf.convert_to_tensor(np.power(2, np.linspace(n-1, 0, n)).reshape(-1, 1), dtype=tf.float32)
+
+    def call(self, inputs, **kwargs):
+        idx = tf.cast(tf.tensordot(inputs, self.pows, axes=1), dtype=tf.int32)
+        # Squeeze the trailing singleton axis so the output is (..., cardinality)
+        return tf.one_hot(tf.squeeze(idx, axis=-1), self.cardinality)
+
+
+class SymbolsToBits(layers.Layer):
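+    """Maps symbol scores to (soft) bit values; not yet wired into the model.
+
+    all_syms stacks every length-n bit pattern, so weighting the 2**n symbols
+    by their probabilities yields the expected value of each bit.
+    """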
+    def __init__(self, cardinality):
+        super(SymbolsToBits, self).__init__()
+
+        n = int(math.log(cardinality, 2))
+        lst = [list(i) for i in itertools.product([0, 1], repeat=n)]
+
+        # self.all_syms = tf.convert_to_tensor(np.asarray(lst), dtype=tf.float32)
+        self.all_syms = tf.transpose(tf.convert_to_tensor(np.asarray(lst), dtype=tf.float32))
+
+    def call(self, inputs, **kwargs):
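+        # Note: as written this expects symbol scores as columns, shape (M, k),
+        # and returns expected bit values of shape (n, k).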
+        return tf.matmul(self.all_syms, inputs)


 class ExtractCentralMessage(layers.Layer):
@@ -24,9 +53,7 @@ class ExtractCentralMessage(layers.Layer):
         self.w = tf.convert_to_tensor(temp_w, dtype=tf.float32)

     def call(self, inputs, **kwargs):
-        out = tf.matmul(inputs, self.w)
-        return tf.reshape(out, shape=(1, 1, self.samples_per_symbol))
-        # TODO: this won't work with dense layers need to move to separate layer
+        return tf.matmul(inputs, self.w)


 class AwgnChannel(layers.Layer):
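
A quick round-trip check of the new mapping layer (a minimal sketch, not part of this commit, assuming cardinality 8, i.e. 3 bits per symbol):

    import numpy as np
    import tensorflow as tf
    from models.custom_layers import BitsToSymbols

    bits = tf.constant([[[0., 1., 1.], [1., 0., 0.]]])   # shape (1, 2, 3)
    one_hot = BitsToSymbols(8)(bits)                     # shape (1, 2, 8)
    print(np.argmax(one_hot.numpy(), axis=-1))           # [[3 4]]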

+ 105 - 78
models/end_to_end.py

@@ -5,8 +5,9 @@ import numpy as np
 import matplotlib.pyplot as plt
 from sklearn.preprocessing import OneHotEncoder
 from tensorflow.keras import layers, losses
-from models.custom_layers import ExtractCentralMessage, OpticalChannel, DigitizationLayer
-
+from tensorflow.keras import backend as K
+from models.custom_layers import ExtractCentralMessage, OpticalChannel, DigitizationLayer, BitsToSymbols
+import itertools
 
 
 class EndToEndAutoencoder(tf.keras.Model):
     def __init__(self,
@@ -14,7 +15,7 @@ class EndToEndAutoencoder(tf.keras.Model):
                  samples_per_symbol,
                  messages_per_block,
                  channel,
-                 recurrent=False):
+                 bit_mapping=False):
         """
         """
         The autoencoder that aims to find a encoding of the input messages. It should be noted that a "block" consists
         The autoencoder that aims to find a encoding of the input messages. It should be noted that a "block" consists
         of multiple "messages" to introduce memory into the simulation as this is essential for modelling inter-symbol
         of multiple "messages" to introduce memory into the simulation as this is essential for modelling inter-symbol
@@ -29,12 +30,16 @@ class EndToEndAutoencoder(tf.keras.Model):

         # Labelled M in paper
         self.cardinality = cardinality
+        self.bits_per_symbol = int(math.log(self.cardinality, 2))
+
         # Labelled n in paper
         self.samples_per_symbol = samples_per_symbol
+
         # Labelled N in paper
         if messages_per_block % 2 == 0:
             messages_per_block += 1
         self.messages_per_block = messages_per_block
+
         # Channel Model Layer
         if isinstance(channel, layers.Layer):
             self.channel = tf.keras.Sequential([
@@ -44,39 +49,63 @@ class EndToEndAutoencoder(tf.keras.Model):
             ], name="channel_model")
         else:
             raise TypeError("Channel must be a subclass of keras.layers.Layer!")
-        self.recurrent = recurrent
-
-        if recurrent:
-            input_layer = layers.Input(shape=(self.messages_per_block, self.cardinality), batch_size=1)
-            # encoding_layers = [
-            #     layers.LSTM(2 * self.cardinality, activation='relu', return_sequences=True, stateful=True),
-            #     layers.LSTM(2 * self.cardinality, activation='relu', return_sequences=True, stateful=True)
-            # ]
+
+        # Boolean identifying if bit mapping is to be learnt
+        self.bit_mapping = bit_mapping
+
+        # Layer configuration for the case when bit mapping is to be learnt
+        if self.bit_mapping:
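+            # Encoder input is a block of bit vectors, shape (N, bits_per_symbol);
+            # BitsToSymbols lifts each to a one-hot symbol before the dense stack.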
+            encoding_layers = [
+                layers.Input(shape=(self.messages_per_block, self.bits_per_symbol)),
+                BitsToSymbols(self.cardinality),
+                layers.TimeDistributed(layers.Dense(2 * self.cardinality)),
+                layers.TimeDistributed(layers.LeakyReLU(alpha=0.01)),
+                # layers.TimeDistributed(layers.Dense(2 * self.cardinality)),
+                # layers.TimeDistributed(layers.LeakyReLU(alpha=0.01)),
+                # layers.TimeDistributed(layers.Dense(self.samples_per_symbol, activation='sigmoid')),
+                layers.TimeDistributed(layers.Dense(self.samples_per_symbol)),
+                layers.TimeDistributed(layers.ReLU(max_value=1.0))
+            ]
             decoding_layers = [
-                layers.LSTM(2 * self.cardinality, activation='relu', return_sequences=True, stateful=True),
-                layers.LSTM(2 * self.cardinality, activation='relu', return_sequences=True, stateful=True)
+                layers.Dense(2 * self.cardinality),
+                layers.LeakyReLU(alpha=0.01),
+                # layers.Dense(2 * self.cardinality),
+                # layers.LeakyReLU(alpha=0.01),
+                layers.Dense(self.cardinality),
+                layers.LeakyReLU(alpha=0.01),
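+                # Sigmoid head: one independent probability per recovered bit.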
+                layers.Dense(self.bits_per_symbol, activation='sigmoid'),
             ]
+
+        # Layer configuration for the case when only symbol mapping is to be learnt
         else:
-            input_layer = layers.Input(shape=(self.messages_per_block, self.cardinality))
+            encoding_layers = [
+                layers.Input(shape=(self.messages_per_block, self.cardinality)),
+                layers.TimeDistributed(layers.Dense(2 * self.cardinality)),
+                layers.TimeDistributed(layers.LeakyReLU(alpha=0.01)),
+                layers.TimeDistributed(layers.Dense(2 * self.cardinality)),
+                layers.TimeDistributed(layers.LeakyReLU(alpha=0.01)),
+                # layers.TimeDistributed(layers.Dense(self.samples_per_symbol, activation='sigmoid')),
+                layers.TimeDistributed(layers.Dense(self.samples_per_symbol)),
+                layers.TimeDistributed(layers.ReLU(max_value=1.0))
+            ]
             decoding_layers = [
-                layers.Dense(2 * self.cardinality, activation='relu'),
-                layers.Dense(2 * self.cardinality, activation='relu')
+                layers.Dense(2 * self.cardinality),
+                layers.LeakyReLU(alpha=0.01),
+                layers.Dense(2 * self.cardinality),
+                layers.LeakyReLU(alpha=0.01),
+                layers.Dense(self.cardinality),
+                layers.LeakyReLU(alpha=0.01),
+                layers.Dense(self.bits_per_symbol, activation='sigmoid'),
             ]

         # Encoding Neural Network
         self.encoder = tf.keras.Sequential([
-            input_layer,
-            layers.Dense(2 * self.cardinality, activation='relu'),
-            layers.Dense(2 * self.cardinality, activation='relu'),
-            layers.Dense(self.samples_per_symbol),
-            layers.ReLU(max_value=1.0)
+            *encoding_layers
         ], name="encoding_model")

         # Decoding Neural Network
         self.decoder = tf.keras.Sequential([
-            layers.Dense(self.samples_per_symbol, activation='relu'),
-            *decoding_layers,
-            layers.Dense(self.cardinality, activation='softmax')
+            *decoding_layers
         ], name="decoding_model")

     def generate_random_inputs(self, num_of_blocks, return_vals=False):
@@ -93,33 +122,30 @@ class EndToEndAutoencoder(tf.keras.Model):

         mid_idx = int((self.messages_per_block - 1) / 2)

-        if self.recurrent and not return_vals:
-            rand_int = np.random.randint(self.cardinality, size=(num_of_blocks+self.messages_per_block-1, 1))
-
-            rand_enc = enc.fit_transform(rand_int)
+        if self.bit_mapping:
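+            # Draw i.i.d. uniform bits directly; no one-hot encoding is needed.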
+            rand_int = np.random.randint(2, size=(num_of_blocks * self.messages_per_block * self.bits_per_symbol, 1))

-            out = []
+            out = rand_int

-            for i in range(num_of_blocks):
-                out.append(rand_enc[i:i+self.messages_per_block])
+            out_arr = np.reshape(out, (num_of_blocks, self.messages_per_block, self.bits_per_symbol))

-            out = np.array(out)
-
-            return out, out[:, mid_idx, :]
+            if return_vals:
+                # TODO: also return the integer symbol values here, mirroring
+                # the one-hot branch below
+                raise NotImplementedError

         else:
             rand_int = np.random.randint(self.cardinality, size=(num_of_blocks * self.messages_per_block, 1))

             out = enc.fit_transform(rand_int)
+
             out_arr = np.reshape(out, (num_of_blocks, self.messages_per_block, self.cardinality))

             if return_vals:
                 out_val = np.reshape(rand_int, (num_of_blocks, self.messages_per_block, 1))
                 return out_val, out_arr, out_arr[:, mid_idx, :]

-            return out_arr, out_arr[:, mid_idx, :]
+        return out_arr, out_arr[:, mid_idx, :]

-    def train(self, num_of_blocks=1e6, batch_size=None, train_size=0.8, lr=1e-3):
+    def train(self, num_of_blocks=1e6, batch_size=None, train_size=0.8, lr=1e-2):
         """
         Method to train the autoencoder. Further configuration to the loss function, optimizer etc. can be made in here.
 
 
@@ -128,8 +154,8 @@ class EndToEndAutoencoder(tf.keras.Model):
         :param train_size: Float less than 1 representing the proportion of the dataset to use for training
         :param lr: The learning rate of the optimizer. Defines how quickly the algorithm converges
         """
-        X_train, y_train = self.generate_random_inputs(int(num_of_blocks*train_size))
-        X_test, y_test = self.generate_random_inputs(int(num_of_blocks*(1-train_size)))
+        X_train, y_train = self.generate_random_inputs(int(num_of_blocks * train_size))
+        X_test, y_test = self.generate_random_inputs(int(num_of_blocks * (1 - train_size)))

         opt = tf.keras.optimizers.Adam(learning_rate=lr)
 
 
@@ -141,30 +167,29 @@ class EndToEndAutoencoder(tf.keras.Model):
                      run_eagerly=False
                      )

-        shuffle = True
-        if self.recurrent and batch_size is None:
-            # If recurrent layers are present in the model then the training data is considered one at a time without
-            # shuffling of the data. This preserves order in the data.
-            batch_size = 1
-            shuffle = False
-
-        self.fit(x=X_train,
-                 y=y_train,
-                 batch_size=batch_size,
-                 epochs=1,
-                 shuffle=shuffle,
-                 validation_data=(X_test, y_test)
-                 )
+        history = self.fit(x=X_train,
+                           y=y_train,
+                           batch_size=batch_size,
+                           epochs=1,
+                           shuffle=True,
+                           validation_data=(X_test, y_test)
+                           )
+
+        plt.plot(history.history['accuracy'])
+        plt.plot(history.history['val_accuracy'])
+        plt.show()
+

     def view_encoder(self):
         '''
-        A method that views the learnt encoder for each distint message. This is displayed as a plot with  asubplot for
-        each image.
+        A method that views the learnt encoder for each distinct message. This is displayed as a plot with a subplot for
+        each message/symbol.
         '''
+
         # Generate inputs for encoder
         messages = np.zeros((self.cardinality, self.messages_per_block, self.cardinality))

-        mid_idx = int((self.messages_per_block-1)/2)
+        mid_idx = int((self.messages_per_block - 1) / 2)

         idx = 0
         for msg in messages:
@@ -177,18 +202,18 @@ class EndToEndAutoencoder(tf.keras.Model):

         # Compute subplot grid layout
         i = 0
-        while 2**i < self.cardinality**0.5:
+        while 2 ** i < self.cardinality ** 0.5:
             i += 1

-        num_x = int(2**i)
+        num_x = int(2 ** i)
         num_y = int(self.cardinality / num_x)

         # Plot all symbols
-        fig, axs = plt.subplots(num_y, num_x, figsize=(2.5*num_x, 2*num_y))
+        fig, axs = plt.subplots(num_y, num_x, figsize=(2.5 * num_x, 2 * num_y))

         t = np.arange(self.samples_per_symbol)
         if isinstance(self.channel.layers[1], OpticalChannel):
-            t = t/self.channel.layers[1].fs
+            t = t / self.channel.layers[1].fs

         sym_idx = 0
         for y in range(num_y):
@@ -220,22 +245,22 @@ class EndToEndAutoencoder(tf.keras.Model):

         # Instantiate LPF layer
         lpf = DigitizationLayer(fs=self.channel.layers[1].fs,
-                                num_of_samples=self.messages_per_block*self.samples_per_symbol,
+                                num_of_samples=self.messages_per_block * self.samples_per_symbol,
                                 q_stddev=0)

         # Apply LPF
         lpf_out = lpf(flat_enc)

         # Time axis
-        t = np.arange(self.messages_per_block*self.samples_per_symbol)
+        t = np.arange(self.messages_per_block * self.samples_per_symbol)
         if isinstance(self.channel.layers[1], OpticalChannel):
             t = t / self.channel.layers[1].fs

         # Plot the concatenated symbols before and after LPF
-        plt.figure(figsize=(2*self.messages_per_block, 6))
+        plt.figure(figsize=(2 * self.messages_per_block, 6))

         for i in range(1, self.messages_per_block):
-            plt.axvline(x=t[i*self.samples_per_symbol], color='black')
+            plt.axvline(x=t[i * self.samples_per_symbol], color='black')

         plt.plot(t, flat_enc.numpy().T, 'x')
         plt.plot(t, flat_enc.numpy().T, 'x')
         plt.plot(t, lpf_out.numpy().T)
         plt.plot(t, lpf_out.numpy().T)
@@ -251,18 +276,18 @@ class EndToEndAutoencoder(tf.keras.Model):
         outputs = self.decoder(rx)
         return outputs


+SAMPLING_FREQUENCY = 336e9
+CARDINALITY = 32
+SAMPLES_PER_SYMBOL = 24
+MESSAGES_PER_BLOCK = 9
+DISPERSION_FACTOR = -21.7 * 1e-24
+FIBER_LENGTH = 50

-if __name__ == '__main__':

-    SAMPLING_FREQUENCY = 336e9
-    CARDINALITY = 32
-    SAMPLES_PER_SYMBOL = 24
-    MESSAGES_PER_BLOCK = 9
-    DISPERSION_FACTOR = -21.7 * 1e-24
-    FIBER_LENGTH = 50
+if __name__ == '__main__':

     optical_channel = OpticalChannel(fs=SAMPLING_FREQUENCY,
-                                     num_of_samples=MESSAGES_PER_BLOCK*SAMPLES_PER_SYMBOL,
+                                     num_of_samples=MESSAGES_PER_BLOCK * SAMPLES_PER_SYMBOL,
                                      dispersion_factor=DISPERSION_FACTOR,
                                      fiber_length=FIBER_LENGTH)

@@ -270,11 +295,13 @@ if __name__ == '__main__':
                                    samples_per_symbol=SAMPLES_PER_SYMBOL,
                                    messages_per_block=MESSAGES_PER_BLOCK,
                                    channel=optical_channel,
-                                   recurrent=True)
-
-    ae_model.train(num_of_blocks=1e5)
-    ae_model.view_encoder()
-    ae_model.view_sample_block()
-    ae_model.summary()
-
+                                   bit_mapping=True)
+
+    ae_model.train(num_of_blocks=1e6)
+    # ae_model.view_encoder()
+    # ae_model.view_sample_block()
+    # ae_model.summary()
+    ae_model.encoder.summary()
+    ae_model.channel.summary()
+    ae_model.decoder.summary()
     pass
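
A quick way to gauge the learnt bit mapping after training (a minimal sketch, not part of this commit, assuming the bit_mapping model's call returns one sigmoid probability per bit of the central message):

    X, y = ae_model.generate_random_inputs(int(1e4))
    y_prob = ae_model.predict(X)          # per-bit probabilities, shape (blocks, bits)
    y_hat = (y_prob > 0.5).astype(int)    # hard bit decisions
    print("Estimated BER:", np.mean(y_hat != y))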

+ 67 - 2
tests/misc_test.py

@@ -1,5 +1,10 @@
 import misc
 import numpy as np
+import math
+import itertools
+import tensorflow as tf
+from models.custom_layers import BitsToSymbols, SymbolsToBits, OpticalChannel
+from matplotlib import pyplot as plt


 def test_bit_matrix_one_hot():
@@ -11,5 +16,65 @@


 if __name__ == "__main__":
-    test_bit_matrix_one_hot()
-    print("Everything passed")
+
+    # cardinality = 8
+    # messages_per_block = 3
+    # num_of_blocks = 10
+    # bits_per_symbol = 3
+    #
+    # #-----------------------------------
+    #
+    # mid_idx = int((messages_per_block - 1) / 2)
+    #
+    # ################################################################################################################
+    #
+    # # rand_int = np.random.randint(self.cardinality, size=(num_of_blocks * self.messages_per_block, 1))
+    # rand_int = np.random.randint(2, size=(num_of_blocks * messages_per_block * bits_per_symbol, 1))
+    #
+    # # out = enc.fit_transform(rand_int)
+    # out = rand_int
+    #
+    # # out_arr = np.reshape(out, (num_of_blocks, self.messages_per_block, self.cardinality))
+    # out_arr = np.reshape(out, (num_of_blocks, messages_per_block, bits_per_symbol))
+    #
+    # out_arr_tf = tf.convert_to_tensor(out_arr, dtype=tf.float32)
+    #
+    #
+    # n = int(math.log(cardinality, 2))
+    # pows = tf.convert_to_tensor(np.power(2, np.linspace(n - 1, 0, n)).reshape(-1, 1), dtype=tf.float32)
+    #
+    # pows_np = pows.numpy()
+    #
+    # a = np.asarray([0, 1, 1]).reshape(1, -1)
+    #
+    # b = tf.tensordot(out_arr_tf, pows, axes=1).numpy()
+
+    SAMPLING_FREQUENCY = 336e9
+    CARDINALITY = 32
+    SAMPLES_PER_SYMBOL = 100
+    NUM_OF_SYMBOLS = 10
+    DISPERSION_FACTOR = -21.7 * 1e-24
+    FIBER_LENGTH = 50
+
+    optical_channel = OpticalChannel(fs=SAMPLING_FREQUENCY,
+                                     num_of_samples=NUM_OF_SYMBOLS * SAMPLES_PER_SYMBOL,
+                                     dispersion_factor=DISPERSION_FACTOR,
+                                     fiber_length=FIBER_LENGTH,
+                                     rx_stddev=0,
+                                     q_stddev=0)
+
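+    # Hold each random 4-level symbol for SAMPLES_PER_SYMBOL samples, then
+    # compare the waveform before and after the dispersive optical channel.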
+    inp = np.random.randint(4, size=(NUM_OF_SYMBOLS, ))
+
+    inp_t = np.repeat(inp, SAMPLES_PER_SYMBOL).reshape(1, -1)
+
+    plt.plot(inp_t.flatten())
+
+    out_tf = optical_channel(inp_t)
+
+    out_np = out_tf.numpy()
+
+    plt.plot(out_np.flatten())
+    plt.show()
+
+
+    pass