import tensorflow as tf
from plot_keras_history import show_history, plot_history

# Feature matrices and 'R1M_Usd' label vectors for the dense networks,
# pulled out of the train / test frames as plain arrays via `.values`.
NN_train_features, NN_train_labels = (
    training_sample[features].values,
    training_sample['R1M_Usd'].values,
)
NN_test_features, NN_test_labels = (
    testing_sample[features].values,
    testing_sample['R1M_Usd'].values,
)


from tensorflow import keras
from tensorflow.keras import layers

# Regression MLP: len(features) inputs -> 16 units (ReLU) -> 8 units (tanh)
# -> 1 output unit with no activation argument.
model = keras.Sequential([
    layers.Dense(16, activation="relu", input_shape=(len(features),)),
    layers.Dense(8, activation="tanh"),
    layers.Dense(1),
])

# RMSprop optimizer, mean-squared-error loss, MAE reported as a metric.
model.compile(
    metrics=['MeanAbsoluteError'],
    loss='mse',
    optimizer='RMSprop',
)
model.summary()  # Print the layer-by-layer structure and parameter counts

Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 dense_3 (Dense)             (None, 16)                1504      
                                                                 
 dense_4 (Dense)             (None, 8)                 136       
                                                                 
 dense_5 (Dense)             (None, 1)                 9         
                                                                 
=================================================================
Total params: 1,649
Trainable params: 1,649
Non-trainable params: 0
_________________________________________________________________


# Train for 10 epochs in mini-batches of 256 rows. The test arrays are passed
# as validation data, so the val_* figures in the log are computed on them.
fit_NN = model.fit(
    x=NN_train_features,
    y=NN_train_labels,
    validation_data=(NN_test_features, NN_test_labels),
    epochs=10,
    batch_size=256,
    verbose=True,  # Show per-epoch progress
)
show_history(fit_NN)  # Plot the recorded training history

Epoch 1/10
774/774 [==============================] - 1s 962us/step - loss: 0.0289 - mean_absolute_error: 0.0839 - val_loss: 0.0371 - val_mean_absolute_error: 0.0670
Epoch 2/10
774/774 [==============================] - 1s 950us/step - loss: 0.0289 - mean_absolute_error: 0.0838 - val_loss: 0.0370 - val_mean_absolute_error: 0.0667
Epoch 3/10
774/774 [==============================] - 1s 947us/step - loss: 0.0289 - mean_absolute_error: 0.0839 - val_loss: 0.0371 - val_mean_absolute_error: 0.0672
Epoch 4/10
774/774 [==============================] - 1s 912us/step - loss: 0.0289 - mean_absolute_error: 0.0839 - val_loss: 0.0370 - val_mean_absolute_error: 0.0669
Epoch 5/10
774/774 [==============================] - 1s 920us/step - loss: 0.0289 - mean_absolute_error: 0.0839 - val_loss: 0.0370 - val_mean_absolute_error: 0.0671
Epoch 6/10
774/774 [==============================] - 1s 919us/step - loss: 0.0288 - mean_absolute_error: 0.0839 - val_loss: 0.0372 - val_mean_absolute_error: 0.0679
Epoch 7/10
774/774 [==============================] - 1s 917us/step - loss: 0.0288 - mean_absolute_error: 0.0839 - val_loss: 0.0372 - val_mean_absolute_error: 0.0677
Epoch 8/10
774/774 [==============================] - 1s 1ms/step - loss: 0.0288 - mean_absolute_error: 0.0839 - val_loss: 0.0370 - val_mean_absolute_error: 0.0668
Epoch 9/10
774/774 [==============================] - 1s 912us/step - loss: 0.0289 - mean_absolute_error: 0.0839 - val_loss: 0.0372 - val_mean_absolute_error: 0.0680
Epoch 10/10
774/774 [==============================] - 1s 908us/step - loss: 0.0288 - mean_absolute_error: 0.0839 - val_loss: 0.0370 - val_mean_absolute_error: 0.0666


# Hit ratio: share of test observations whose prediction has the same sign as
# the realized label. `predict` returns an array of shape (n, 1) whereas the
# labels are 1-D (n,); multiplying them directly would broadcast to an (n, n)
# matrix and compare every prediction with every label. Flattening the
# predictions first keeps the product element-wise.
hitratio = np.mean(model.predict(NN_test_features).ravel() * NN_test_labels > 0)
print(f'Hit Ratio: {hitratio}')

Hit Ratio: 0.5416737440003773


from tensorflow.keras.utils import to_categorical

# One-hot encode the 'R1M_Usd_C' column of the training and testing samples.
NN_train_labels_C, NN_test_labels_C = (
    to_categorical(sample['R1M_Usd_C'].values)
    for sample in (training_sample, testing_sample)
)


from tensorflow.keras import initializers
from tensorflow.keras.constraints import non_neg

# Weight initializer handed to the first dense layer below.
initializer = initializers.RandomNormal()

# Classifier: 16 tanh units (non-negative kernel constraint) -> 25% dropout
# -> 8 ELU units (biases start at 0.2, L2 kernel penalty) -> 2-unit softmax.
model_C = keras.Sequential([
    layers.Dense(
        16,
        activation="tanh",
        input_shape=(len(features),),    # One input per feature
        kernel_initializer=initializer,  # Initial kernel weights
        kernel_constraint=non_neg(),     # Kernel weights kept non-negative
    ),
    layers.Dropout(.25),
    layers.Dense(
        8,
        activation="elu",
        bias_initializer=initializers.Constant(0.2),
        kernel_regularizer='l2',
    ),
    layers.Dense(2, activation='softmax'),
])


# The network ends in a 2-unit softmax layer and is fitted on one-hot labels,
# so the loss must consume probabilities: categorical cross-entropy with its
# default from_logits=False. Passing from_logits=True here would treat the
# softmax outputs as raw logits, which Keras flags with a UserWarning.
model_C.compile(
    optimizer=keras.optimizers.Adam(
        learning_rate=0.01,  # Step size of the weight updates
        beta_1=0.9,          # Exponential decay rate for the 1st moment estimates
        beta_2=0.95,         # Exponential decay rate for the 2nd moment estimates
    ),
    loss=keras.losses.CategoricalCrossentropy(),  # Loss on softmax probabilities
    metrics=['categorical_accuracy'],             # Output metric
)
model_C.summary()  # Model structure

Model: "sequential_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 dense_6 (Dense)             (None, 16)                1504      
                                                                 
 dropout (Dropout)           (None, 16)                0         
                                                                 
 dense_7 (Dense)             (None, 8)                 136       
                                                                 
 dense_8 (Dense)             (None, 2)                 18        
                                                                 
=================================================================
Total params: 1,658
Trainable params: 1,658
Non-trainable params: 0
_________________________________________________________________


# Early stopping on "val_loss": an epoch counts as an improvement only if the
# loss moves by at least 0.001, and training halts after 4 epochs without one.
# verbose=0 keeps the callback itself silent.
callback = tf.keras.callbacks.EarlyStopping(
    monitor="val_loss",
    min_delta=0.001,
    patience=4,
    verbose=0,
)

# Up to 20 epochs in mini-batches of 512; the test arrays serve as validation
# data, which is what the early-stopping callback monitors.
fit_NN_C = model_C.fit(
    x=NN_train_features,
    y=NN_train_labels_C,
    validation_data=(NN_test_features, NN_test_labels_C),
    epochs=20,
    batch_size=512,
    callbacks=[callback],
    verbose=True,  # Show per-epoch progress
)
show_history(fit_NN_C)

Epoch 1/20

C:\Users\TGU.RAMAI\Anaconda3\lib\site-packages\tensorflow\python\util\dispatch.py:1096: UserWarning: "`binary_crossentropy` received `from_logits=True`, but the `output` argument was produced by a sigmoid or softmax activation and thus does not represent logits. Was this intended?"
  return dispatch_target(*args, **kwargs)

387/387 [==============================] - 1s 2ms/step - loss: 0.6993 - categorical_accuracy: 0.5030 - val_loss: 0.6938 - val_categorical_accuracy: 0.4963
Epoch 2/20
387/387 [==============================] - 1s 1ms/step - loss: 0.6934 - categorical_accuracy: 0.5004 - val_loss: 0.6932 - val_categorical_accuracy: 0.5037
Epoch 3/20
387/387 [==============================] - 1s 1ms/step - loss: 0.6933 - categorical_accuracy: 0.5017 - val_loss: 0.6931 - val_categorical_accuracy: 0.5037
Epoch 4/20
387/387 [==============================] - 1s 1ms/step - loss: 0.6933 - categorical_accuracy: 0.5007 - val_loss: 0.6932 - val_categorical_accuracy: 0.4963
Epoch 5/20
387/387 [==============================] - 1s 1ms/step - loss: 0.6934 - categorical_accuracy: 0.5014 - val_loss: 0.6932 - val_categorical_accuracy: 0.5037


# Network trained with the custom loss: len(features) inputs -> 16 units
# (ReLU) -> 8 units (sigmoid) -> 1 output unit. No activation is given on the
# last layer, i.e. it is linear: f(x) = x.
model_custom = keras.Sequential([
    layers.Dense(16, activation="relu", input_shape=(len(features),)),
    layers.Dense(8, activation="sigmoid"),
    layers.Dense(1),
])


def custom_loss(y_true, y_pred, gamma=5.0):
    """Return Var(y_pred) - gamma * Cov(y_true, y_pred) over the batch.

    Both moments are taken as plain means over every element of the tensors
    (population form, no degrees-of-freedom correction).

    Args:
        y_true: Tensor of realized labels.
        y_pred: Tensor of model predictions.
        gamma: Weight of the covariance term; the default of 5 is the value
            used when the function is passed to ``compile`` as-is.

    Returns:
        Scalar tensor with the loss value.
    """
    # NOTE(review): the product below assumes y_true and y_pred have matching
    # shapes; a (n,) vs (n, 1) pair would broadcast to (n, n). Confirm that
    # Keras aligns the ranks before calling the loss.
    pred_dev = y_pred - tf.reduce_mean(y_pred)  # Centred predictions, reused twice
    true_dev = y_true - tf.reduce_mean(y_true)  # Centred labels
    variance = tf.reduce_mean(tf.square(pred_dev))
    covariance = tf.reduce_mean(true_dev * pred_dev)
    return variance - gamma * covariance
# Compile with RMSprop and the user-defined `custom_loss`; MAE is tracked as
# an additional metric.
model_custom.compile(
    metrics=['MeanAbsoluteError'],
    loss=custom_loss,
    optimizer='RMSprop',
)


# 10 epochs in mini-batches of 512, validated on the test arrays.
fit_NN_cust = model_custom.fit(
    x=NN_train_features,
    y=NN_train_labels,
    validation_data=(NN_test_features, NN_test_labels),
    epochs=10,
    batch_size=512,
    verbose=False,  # Silent training: no progress output
)
show_history(fit_NN_cust)


# Hit ratio of the custom-loss model: share of test observations whose
# prediction and realized label have the same sign. `predict` returns shape
# (n, 1) while the labels are 1-D (n,); without flattening, the product would
# broadcast to an (n, n) matrix pairing every prediction with every label.
hitratio = np.mean(model_custom.predict(NN_test_features).ravel() * NN_test_labels > 0)
print(f'Hit Ratio: {hitratio}')

Hit Ratio: 0.44688639471285324


# Keep only the stocks listed in `stock_ids_short`, then split on the date:
# rows strictly before `separation_date` go to training, rows strictly after
# it go to testing.
# NOTE(review): a row dated exactly `separation_date` lands in neither set;
# confirm this is intended.
data_rnn = data_ml.loc[data_ml['stock_id'].isin(stock_ids_short)]
training_sample_rnn = data_rnn.loc[data_rnn['date'] < separation_date]
testing_sample_rnn = data_rnn.loc[data_rnn['date'] > separation_date]

# Dimensions of the RNN arrays. The number of dates is obtained by integer
# division of the row count by the number of stocks.
# NOTE(review): this presumes every stock contributes the same number of
# rows; verify against the data.
nb_stocks = len(stock_ids_short)
nb_feats = len(features)
nb_dates_train = len(training_sample_rnn) // nb_stocks
nb_dates_test = len(testing_sample_rnn) // nb_stocks

# Features and 'R1M_Usd' labels of both samples as plain arrays.
nn_train_features, nn_train_labels = (
    training_sample_rnn[features].values,
    training_sample_rnn['R1M_Usd'].values,
)
nn_test_features, nn_test_labels = (
    testing_sample_rnn[features].values,
    testing_sample_rnn['R1M_Usd'].values,
)


# Fold the flat 2-D arrays into 3-D arrays whose axes are (stock, date,
# feature); the labels get a trailing axis of size 1.
# NOTE(review): the reshape fills the date axis fastest, so it presumes the
# rows are ordered by stock first and by date within each stock. Confirm
# the sort order of `data_ml`.
train_features_rnn = nn_train_features.reshape(nb_stocks, nb_dates_train, nb_feats)
test_features_rnn = nn_test_features.reshape(nb_stocks, nb_dates_test, nb_feats)
train_labels_rnn = nn_train_labels.reshape(nb_stocks, nb_dates_train, 1)
test_labels_rnn = nn_test_labels.reshape(nb_stocks, nb_dates_test, 1)


# Recurrent model: a 16-unit GRU that returns its output at every date,
# followed by a Dense(1) layer. The input shape is fixed to the training
# array's (stock, date, feature) dimensions.
model_RNN = keras.Sequential([
    layers.GRU(
        16,                                                       # Units in the hidden layer
        batch_input_shape=(nb_stocks, nb_dates_train, nb_feats),  # Full input dimensions
        activation='tanh',
        return_sequences=True,                                    # Keep the whole output sequence
    ),
    layers.Dense(1),
])
model_RNN.compile(
    metrics=['MeanAbsoluteError'],  # Output metric: MAE
    loss='mse',                     # Quadratic loss
    optimizer='RMSprop',            # Weight-update method
)


# The training array holds one sequence per stock along its first axis, so a
# batch size of `nb_stocks` feeds all sequences in a single batch per epoch.
fit_RNN = model_RNN.fit(
    x=train_features_rnn,
    y=train_labels_rnn,
    batch_size=nb_stocks,  # Number of sequences per batch
    epochs=10,             # Number of passes over the data
    verbose=False,         # Silent training: no progress output
)
show_history(fit_RNN)


# Same architecture as `model_RNN`, but with the input shape set to the test
# array's dimensions (nb_dates_test instead of nb_dates_train). The trained
# weights are then copied over so the new model can predict on the test data.
new_model = keras.Sequential([
    layers.GRU(
        16,
        batch_input_shape=(nb_stocks, nb_dates_test, nb_feats),  # Test-set dimensions
        activation='tanh',
        return_sequences=True,                                   # Keep the whole output sequence
    ),
    layers.Dense(1),
])
new_model.set_weights(model_RNN.get_weights())


# Predict on the test sequences and compute the hit ratio: the fraction of
# entries where prediction and label have the same sign. Both arrays are
# multiplied element-wise.
pred_rnn = new_model.predict(test_features_rnn, batch_size=nb_stocks)
same_sign = pred_rnn * test_labels_rnn > 0
hitratio = np.mean(same_sign)
print(f'Hit Ratio: {hitratio}')

Hit Ratio: 0.498276586801177

Chapter 7 Neural networks¶

7.1 The original perceptron¶

7.2 Multilayer perceptron¶

7.2.1 Introduction and notations¶

7.2.2 Universal approximation¶

7.2.3 Learning via back-propagation¶

7.2.4 Further details on classification¶

7.3 How deep we should go and other practical issues¶

7.3.1 Architectural choices¶

7.3.2 Frequency of weight updates and learning duration¶

7.3.3 Penalizations and dropout¶

7.4 Code samples and comments for vanilla MLP¶

7.4.1 Regression example¶

7.4.2 Classification example¶

7.4.3 Custom losses¶

7.5 Recurrent networks¶

7.5.1 Presentation¶

7.5.2 Code and results¶

7.6 Other common architectures¶

7.6.1 Generative adversarial networks¶

7.6.2 Autoencoders¶

7.6.3 A word on convolutional networks¶

7.6.4 Advanced architectures¶

7.7 Coding exercises¶

References¶