LSTM (Long short-term memory) Attention Model for Trading

By Aman Jindal, CFA, FRM, CQF

Deep learning has been applied to the problem of time series forecasting.¶

Two stocks, from the same industry, viz. The Home Depot, Inc., HD (NYSE) and Lowe's Companies, Inc., LOW (NYSE) have been chosen. Their six years of traded stock price data (2014-19) has been obtained. Then technical features for these two stocks corresponding to their six year of data have been designed and analyzed.
Post that LSTM Attention Models have been built using the first five years of data (2014-2018) for both the stocks individually. Subsequently, the models have been assessed to check for the predictive power and efficacy.
Google Colab has been used to build the model because of GPU constraints of a standard computer

# Installing yfinance, ta-lib and yellowbrick libraries 

!pip install yfinance
!wget https://launchpad.net/~mario-mariomedina/+archive/ubuntu/talib/+files/libta-lib0_0.4.0-oneiric1_amd64.deb -qO libta.deb
!wget https://launchpad.net/~mario-mariomedina/+archive/ubuntu/talib/+files/ta-lib0-dev_0.4.0-oneiric1_amd64.deb -qO ta.deb
!dpkg -i libta.deb ta.deb
!pip install ta-lib
!pip install -U yellowbrick

import matplotlib.pyplot as plt
import pandas as pd
import numpy as np
import yfinance as yf
import talib
import datetime
import warnings
warnings.filterwarnings("ignore")

from tensorflow.keras.layers import LSTM, Dense, Dot, Activation, Input
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.models import Model
import tensorflow.keras.backend as K
import tensorflow as tf

# Importing Data
# Stocks chosen are HD and LOW

start = datetime.datetime(2013, 12, 31)
end   = datetime.datetime(2019, 12, 31)

df = yf.download('HD', start=start, end=end)
df1 = yf.download('LOW', start=start, end=end)

[*********************100%***********************]  1 of 1 completed
[*********************100%***********************]  1 of 1 completed

df.head()

# Visualizing Stock Prices

plt.figure(figsize=(10,6))
df['Adj Close'].plot(label='HD')
df1['Adj Close'].plot(label='LOW')
plt.legend()
plt.title('Stock Price Movememt',fontsize=16)
plt.grid(False);

# Creating Features
# 10 Day return direction has been chosen for prediction

HD = df.copy()
LOW = df1.copy()
stocks = {'HD':HD,'LOW':LOW}

for stock in stocks.values():
    
    features = []
    stock.rename(columns={'Adj Close':'price'}, inplace=True)
    stock['price_FD10'] = stock['price'].shift(-10)
    stock['ret_D10'] = np.log(stock['price']/stock['price'].shift(10))
    stock['ret_FD10'] = np.log(stock['price_FD10']/stock['price_FD10'].shift(10))
    stock['label'] = np.where(stock['ret_FD10']>=0,1,0)
    
    for i in [10]:
        stock['ret_10Dlag'+ str(i)] = stock['ret_D10'].shift(i)
        features.extend(['ret_10Dlag'+str(i)])
    
    for i in [28]:
        stock['mom_D'+str(i)] = talib.MOM(stock['price'], timeperiod=i)
        features.extend(['mom_D'+str(i)])
    
    for i in [14,50,200]:
      
        stock['sma_D'+str(i)] = talib.SMA(stock['price'], timeperiod=i)
        stock['ema_D'+str(i)] = talib.EMA(stock['price'], timeperiod=i)
        stock['rsi_D'+str(i)] = talib.RSI(stock['price'], timeperiod=i)
        stock['cmo_D'+str(i)] = talib.CMO(stock['price'], timeperiod=i)
  
        features.extend(['sma_D'+str(i),'ema_D'+str(i),'rsi_D'+str(i),'cmo_D'+str(i)])
    
    for i in [20]:
        stock['bolUP_D'+str(i)], middleband, stock['bolDOWN_D'+str(i)] = talib.BBANDS(stock['price'], timeperiod=i)
        stock['bolBandwidth_D'+str(i)] = (stock['bolUP_D'+str(i)] - stock['bolDOWN_D'+str(i)])/middleband

        features.extend(['bolUP_D'+str(i),'bolDOWN_D'+str(i),'bolBandwidth_D'+str(i)])
    
    stock['macd'], stock['macdSignal'], _ = talib.MACD(stock['price'])
    
    features.extend(['macd','macdSignal'])
    
    stock.dropna(inplace=True)

target_names = {0:"Down Move",1:"Up Move"}

print(features)

['ret_10Dlag10', 'mom_D28', 'sma_D14', 'ema_D14', 'rsi_D14', 'cmo_D14', 'sma_D50', 'ema_D50', 'rsi_D50', 'cmo_D50', 'sma_D200', 'ema_D200', 'rsi_D200', 'cmo_D200', 'bolUP_D20', 'bolDOWN_D20', 'bolBandwidth_D20', 'macd', 'macdSignal']

# Sanity Check

np.all(HD.index == LOW.index)

True

# Function for creating Train and Test Sets

def createTrainTest(stock, features, testSize = 252):
    
    totalRecords = len(stock.index)
    test = np.arange(totalRecords - testSize, totalRecords)
    train = np.arange(0,test[0])
    X_train = stock.loc[stock.index[train],features]
    X_test = stock.loc[stock.index[test],features]
    y_train = stock.loc[stock.index[train],'label']
    y_test = stock.loc[stock.index[test],'label']
    
    return X_train, X_test, y_train.to_numpy().reshape(-1,1), y_test.to_numpy().reshape(-1,1)

# Function for Scaling Data

def scaleTrainTest(X_train, X_test):
    
    from sklearn.preprocessing import RobustScaler
    
    scaler = RobustScaler().fit(X_train)
    X_train_scaled = scaler.transform(X_train)
    X_test_scaled = scaler.transform(X_test)
    
    return X_train_scaled, X_test_scaled

# Function for creating Data for Deep Learning Network

def createDataLSTM(X_train, X_test, y_train, y_test, n_features, n_days=28, testSize=252):

    X_train_LSTM = np.zeros((X_train.shape[0]-n_days+1, n_days, n_features))
    X_test_LSTM = np.zeros((testSize, n_days, n_features))
    y_train_LSTM = np.zeros((X_train.shape[0]-n_days+1,1))
    
    for i in range(X_train.shape[0]-n_days+1):
        X_train_LSTM[i,0:n_days] = X_train[i:i+n_days]
        y_train_LSTM[i] = y_train[i+n_days-1]
    
    j = 0
    for i in range(testSize):
        if i<(n_days-1):
            X_test_LSTM[i,0:n_days-1-i] = X_train[X_train.shape[0]-n_days+1+i:]
            X_test_LSTM[i,n_days-1-i:] = X_test[0:i+1] 
        else:
            X_test_LSTM[i,0:n_days] = X_test[j:j+n_days]
            j = j+1
    return X_train_LSTM, X_test_LSTM, y_train_LSTM, y_test

# Function for Feature Scoring and Selection 

def featureImportances(X_train,y_train):
    
    from sklearn.ensemble import RandomForestClassifier
    from sklearn.ensemble import AdaBoostClassifier
    from sklearn.ensemble import GradientBoostingClassifier
    from yellowbrick.model_selection import FeatureImportances

    rfc = RandomForestClassifier(max_depth=3, n_jobs=-1,random_state=0)
    viz1 = FeatureImportances(rfc,relative=False,labels=features)
    viz1.fit(X_train, y_train)
    viz1.show()

    abc = AdaBoostClassifier(n_estimators=100,random_state=0)
    viz2 = FeatureImportances(abc,relative=False,labels=features)
    viz2.fit(X_train, y_train)
    viz2.show()

    gbc = GradientBoostingClassifier(max_depth=3,random_state=0)
    viz3= FeatureImportances(gbc,relative=False,labels=features)
    viz3.fit(X_train, y_train)
    viz3.show();

# Function for plotting K-Means Clustering

def plotKMeans(X_train, y_train, cols, axis_labels=None, title=None):

    import matplotlib.pyplot as plt 
    import matplotlib.patches as mpatches
    from matplotlib.colors import ListedColormap, BoundaryNorm
    
    x_min, x_max = X_train[:, cols[0]].min() - 1, X_train[:, cols[0]].max() + 1
    y_min, y_max = X_train[:, cols[1]].min() - 1, X_train[:, cols[1]].max() + 1

    class_names = ['Cluster 1', 'Cluster 2']
    color_list = ['#FFFF00', '#00AAFF']
    cmap_bold = ListedColormap(color_list)
    bnorm = BoundaryNorm(np.arange(0, 3), ncolors=2)
    
    plt.figure(figsize=(7,7))
    plt.xlim(x_min, x_max)
    plt.ylim(y_min, y_max)
    plt.scatter(X_train[:, cols[0]], X_train[:, cols[1]], s=100, c=y_train, cmap=cmap_bold, norm = bnorm, edgecolor='black', lw = 1)
    plt.xlabel(axis_labels[0], fontsize=13)
    plt.ylabel(axis_labels[1], fontsize=13)

    legend_handles = []
    for i in range(0, 2):
        patch = mpatches.Patch(color=color_list[i], label=class_names[i])
        legend_handles.append(patch) 
    plt.legend(handles=legend_handles, fontsize=13)
    plt.title('{}: K-Means Clustering'.format(title),fontdict = {'fontsize':16})
    plt.show();

# Function for Calculating Daily Profit and Loss over the Test Set

def calcPnL(model,stock,X_test,y_test,threshold = 0.5,testSize=252, stock_name=None):
    
    totalRecords = len(stock.index)
    test = np.arange(totalRecords - testSize, totalRecords)
    analysis = pd.DataFrame(data = stock.loc[stock.index[test],'ret_FD10'],index = stock.index[test])
    analysis['buyAndHold'] = (stock.loc[stock.index[test],'price']/stock.loc[stock.index[test[0]],'price'])-1.0
    analysis['probUP'] = model.predict(X_test)
    analysis['betSize'] = np.where(analysis['probUP']>threshold,2*analysis['probUP']-1,0.0)
    analysis['dailyP&L'] = analysis['ret_FD10']*analysis['betSize']
     
    profitLSTM = analysis['dailyP&L'].sum()*100
    profitBuyHold = (analysis.loc[analysis.index[testSize-1],'buyAndHold'])*100
    
    plt.figure(figsize=(10,6))
    plt.plot(analysis['dailyP&L'].cumsum(),label='LSTM Attention, Return = {:.2f} %'.format(profitLSTM))
    plt.plot(analysis['buyAndHold'], label='Buy and Hold, Return = {:.2f} %'.format(profitBuyHold))
    plt.legend(fontsize=13)
    plt.title('{}: Returns generated over 2019 (Test Set)'.format(stock_name),fontdict = {'fontsize':16})
    plt.grid(False);

# Function for ConfusionMatrix, Classification Report Precision-Recall Curve, Area under ROC Curve 

def plotMetrics(model, X_test, y_test, target_names, title=None):

    from sklearn.metrics import confusion_matrix, plot_confusion_matrix, classification_report, precision_recall_curve, roc_curve, auc 
    
    y_scores = model.predict(X_test)
    y_pred = np.where(model.predict(X_test)>=0.5,1,0)
    print("\n\033[1m\t\t\033[4m {} Confusion Matrix\033[0m\033[0m\n".format(title))
    print(confusion_matrix(y_test, y_pred))
    print("\n\033[1m\t\t\033[4m {} Classification Report\033[0m\033[0m\n".format(title))
    print(classification_report(y_test, y_pred, target_names=target_names))
    
    precision, recall, _ = precision_recall_curve(y_test, y_scores)
    plt.figure(figsize=(7,7))
    plt.xlim([0.0, 1.01])
    plt.ylim([0.0, 1.01])
    plt.plot(precision, recall, label='Precision-Recall Curve')
    plt.xlabel('Precision', fontsize=14)
    plt.ylabel('Recall', fontsize=14)
    plt.title("{} Precision Recall Curve".format(title), fontsize=16)
    plt.grid(True)
    plt.show();
    print('\n\n')

    fpr, tpr, _ = roc_curve(y_test, y_scores)
    roc_auc = auc(fpr, tpr)

    plt.figure(figsize=(7,7))
    plt.xlim([-0.01, 1.01])
    plt.ylim([-0.01, 1.01])
    plt.plot(fpr, tpr, lw=3, label='AUC = {:0.2f}'.format(roc_auc))
    plt.xlabel('False Positive Rate', fontsize=12)
    plt.ylabel('True Positive Rate', fontsize=12)
    plt.title('{} ROC curve'.format(title), fontsize=16)
    plt.legend(loc='lower right', fontsize=13)
    plt.plot([0, 1], [0, 1], lw=2, linestyle='-.')
    plt.grid(True)
    plt.show();

# Function for Plotting Transition Probabilities

def plotTransitionProb(model,stock,X_test,y_test,title = None,testSize = 252):
    
    import matplotlib.pyplot as plt 
    import matplotlib.patches as mpatches
    from matplotlib.colors import ListedColormap
    
    y_scores = model.predict(X_test)
    y_pred = np.where(model.predict(X_test)>=0.5,1,0)
    totalRecords = len(stock.index)
    test = np.arange(totalRecords - testSize, totalRecords)
    target_names = ['Wrong Prediction','Correct Prediction']
    c = y_test == y_pred
    color_list = ['#EEEE00','#0000CC']
    cmap = ListedColormap(color_list)
    legend_handles = []
    for i in range(0, len(target_names)):
        patch = mpatches.Patch(color=color_list[i], label=target_names[i])
        legend_handles.append(patch)

    plt.figure(figsize=(10,6))
    plt.scatter(stock.index[test],y_scores, c = c, cmap = cmap)
    plt.legend(loc=0,handles=legend_handles)
    plt.title('{}: Transition Probabilities for Up Moves'.format(title),fontdict = {'fontsize':16})
    plt.grid(True);

    plt.figure(figsize=(10,6))
    plt.scatter(stock.index[test], 1-y_scores, c = c, cmap = cmap)
    plt.legend(loc=0,handles=legend_handles)
    plt.title('{}: Transition Probabilities for Down Moves'.format(title),fontdict = {'fontsize':16})
    plt.grid(True);

# Feature Scoring:

for stock_name, stock in stocks.items():
    
    X_train, X_test, y_train, y_test = createTrainTest(stock, features)
    X_train_scaled, X_test_scaled = scaleTrainTest(X_train, X_test)
    print ("\n\033[1m\t\t\t\t\033[4mAnalyzing {}\033[0m\033[0m".format(stock_name))
    featureImportances(X_train_scaled,y_train)

				Analyzing HD

				Analyzing LOW

# K-Means Clustering

from sklearn.cluster import KMeans

for stock_name, stock in stocks.items():
    
    X_train, X_test, y_train, y_test = createTrainTest(stock, features)
    X_train_scaled, X_test_scaled = scaleTrainTest(X_train, X_test)
  
    kmeans = KMeans(n_clusters = 2, random_state=0)
    X_new = kmeans.fit_transform(X_train_scaled)
    
    # Plotting the two new Transformed Axes

    cols = [0,1]
    axis_labels = ['Transformed Axis 1','Transformed Axis 2']
    plotKMeans(X_new, kmeans.labels_, cols, axis_labels, title=stock_name)
    
    # Plotting EMA50 vs MACD

    cols = [7,17]
    axis_labels = [features[cols[0]],features[cols[1]]]
    plotKMeans(X_train_scaled, kmeans.labels_, cols, axis_labels, title=stock_name)

    # Plotting RSI50 vs Bollinger Bandwidth

    cols = [8,16]
    axis_labels = [features[cols[0]],features[cols[1]]]
    plotKMeans(X_train_scaled, kmeans.labels_, cols, axis_labels, title=stock_name)

    #Plotting SMA200 vs CMA200:

    cols = [10,13]
    axis_labels = [features[cols[0]],features[cols[1]]]
    plotKMeans(X_train_scaled, kmeans.labels_, cols, axis_labels, title=stock_name)

    #Plotting Return vs Momentum:

    cols = [0,1]
    axis_labels = [features[cols[0]],features[cols[1]]]
    plotKMeans(X_train_scaled, kmeans.labels_, cols, axis_labels, title=stock_name)

#Setting number of units for different layers 

np.random.seed(1)
tf.random.set_seed(1)
inputDays = 28
unitsPreLSTM = 128
unitsPostLSTM = 32
unitsDenseAttention = 32

# Function for creating the Attention LSTM Model

def model(inputDays, unitsPreLSTM , unitsPostLSTM, unitsDenseAttention, featuresLen, name=None):
    
    # Pre Attention LSTM

    X = Input(shape=(inputDays, featuresLen), name='Input')
    a = LSTM(units = unitsPreLSTM, return_sequences=True, dropout=0.05, name='PreAttention_LSTM')(X)   
    
    # Computing Attention and Context

    e1 = Dense(unitsDenseAttention, activation = "relu", name='Dense1_Attention')(a)
    e2 = Dense(1, activation = "relu", name='Dense2_Attention')(e1)
    alphas = Activation(lambda x: K.softmax(x, axis=1), name='attention_weights')(e2)
    context = Dot(axes = 1, name='context')([alphas,a])
    
    # Post Attention LSTM
    
    s = LSTM(unitsPostLSTM, dropout=0.05, name='PostAttention_LSTM')(context)
    output = Dense(1, activation='sigmoid', name='Output')(s)
    
    model = Model(inputs=X, outputs=output, name=name)
  
    return model

# Creating the Attention LSTM Model for HD

modelHD = model(inputDays, unitsPreLSTM, unitsPostLSTM, unitsDenseAttention, len(features), name='model_HD')
modelHD.summary()

Model: "model_HD"
__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
==================================================================================================
Input (InputLayer)              [(None, 28, 19)]     0                                            
__________________________________________________________________________________________________
PreAttention_LSTM (LSTM)        (None, 28, 128)      75776       Input[0][0]                      
__________________________________________________________________________________________________
Dense1_Attention (Dense)        (None, 28, 32)       4128        PreAttention_LSTM[0][0]          
__________________________________________________________________________________________________
Dense2_Attention (Dense)        (None, 28, 1)        33          Dense1_Attention[0][0]           
__________________________________________________________________________________________________
attention_weights (Activation)  (None, 28, 1)        0           Dense2_Attention[0][0]           
__________________________________________________________________________________________________
context (Dot)                   (None, 1, 128)       0           attention_weights[0][0]          
                                                                 PreAttention_LSTM[0][0]          
__________________________________________________________________________________________________
PostAttention_LSTM (LSTM)       (None, 32)           20608       context[0][0]                    
__________________________________________________________________________________________________
Output (Dense)                  (None, 1)            33          PostAttention_LSTM[0][0]         
==================================================================================================
Total params: 100,578
Trainable params: 100,578
Non-trainable params: 0
__________________________________________________________________________________________________

# Model Compile Settings for HD

opt = Adam(lr=0.0005, beta_1=0.9, beta_2=0.999, decay=0.01)
modelHD.compile(optimizer=opt, loss='binary_crossentropy', metrics=['accuracy'])

# Creating Data for HD Attention LSTM Model

X_train, X_test, y_train, y_test = createTrainTest(stocks['HD'], features)
X_train_scaled, X_test_scaled = scaleTrainTest(X_train, X_test)
X_train_LSTM, X_test_LSTM, y_train_LSTM, y_test_LSTM = createDataLSTM(
    X_train_scaled, X_test_scaled, y_train, y_test, len(features), n_days=28, testSize=252)

# Training the HD Model 

modelHD.fit(X_train_LSTM, y_train_LSTM, epochs=50, batch_size=28, verbose=2)

Epoch 1/50
37/37 - 0s - loss: 0.6735 - accuracy: 0.5945
Epoch 2/50
37/37 - 0s - loss: 0.6432 - accuracy: 0.6053
Epoch 3/50
37/37 - 0s - loss: 0.6311 - accuracy: 0.6366
Epoch 4/50
37/37 - 0s - loss: 0.6183 - accuracy: 0.6719
Epoch 5/50
37/37 - 0s - loss: 0.6102 - accuracy: 0.6846
Epoch 6/50
37/37 - 0s - loss: 0.5975 - accuracy: 0.6983
Epoch 7/50
37/37 - 0s - loss: 0.5913 - accuracy: 0.7023
Epoch 8/50
37/37 - 0s - loss: 0.5854 - accuracy: 0.7150
Epoch 9/50
37/37 - 0s - loss: 0.5812 - accuracy: 0.7209
Epoch 10/50
37/37 - 0s - loss: 0.5745 - accuracy: 0.7209
Epoch 11/50
37/37 - 0s - loss: 0.5699 - accuracy: 0.7277
Epoch 12/50
37/37 - 0s - loss: 0.5698 - accuracy: 0.7238
Epoch 13/50
37/37 - 0s - loss: 0.5602 - accuracy: 0.7267
Epoch 14/50
37/37 - 0s - loss: 0.5625 - accuracy: 0.7267
Epoch 15/50
37/37 - 0s - loss: 0.5566 - accuracy: 0.7287
Epoch 16/50
37/37 - 0s - loss: 0.5550 - accuracy: 0.7326
Epoch 17/50
37/37 - 0s - loss: 0.5531 - accuracy: 0.7336
Epoch 18/50
37/37 - 0s - loss: 0.5478 - accuracy: 0.7316
Epoch 19/50
37/37 - 0s - loss: 0.5464 - accuracy: 0.7277
Epoch 20/50
37/37 - 0s - loss: 0.5439 - accuracy: 0.7346
Epoch 21/50
37/37 - 0s - loss: 0.5404 - accuracy: 0.7365
Epoch 22/50
37/37 - 0s - loss: 0.5405 - accuracy: 0.7356
Epoch 23/50
37/37 - 0s - loss: 0.5361 - accuracy: 0.7395
Epoch 24/50
37/37 - 0s - loss: 0.5335 - accuracy: 0.7375
Epoch 25/50
37/37 - 0s - loss: 0.5286 - accuracy: 0.7414
Epoch 26/50
37/37 - 0s - loss: 0.5303 - accuracy: 0.7434
Epoch 27/50
37/37 - 0s - loss: 0.5256 - accuracy: 0.7424
Epoch 28/50
37/37 - 0s - loss: 0.5200 - accuracy: 0.7542
Epoch 29/50
37/37 - 0s - loss: 0.5179 - accuracy: 0.7522
Epoch 30/50
37/37 - 0s - loss: 0.5187 - accuracy: 0.7532
Epoch 31/50
37/37 - 0s - loss: 0.5167 - accuracy: 0.7640
Epoch 32/50
37/37 - 0s - loss: 0.5157 - accuracy: 0.7551
Epoch 33/50
37/37 - 0s - loss: 0.5103 - accuracy: 0.7679
Epoch 34/50
37/37 - 0s - loss: 0.5094 - accuracy: 0.7708
Epoch 35/50
37/37 - 0s - loss: 0.5086 - accuracy: 0.7728
Epoch 36/50
37/37 - 0s - loss: 0.5012 - accuracy: 0.7757
Epoch 37/50
37/37 - 0s - loss: 0.5046 - accuracy: 0.7708
Epoch 38/50
37/37 - 0s - loss: 0.4994 - accuracy: 0.7718
Epoch 39/50
37/37 - 0s - loss: 0.5048 - accuracy: 0.7728
Epoch 40/50
37/37 - 0s - loss: 0.4975 - accuracy: 0.7796
Epoch 41/50
37/37 - 0s - loss: 0.4957 - accuracy: 0.7738
Epoch 42/50
37/37 - 0s - loss: 0.4940 - accuracy: 0.7757
Epoch 43/50
37/37 - 0s - loss: 0.4968 - accuracy: 0.7738
Epoch 44/50
37/37 - 0s - loss: 0.4927 - accuracy: 0.7826
Epoch 45/50
37/37 - 0s - loss: 0.4895 - accuracy: 0.7816
Epoch 46/50
37/37 - 0s - loss: 0.4826 - accuracy: 0.7845
Epoch 47/50
37/37 - 0s - loss: 0.4868 - accuracy: 0.7806
Epoch 48/50
37/37 - 0s - loss: 0.4887 - accuracy: 0.7816
Epoch 49/50
37/37 - 0s - loss: 0.4826 - accuracy: 0.7826
Epoch 50/50
37/37 - 0s - loss: 0.4782 - accuracy: 0.7865

<tensorflow.python.keras.callbacks.History at 0x7f5045c55048>

# Evaluating HD Model

modelHD.evaluate(X_test_LSTM, y_test_LSTM)

8/8 [==============================] - 0s 6ms/step - loss: 0.6860 - accuracy: 0.7222

[0.685989260673523, 0.7222222089767456]

# Plotting Metrics for HD Model

plotMetrics(modelHD, X_test_LSTM, y_test_LSTM, list(target_names.values()), 'HD')
plotTransitionProb(modelHD,stocks['HD'],X_test_LSTM,y_test_LSTM,'HD',testSize = 252)

		 HD Confusion Matrix

[[ 56  42]
 [ 28 126]]

		 HD Classification Report

              precision    recall  f1-score   support

   Down Move       0.67      0.57      0.62        98
     Up Move       0.75      0.82      0.78       154

    accuracy                           0.72       252
   macro avg       0.71      0.69      0.70       252
weighted avg       0.72      0.72      0.72       252

# Forecasting using HD Model on the test set

calcPnL(modelHD,stocks['HD'],X_test_LSTM,y_test_LSTM,threshold = 0.52, stock_name='HD')

# Creating the Attention LSTM Model for LOW

modelLOW = model(inputDays, unitsPreLSTM, unitsPostLSTM, unitsDenseAttention, len(features), name='model_LOW')
modelLOW.summary()

Model: "model_LOW"
__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
==================================================================================================
Input (InputLayer)              [(None, 28, 19)]     0                                            
__________________________________________________________________________________________________
PreAttention_LSTM (LSTM)        (None, 28, 128)      75776       Input[0][0]                      
__________________________________________________________________________________________________
Dense1_Attention (Dense)        (None, 28, 32)       4128        PreAttention_LSTM[0][0]          
__________________________________________________________________________________________________
Dense2_Attention (Dense)        (None, 28, 1)        33          Dense1_Attention[0][0]           
__________________________________________________________________________________________________
attention_weights (Activation)  (None, 28, 1)        0           Dense2_Attention[0][0]           
__________________________________________________________________________________________________
context (Dot)                   (None, 1, 128)       0           attention_weights[0][0]          
                                                                 PreAttention_LSTM[0][0]          
__________________________________________________________________________________________________
PostAttention_LSTM (LSTM)       (None, 32)           20608       context[0][0]                    
__________________________________________________________________________________________________
Output (Dense)                  (None, 1)            33          PostAttention_LSTM[0][0]         
==================================================================================================
Total params: 100,578
Trainable params: 100,578
Non-trainable params: 0
__________________________________________________________________________________________________

# Model Compile Settings for LOW

opt = Adam(lr=0.0004, beta_1=0.9, beta_2=0.999, decay=0.01)
modelLOW.compile(optimizer=opt, loss='binary_crossentropy', metrics=['accuracy'])

# Creating Data for LOW Attention LSTM Model

X_train, X_test, y_train, y_test = createTrainTest(stocks['LOW'], features)
X_train_scaled, X_test_scaled = scaleTrainTest(X_train, X_test)
X_train_LSTM, X_test_LSTM, y_train_LSTM, y_test_LSTM = createDataLSTM(
    X_train_scaled, X_test_scaled, y_train, y_test, len(features), n_days=28, testSize=252)

# Training the LOW Model 

modelLOW.fit(X_train_LSTM, y_train_LSTM, epochs=50, batch_size=28, verbose=2)

Epoch 1/50
37/37 - 0s - loss: 0.6824 - accuracy: 0.5690
Epoch 2/50
37/37 - 0s - loss: 0.6504 - accuracy: 0.6327
Epoch 3/50
37/37 - 0s - loss: 0.6281 - accuracy: 0.6494
Epoch 4/50
37/37 - 0s - loss: 0.6116 - accuracy: 0.6621
Epoch 5/50
37/37 - 0s - loss: 0.5992 - accuracy: 0.6876
Epoch 6/50
37/37 - 0s - loss: 0.5837 - accuracy: 0.7140
Epoch 7/50
37/37 - 0s - loss: 0.5805 - accuracy: 0.7052
Epoch 8/50
37/37 - 0s - loss: 0.5707 - accuracy: 0.7277
Epoch 9/50
37/37 - 0s - loss: 0.5625 - accuracy: 0.7316
Epoch 10/50
37/37 - 0s - loss: 0.5557 - accuracy: 0.7307
Epoch 11/50
37/37 - 0s - loss: 0.5561 - accuracy: 0.7267
Epoch 12/50
37/37 - 0s - loss: 0.5502 - accuracy: 0.7356
Epoch 13/50
37/37 - 0s - loss: 0.5461 - accuracy: 0.7326
Epoch 14/50
37/37 - 0s - loss: 0.5401 - accuracy: 0.7434
Epoch 15/50
37/37 - 0s - loss: 0.5406 - accuracy: 0.7356
Epoch 16/50
37/37 - 0s - loss: 0.5343 - accuracy: 0.7453
Epoch 17/50
37/37 - 0s - loss: 0.5299 - accuracy: 0.7434
Epoch 18/50
37/37 - 0s - loss: 0.5288 - accuracy: 0.7453
Epoch 19/50
37/37 - 0s - loss: 0.5294 - accuracy: 0.7385
Epoch 20/50
37/37 - 0s - loss: 0.5225 - accuracy: 0.7453
Epoch 21/50
37/37 - 0s - loss: 0.5232 - accuracy: 0.7414
Epoch 22/50
37/37 - 0s - loss: 0.5199 - accuracy: 0.7424
Epoch 23/50
37/37 - 0s - loss: 0.5148 - accuracy: 0.7444
Epoch 24/50
37/37 - 0s - loss: 0.5131 - accuracy: 0.7414
Epoch 25/50
37/37 - 0s - loss: 0.5099 - accuracy: 0.7385
Epoch 26/50
37/37 - 0s - loss: 0.5086 - accuracy: 0.7424
Epoch 27/50
37/37 - 0s - loss: 0.5026 - accuracy: 0.7444
Epoch 28/50
37/37 - 0s - loss: 0.5007 - accuracy: 0.7375
Epoch 29/50
37/37 - 0s - loss: 0.4970 - accuracy: 0.7405
Epoch 30/50
37/37 - 0s - loss: 0.5024 - accuracy: 0.7356
Epoch 31/50
37/37 - 0s - loss: 0.4970 - accuracy: 0.7444
Epoch 32/50
37/37 - 0s - loss: 0.4939 - accuracy: 0.7463
Epoch 33/50
37/37 - 0s - loss: 0.4930 - accuracy: 0.7365
Epoch 34/50
37/37 - 0s - loss: 0.4901 - accuracy: 0.7434
Epoch 35/50
37/37 - 0s - loss: 0.4856 - accuracy: 0.7424
Epoch 36/50
37/37 - 0s - loss: 0.4852 - accuracy: 0.7395
Epoch 37/50
37/37 - 0s - loss: 0.4828 - accuracy: 0.7385
Epoch 38/50
37/37 - 0s - loss: 0.4790 - accuracy: 0.7453
Epoch 39/50
37/37 - 0s - loss: 0.4802 - accuracy: 0.7414
Epoch 40/50
37/37 - 0s - loss: 0.4784 - accuracy: 0.7434
Epoch 41/50
37/37 - 0s - loss: 0.4740 - accuracy: 0.7473
Epoch 42/50
37/37 - 0s - loss: 0.4774 - accuracy: 0.7385
Epoch 43/50
37/37 - 0s - loss: 0.4747 - accuracy: 0.7444
Epoch 44/50
37/37 - 0s - loss: 0.4689 - accuracy: 0.7453
Epoch 45/50
37/37 - 0s - loss: 0.4704 - accuracy: 0.7473
Epoch 46/50
37/37 - 0s - loss: 0.4690 - accuracy: 0.7483
Epoch 47/50
37/37 - 0s - loss: 0.4701 - accuracy: 0.7473
Epoch 48/50
37/37 - 0s - loss: 0.4637 - accuracy: 0.7512
Epoch 49/50
37/37 - 0s - loss: 0.4650 - accuracy: 0.7483
Epoch 50/50
37/37 - 0s - loss: 0.4614 - accuracy: 0.7561

<tensorflow.python.keras.callbacks.History at 0x7f4fe73a6b70>

# Evaluating LOW Model

modelLOW.evaluate(X_test_LSTM, y_test_LSTM)

8/8 [==============================] - 0s 5ms/step - loss: 0.7432 - accuracy: 0.6071

[0.7431829571723938, 0.6071428656578064]

# Plotting Metrics for LOW Model

plotMetrics(modelLOW, X_test_LSTM, y_test_LSTM, list(target_names.values()), 'LOW')
plotTransitionProb(modelLOW,stocks['LOW'],X_test_LSTM,y_test_LSTM,'LOW',testSize = 252)

		 LOW Confusion Matrix

[[ 20  78]
 [ 21 133]]

		 LOW Classification Report

              precision    recall  f1-score   support

   Down Move       0.49      0.20      0.29        98
     Up Move       0.63      0.86      0.73       154

    accuracy                           0.61       252
   macro avg       0.56      0.53      0.51       252
weighted avg       0.57      0.61      0.56       252

# Forecasting using HD Model on the test set

calcPnL(modelLOW,stocks['LOW'],X_test_LSTM,y_test_LSTM,threshold = 0.52, stock_name='LOW')

	Open	High	Low	Close	Adj Close	Volume
Date
2013-12-31	81.989998	82.470001	81.720001	82.339996	71.085419	4493600
2014-01-02	82.110001	82.570000	81.800003	82.019997	70.809158	4253400
2014-01-03	81.910004	82.480003	81.830002	81.889999	70.696899	3897900
2014-01-06	81.650002	81.980003	81.099998	81.099998	70.014908	11188800
2014-01-07	81.309998	81.919998	81.080002	81.500000	70.360229	4630900