Long short-term memory (LSTM)¶
from IPython.display import Image
I. Principle of the algorithm¶
This algorithm consists of a neural network, more precisely a long short-term memory (LSTM) recurrent neural network.
The idea is to code an algorithm able to predict the next values of the signal 'Température palier étage 1' when given the preceding ones (the past values of 'Température palier étage 1', but also some other features that are independent enough of it). When a signal is fed to the program, we then compare the signal predicted by the LSTM with the actual following signal.
If the two signals are different enough (in a sense that will be defined later), the following signal will be considered as abnormal.
Below is a diagram of the LSTM structure that we use to predict the $(N+1)^{th}$ point when given the points ranging from $1$ to $N$.
Image(filename ='images_lstm/schema_lstm.jpg')
We then iterate the above structure $P$ times in order to predict the $P$ following points, using the actual points of the signal as inputs at every step. This step is illustrated below.
Image(filename ='images_lstm/schema_lstm_2.jpg')
II. Preparation of the datasets used for training and testing¶
We started by separating our data into several segments, each belonging to one of these two categories:
- Normal signals
- Abnormal signals (oscillations) preceded by normal signals
This segmentation was done on the signal 'Température palier étage 1', since it is the signal on which we intend to detect oscillations.
To do so, we used the labelling done previously. Nonetheless, we decided to relabel some values: notably, the 'normal' parts separating two 'abnormal' segments were often treated as abnormal, since we want the algorithm to detect a hazardous oscillation as soon as possible. In addition, we relabelled some 'ambiguous' values as 'abnormal'.
The first category of segments (normal signals) will later be used for training, while the second one (abnormal signals preceded by normal signals) will be used for testing.
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import torch as th
import csv
from torch import nn
from torch.utils.data import Dataset, DataLoader
from torch.utils.tensorboard import SummaryWriter
from torchviz import make_dot
%load_ext tensorboard
dico = {"Description" : "Point Name",
"MOTOR CURRENT" : "PARD@3C52@3C52-M@JT7099.CAL",
"Température palier étage 1" : "PARD@3C52@3C52-M@TE7011A.PNT",
"Température palier étage2" : "PARD@3C52@3C52-M@TE7021A.PNT",
"Température palier étage 3" : "PARD@3C52@3C52-M@TE7031A.PNT",
"Température palier étage 4" : "PARD@3C52@3C52-M@TE7041A.PNT",
"Déplacement axiale 1/2" : "PARD@3C52@3C52-M@VT7001.PNT:RAW",
"Déplacement axiale 3/4" : "PARD@3C52@3C52-M@VT7002.PNT:RAW",
"1e stade vibration X" : "PARD@3C52@3C52-M@VT7011A.PNT:RAW",
"1er stade vibration Y" : "PARD@3C52@3C52-M@VT7011B.PNT:RAW",
"2e stade vibration X" : "PARD@3C52@3C52-M@VT7021A.PNT:RAW",
"2e stade vibration Y" : "PARD@3C52@3C52-M@VT7021B.PNT:RAW",
"3e stade vibration X" : "PARD@3C52@3C52-M@VT7031A.PNT:RAW",
"3e stade vibration Y" : "PARD@3C52@3C52-M@VT7031B.PNT:RAW",
"4e stade vibration X" : "PARD@3C52@3C52-M@VT7041A.PNT:RAW",
"4e stade vibration Y" : "PARD@3C52@3C52-M@VT7041B.PNT:RAW",
"Température huile sortie réfrigerant" : "PARD@3C52@3C52@TE7086.PNT",
"labels" : "labels"}
device = "cuda" if th.cuda.is_available() else "cpu"
# use the GPU if one is available in order to speed up computation
print(device)
cuda
Below, we have represented the signal with the different segments that we identified as, respectively: normal, normal then abnormal, normal then abnormal, normal, normal then abnormal.
We have decided to precede every abnormal area with a normal area of 7000 points.
df = pd.read_csv("clean_data_huile.csv")
tempetage1 = df[['PARD@3C52@3C52-M@TE7011A.PNT','labels']]
value = tempetage1['PARD@3C52@3C52-M@TE7011A.PNT']
label = tempetage1['labels']
plt.figure(figsize = (15,6))
plt.grid()
plt.plot(value, label = "Signal of 'Température palier étage 1'")
plt.plot(0.2*label, label = "Labelling")
plt.vlines(10000, -2, 2, colors = 'r', label = "Segments that divide the dataset according to its type")
plt.vlines(43089, -2, 2, colors = 'r')
plt.vlines(66900, -2, 2, colors = 'r')
plt.vlines(100032, -2, 2, colors = 'r')
plt.legend()
plt.show()
The graph above shows how we split the data for training and testing.
df_train_1 = df[0: 10000] # first normal set
df_test_1 = df[14000:43089].reset_index() # first abnormal test set
df_test_2 = df[43089: 66900].reset_index() # second abnormal test set
df_train_2 = df[66900:100032] # second normal set
df_test_3 = df[100032:].reset_index() # third abnormal test set
df_train = pd.concat((df_train_1, df_train_2), axis = 0).reset_index() # train on all normal data
df_test = df_test_3[:5000] # normal prefix of the third test set, used to monitor the test loss during training
df_test_perf = df[43089:] # mixed normal/abnormal set used for the performance evaluation
III. The algorithm¶
The LSTM takes as input, at each time step, the 3 values of the 3 features at time $t$, and returns the feature "Température palier étage 1" at time $t+1$. More precisely, the three input features are "Température palier étage 1", "MOTOR CURRENT" and "Température huile sortie réfrigerant", which are sufficiently decorrelated.* The model is trained on normal data (with no anomaly) so that it predicts the signal correctly on a normal set and diverges when encountering an abnormal set. By computing the difference between the prediction and the actual data, it is therefore possible to tell whether there is an anomaly.
*See LSTM_ANNEXE for more information about the choice of features, in particular the influence of the number of features on the precision of the LSTM.
Preparation of the data¶
The next functions build the data fed into the LSTM.
input_features = [dico["Température palier étage 1"], dico["MOTOR CURRENT"], dico["Température huile sortie réfrigerant"]]
output_features = [dico["Température palier étage 1"]]
input_dim = len(input_features)
output_dim = len(output_features)
sample_size = 20
def compute(df, window) :
    """
    returns a dataframe where each row holds, for every input feature,
    its current value plus its (window - 1) previous values,
    added as shifted columns
    """
    df = df.loc[:, input_features].copy() # copy to avoid modifying the original dataframe
    for value in range(1, window) :
        for feature in input_features :
            # column "<feature><k>" contains the feature value k steps in the past
            df[feature + str(value)] = df[feature].shift(value)
    return df
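To make the shift logic of compute concrete, here is a toy example (illustrative values only, a single feature f, window = 3); each row ends up holding the current value and the two previous ones:
toy = pd.DataFrame({"f" : [0.1, 0.2, 0.3, 0.4]})
toy["f1"] = toy["f"].shift(1) # value at t-1
toy["f2"] = toy["f"].shift(2) # value at t-2
print(toy)
#      f   f1   f2
# 0  0.1  NaN  NaN
# 1  0.2  0.1  NaN
# 2  0.3  0.2  0.1
# 3  0.4  0.3  0.2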
def form_data(df, window) :
    """
    builds the (data, label) arrays fed to the LSTM
    from a dataframe prepared by compute
    """
    pred = 1 # we predict the next point
    df = compute(df, window)
    data = []
    label = []
    l = len(df)
    for rang in range(l - window - pred + 1) :
        local_data = []
        local_label = []
        # gather, for each feature, its window of past values (oldest first)
        for feature in input_features :
            local_data.append(list(df.loc[rang + window - 1, feature::len(input_features)])[::-1])
        # the label is the value of the output feature at the next time step
        for feature in output_features :
            if pred > 1 :
                local_label.append(list(df.loc[rang + window, feature : feature + str(pred - 1): len(input_features)])[::-1])
            elif pred == 1 :
                local_label.append(list(df.loc[rang + window, feature : feature]))
        data.append(local_data)
        label.append(local_label)
    # final shapes : (n_samples, window, n_features) for data, (n_samples, 1, 1) for label
    data = np.array([np.array(sample).T for sample in data])
    label = np.array(label)
    return data, label
data_train, labels_train = form_data(df_train, sample_size)
data_test, labels_test = form_data(df_test, sample_size)
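As a quick sanity check, the arrays returned by form_data should have the following shapes (one sample per sliding window):
print(data_train.shape) # (len(df_train) - sample_size, sample_size, input_dim)
print(labels_train.shape) # (len(df_train) - sample_size, 1, 1)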
Training¶
This step trains the LSTM: the model has to learn what normal data looks like, so that it becomes able to predict future points when the data is normal.
After a session of training, we test the model on test data.
We change the parameters to minimize the loss and obtain the most accurate model. The main parameters to modify are:
- sample_size : the size of the window (number of points taken to calculate the next one)
- batch_size : the number of samples the algorithm processes at each iteration
- learning_rate : the learning rate of the optimizer. It trades off accuracy against training time (the more slowly you go forward, the more accurate you are).
- nb_layers : the number of layers in the neural network
- hidden_size : the size of the LSTM output
- loss_func : the function used to calculate the difference between the prediction and the real signal
- optimizer : the function that we use to modify the weights and biases of the model (typically stochastic gradient descent or Adam optimizer)
- epoch : the number of times the model is trained on the dataset
After this tuning step, we chose the Adam optimizer and the following hyperparameters:
#Hyperparameters
sample_size = 20
batch_size = 100
num_workers = 8 #improves the speed of the training step
nb_layers = 1
learning_rate = 0.0001
hidden_size = 10
loss_func = th.nn.MSELoss()
min_epochs = 20
max_epochs = 60
The class FeaturesDataset wraps the data and the labels into a PyTorch Dataset, serving (sample, label) pairs.
class FeaturesDataset(Dataset) :
def __init__(self, data, labels) :
self.data = [th.tensor(values) for values in data]
self.labels = [th.tensor(label) for label in labels]
def __len__(self) :
return len(self.labels)
def __getitem__(self, idx) :
return self.data[idx], self.labels[idx]
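The training loop below relies on train_dataloader and test_dataloader, whose construction is not shown in this notebook; a minimal sketch, following the same pattern as the test dataloaders used later:
train_set = FeaturesDataset(data_train, labels_train)
test_set = FeaturesDataset(data_test, labels_test)
train_dataloader = DataLoader(train_set, batch_size = batch_size, shuffle = True, num_workers = num_workers) # shuffling is safe since every sample already contains its whole window
test_dataloader = DataLoader(test_set, batch_size = batch_size, shuffle = False, num_workers = num_workers)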
The LSTM model¶
The class below is the actual LSTM model. We have decided to use the LSTM module from the PyTorch library, followed by a non-linear function (ReLU), then a linear layer, and finally a Tanh function to return the result. This alternation of linear and non-linear functions improves the accuracy of the model; notably, it adds more parameters that can be optimized to fit the normal data more accurately.
All these choices have been made empirically to minimize the train and test losses.
writer = SummaryWriter()
class Model(nn.Module) :
def __init__(self, input_dim, output_dim) :
super(Model, self).__init__()
self.LSTM = th.nn.LSTM(input_dim, hidden_size, nb_layers, batch_first = True, bidirectional = False)
self.non_lin = th.nn.ReLU()
self.lin = th.nn.Linear(hidden_size, output_dim)
self.lr = learning_rate
self.loss_function = loss_func
    def forward(self, x) :
        x, _ = self.LSTM(x)        # x : (batch, window, hidden_size)
        x = x[:, -1, :].squeeze()  # keep only the output of the last time step
        x = self.non_lin(x)
        x = self.lin(x)
        return th.nn.Tanh()(x)
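A quick shape check of the forward pass (a sketch with a random batch):
sanity_model = Model(input_dim = input_dim, output_dim = output_dim).to(device)
dummy = th.randn(batch_size, sample_size, input_dim).to(device)
print(sanity_model(dummy).shape) # th.Size([batch_size, output_dim]), i.e. one predicted point per sample
# note : the squeeze() in forward is a no-op here since batch_size > 1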
def training() :
    """
    trains the LSTM and evaluates it on the test set every other epoch
    """
    model = Model(input_dim = input_dim, output_dim = output_dim).to(device)
    optimizer = th.optim.Adam(model.parameters(), lr = learning_rate)
    test_loss_global = 10 # arbitrarily large initial value
    epoch = 0
    arret = False
    while not arret :
        epoch += 1
        batch_loss = 0
        for data, target in train_dataloader :
            data = data.float().to(device)
            target = target.squeeze().unsqueeze(1).to(device)
            optimizer.zero_grad()
            output = model(data) # one prediction per sample of the batch
            loss = loss_func(output.float(), target.float())
            loss.backward()
            optimizer.step()
            batch_loss += loss.item()
        if epoch % 2 == 0 :
            writer.add_scalar("train_loss", batch_loss, epoch)
            print(f"epoch = {epoch}")
            test_loss = 0
            with th.no_grad() : # no gradients needed for evaluation
                for data, target in test_dataloader :
                    data = data.float().to(device)
                    target = target.squeeze().unsqueeze(1).to(device)
                    output = model(data)
                    loss = loss_func(output.float(), target.float())
                    test_loss += loss.item()
            print(test_loss)
            writer.add_scalar("test_loss", test_loss, epoch)
            # stop when the test loss starts increasing (early stopping) or after max_epochs
            if (test_loss > test_loss_global and epoch > min_epochs) or epoch > max_epochs :
                print(epoch)
                arret = True
            test_loss_global = test_loss
    writer.flush()
    writer.close()
    return model
We have decided not to include the actual training run in this notebook, since the code takes time to execute; the code above is nonetheless the one we used.
At the end of the training step, we had a test_loss of about $10^{-5}$. We saved this model in the file 'model_complet_lstm.pt', which we load below.
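For reference, the save step amounts to the following (a sketch, assuming training() returns the trained model as written above):
model = training()
th.save(model, 'model_complet_lstm.pt')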
A test on a normal set not in the training set¶
model = th.load('model_complet_lstm.pt')
Of course, the test step is done on data distinct from the training data. For these tests, we use the following functions: model_prediction to run the model and show_curve_diff to plot the results.
def model_prediction(model, dataloader) :
    """
    applies the LSTM model to a dataset
    returns the actual curve and the predicted curve
    """
    courbe_theo = []
    courbe_calc = []
    with th.no_grad() : # inference only
        for data, target in dataloader :
            data = data.float().to(device)
            target = target.to(device)
            output = model(data)
            # flatten the batched outputs and targets into flat lists of points
            for i in output :
                for j in i :
                    courbe_calc.append(j.item())
            for k in target :
                for j in k :
                    courbe_theo.append(j.item())
    return courbe_theo, courbe_calc
def show_curve_diff(courbe_theo, courbe_calc, threshold = 0.001, tolerance = 5, alerts = []) :
"""
plots the superposition of the actual and predicted curve
and the difference between these two curves compared with the threshold applied to the data
"""
plt.figure(figsize = (30, 6))
for rang, valeur in enumerate(alerts) :
if valeur == 2 :
plt.vlines(rang, -.5, .5, colors='r')
elif valeur == 1 :
plt.vlines(rang, -.5, .5, colors='orange')
plt.plot(courbe_theo, label = 'Real signal')
plt.plot(courbe_calc, label = 'Prediction')
plt.legend()
plt.show()
plt.figure(figsize = (30, 6))
diff = np.array(courbe_theo) - np.array(courbe_calc)
plt.plot(diff, label = 'Difference between real and prediction')
limit = threshold*tolerance
plt.hlines([-limit, limit], 0, len(courbe_theo), color = 'r', label = 'Threshold * tolerance')
plt.legend()
plt.show()
val = FeaturesDataset(data_test, labels_test)
test_dataloader_normal = DataLoader(val, batch_size = batch_size, shuffle = False, num_workers = num_workers)
show_curve_diff(*model_prediction(model, test_dataloader_normal))
We can see in the figure above that the curve predicted by the LSTM fits the real curve very well. A few peaks go below or above the limit that we set (see below for how this value was determined), but these false alarms are tolerable since they are rare.
Testing on abnormal sets¶
data_l_test_1, labels_l_test_1 = form_data(df_test_1, sample_size)
data_l_test_2, labels_l_test_2 = form_data(df_test_2, sample_size)
data_l_test_3, labels_l_test_3 = form_data(df_test_3, sample_size)
val_1 = FeaturesDataset(data_l_test_1, labels_l_test_1)
val_2 = FeaturesDataset(data_l_test_2, labels_l_test_2)
val_3 = FeaturesDataset(data_l_test_3, labels_l_test_3)
test_dataloader_1 = DataLoader(val_1, batch_size = batch_size, shuffle = False, num_workers = num_workers)
test_dataloader_2 = DataLoader(val_2, batch_size = batch_size, shuffle = False, num_workers = num_workers)
test_dataloader_3 = DataLoader(val_3, batch_size = batch_size, shuffle = False, num_workers = num_workers)
show_curve_diff(*model_prediction(model, test_dataloader_1))
show_curve_diff(*model_prediction(model, test_dataloader_2))
show_curve_diff(*model_prediction(model, test_dataloader_3))
When tested on abnormal data, the LSTM's prediction does not fit the actual signal. Thus, we declare a set of data abnormal when the difference between the real and the predicted signals exceeds a certain threshold multiplied by a tolerance.
We take a threshold of $10^{-3}$ since the prediction error on normal data stays below $10^{-3}$.
We explain later in this notebook how the default value of the tolerance (which can be modified by the user) was set.
IV. Global solution (comparing prediction and real signal)¶
Raising an alarm when encountering an anomaly¶
The following section defines and implements the criteria for raising an alarm when an anomaly is detected.
The steps are the following:
- Run the neural network model on the last 5000 points (length_input)
- Compare the predicted signal with the actual one by computing the difference between the two
- Label the points where the difference between the two signals is greater than threshold*tolerance
- In order not to label as normal an area closely preceded by abnormal data, we use a buffer_time (agreed jointly with the other groups' algorithms) corresponding to the length of the area over which we maintain an alert status after an anomaly. The anomaly will be shown in RED and the hazardous area (buffer) in ORANGE.
- Finally, in order not to maintain an alert status on normal data, the orange area is displayed only when the preceding period of length buffer_time (i.e. the last 3.5 days) contains at least 12 anomalous points (i.e. 2 hours) cumulated.
threshold = 0.001
length_input = 5000 + sample_size # 5000 predicted points; the first sample_size points only serve as inputs
buffer_time = 504 # 504 points, i.e. 3.5 days at one point every 10 minutes
def local_anomaly(predicted_signal, actual_signal, threshold, tolerance) :
"""
returns a boolean indicating if the given signals differ by more than threshold*tolerance anywhere on the period
"""
predicted_signal = np.array(predicted_signal)
actual_signal = np.array(actual_signal)
diff = actual_signal - predicted_signal
max_diff = max(abs(diff))
if max_diff > threshold * tolerance :
return True
return False
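For instance, with the default threshold of 0.001 and a tolerance of 5, the alert fires as soon as the pointwise difference exceeds 0.005:
print(local_anomaly([0.50], [0.51], 0.001, 5)) # True : |diff| = 0.01 > 0.005
print(local_anomaly([0.50], [0.503], 0.001, 5)) # False : |diff| = 0.003 <= 0.005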
def anomaly(dataframe, length_input, tolerance = 5, threshold = 0.001, plot = True) :
"""
    returns the actual curve, the predicted curve and a list of ints
    giving the colour of every point : 0 (green), 1 (orange) or 2 (red)
"""
dataframe_calc = dataframe.loc[len(dataframe) - length_input:, :]
dataframe_calc = dataframe_calc.reset_index(drop = True)
data, labels = form_data(dataframe_calc, sample_size)
inp = FeaturesDataset(data, labels)
dataloader = DataLoader(inp, batch_size = batch_size, shuffle = False, num_workers = num_workers)
courbe_theo, courbe_calc = model_prediction(model, dataloader)
    alerts = []
    # first pass : flag every point whose prediction error exceeds threshold * tolerance
    for point_calc, point_theo in zip(courbe_calc, courbe_theo) :
        if local_anomaly([point_calc], [point_theo], threshold, tolerance) :
            alerts.append(1)
        else:
            alerts.append(0)
    # second pass : anomalies become red (2) ; a point becomes orange (1) when the
    # preceding buffer_time window contains at least 12 red points
    for rang, valeur in enumerate(alerts) :
        if valeur == 1 :
            alerts[rang] = 2 # red
        elif rang >= buffer_time and alerts[rang - buffer_time:rang].count(2) >= 12 :
            alerts[rang] = 1 # orange
        else:
            alerts[rang] = 0 # green
if plot :
show_curve_diff(courbe_theo, courbe_calc, alerts = alerts, tolerance = tolerance, threshold = threshold)
return courbe_theo, courbe_calc, alerts
_,_,_ = anomaly(df.loc[80000:90000].reset_index(), length_input)
On this normal dataset, we can see that, logically enough, very few anomalies are detected, and none of them persists long enough to trigger the display of an orange alert area.
Performance in terms of accuracy¶
In this section, we evaluate the performance of our algorithm on a test set, df_test_perf, composed of both normal and abnormal data.
We evaluate this performance by computing the recall $\left(\frac{\text{true positives}}{\text{actual anomalies}}\right)$, the precision $\left(\frac{\text{true positives}}{\text{true positives} + \text{false positives}}\right)$ and the number of false negatives.
tolerance = 5
length_input = 92000 + sample_size # increased from 5000 to 92000 so that the whole (large) dataframe df_test_perf is evaluated
def transform_0_1(i) :
if i != 0 : return 1
return 0
def performances(df, tolerance) :
    label = list(df['labels'])
    # binarise the labels and drop the first sample_size points (only used as model inputs)
    label_0_1 = [transform_0_1(i) for i in label][sample_size:]
    nb_error = label_0_1.count(1)
    true_positives = 0
    false_positives = 0
    false_negatives = 0
    true_negatives = 0
    courbe_theo, courbe_calc, alerts = anomaly(df, length_input=len(df), tolerance = tolerance)
    # alerts contains 0 (green), 1 (orange) or 2 (red); orange and red both count as alerts
    for prediction, real in zip(alerts, label_0_1) :
        if prediction == real :
            if prediction == 1:
                true_positives += 1
            else:
                true_negatives += 1
        else:
            if prediction == 0 :
                false_negatives += 1
            elif prediction == 1:
                false_positives += 1
            else: # prediction == 2 (red)
                if real == 1 :
                    true_positives += 1
                else:
                    false_positives += 1
    recall = true_positives / nb_error
    precision = true_positives / (true_positives + false_positives)
    return recall, precision, false_negatives
Tolerance : 1 --> Recall : 1.0 -- Precision : 0.262750285611208 -- False negatives : 0
Image(filename ='images_lstm/im1.png')
Tolerance : 2 --> Recall : 0.9993592384090805 -- Precision : 0.39346596028399466 -- False negatives : 14
Image(filename ='images_lstm/im2.png')
Tolerance : 3 --> Recall : 0.9885578287335804 -- Precision : 0.44596547737033365 -- False negatives : 250
Image(filename ='images_lstm/im3.png')
Tolerance : 4 --> Recall : 0.9860863197400339 -- Precision : 0.5091815754023586 -- False negatives : 304
Image(filename ='images_lstm/im4.png')
Tolerance : 5 --> Recall : 0.9813263764932033 -- Precision : 0.5623868852459016 -- False negatives : 408
Image(filename ='images_lstm/im5.png')
Tolerance : 6 --> Recall : 0.9753764474346652 -- Precision : 0.5923177409044165 -- False negatives : 538
Image(filename ='images_lstm/im6.png')
Tolerance : 7 --> Recall : 0.9602270126779258 -- Precision : 0.6091400034841182 -- False negatives : 869
Image(filename ='images_lstm/im7.png')
Tolerance : 8 --> Recall : 0.9572520481486567 -- Precision : 0.6098556640909754 -- False negatives : 934
Image(filename ='images_lstm/im8.png')
Tolerance : 9 --> Recall : 0.9553297633758983 -- Precision : 0.6111794331225111 -- False negatives : 976
Image(filename ='images_lstm/im9.png')
Below are summarised the recall, precision and number of false negatives obtained for the different values of the tolerance:

| Tolerance | Recall | Precision | False negatives |
|---|---|---|---|
| 1 | 1.000 | 0.263 | 0 |
| 2 | 0.999 | 0.393 | 14 |
| 3 | 0.989 | 0.446 | 250 |
| 4 | 0.986 | 0.509 | 304 |
| 5 | 0.981 | 0.562 | 408 |
| 6 | 0.975 | 0.592 | 538 |
| 7 | 0.960 | 0.609 | 869 |
| 8 | 0.957 | 0.610 | 934 |
| 9 | 0.955 | 0.611 | 976 |
The number of false negatives, which might seem significant at first sight, is not that critical, since many false negatives actually appear between alerts.
The table above justifies the choice of 5 as the default value of the tolerance (modifiable by the user).
This choice gives a $F_{1}$ score of : $$F_1 = \frac{2}{\frac{1}{recall}+\frac{1}{precision}} = 0.71$$
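This value can be checked directly from the table above:
recall, precision = 0.9813, 0.5624
print(2 / (1 / recall + 1 / precision)) # ≈ 0.715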
This $F_1$ score could be improved with other values of the tolerance, but we have decided to favour a low number of false negatives, since too high a false negative rate would be too risky.
Performance in terms of speed¶
In this section, the Y axis represents the position in the dataset; the X axis is only used for display. The red horizontal lines mark the labelled anomalies on the Y axis, and every blue point is an anomaly detected by the LSTM.
def speed_evaluation(tolerance) :
    """
    scans the whole dataset df in chunks of 50 points,
    records the positions where an alert (red or orange) is raised,
    and plots them against the labelled anomalies
    """
    stop = False
    count = 0
    lst = []
    while not stop :
        chunk = df[count:count + 50].reset_index()
        count += 50
        ano = anomaly(chunk, 50, tolerance = tolerance, plot = False)[2]
        if 2 in ano or 1 in ano :
            lst.append(count)
            print(count)
        if count >= 135000 :
            stop = True
    plt.scatter(np.arange(len(lst)), lst)
    label_index = label[label != 0].index
    plt.plot(lst)
    print(len(lst))
    plt.hlines(label_index, 0, 1400, color = 'r')
    plt.show()
Tolerance = 1¶
Image(filename ='images_lstm/rapidity1.png')
As the graph above illustrates, with a tolerance of 1 the LSTM flags some errors during normal periods. On the other hand, it is very efficient at detecting anomalies: many points fall inside the red zones and the blue curve stays in them for a long time.
The moment when detection begins can be estimated by looking at the first concentration of blue dots approaching each red zone. The results are quite similar for the 3 zones: the LSTM flags the anomaly very early, because it raises alerts very frequently.
Tolerance = 5¶
A tolerance of 5 gives better results, in particular by not flagging too many errors on normal data. The anomalies are this time detected about 500 points before the red zone. Since the computation takes a long time, only an image of the result is shown, but one may reproduce it with the function speed_evaluation.
Image(filename ='images_lstm/rapidity5.png')
V. Conclusion¶
To conclude, we have created an algorithm that uses an LSTM neural network to predict the signal and compare it with the actual one. When these two signals differ enough, an anomaly is declared.
We have decided (jointly with the other groups) to use a colour code to indicate abnormal areas (red) and hazardous areas (orange).
Performance¶
Our LSTM model has proven very effective on the test data of the given period. The areas that we had labelled as abnormal are clearly identified by the algorithm, since they appear either in red or in orange.
The parameters that we chose limit the number of false negatives without causing too many false positives.
With the chosen parameters, our algorithm has a recall of $0.98$ and a precision of $0.56$.
Limits¶
As explained above, the apparently significant number of false negatives is not such a problem, since these points are mostly accumulated in zones where the algorithm has already detected anomalies.
The precision could probably be improved, notably by training on more data, which would decrease the number of false alerts. However, favouring recall over precision was an engineering choice, since the phenomenon we intend to detect is rare but might have serious consequences.
Finally, this algorithm would probably need re-training on other datasets in order to adapt to different types of data, in particular if we want to generalize on other machines.