Repository: MegaJoctan/MALE5
Branch: MQL5-ML
Commit: d6541568aaba
Files: 47
Total size: 473.0 KB
Directory structure:
gitextract_ly_vy9wi/
├── .github/
│ └── FUNDING.yml
├── .gitignore
├── Examples/
│ ├── Classifier Model Example.mq5
│ └── Regressor Model Example.mq5
├── LICENSE
├── MqPlotLib/
│ └── plots.mqh
├── Neural Networks/
│ ├── Pattern Nets.mqh
│ ├── README.md
│ ├── Regressor Nets.mqh
│ ├── initializers.mqh
│ ├── kohonen maps.mqh
│ └── optimizers.mqh
├── Numpy/
│ └── Numpy.mqh
├── Pandas/
│ ├── Incremental LE.mqh
│ └── pandas.mqh
├── README.md
├── Sklearn/
│ ├── Cluster/
│ │ ├── DBSCAN.mqh
│ │ ├── Hierachical Clustering.mqh
│ │ ├── KMeans.mqh
│ │ └── base.mqh
│ ├── Decomposition/
│ │ ├── LDA.mqh
│ │ ├── NMF.mqh
│ │ ├── PCA.mqh
│ │ ├── README.md
│ │ ├── TruncatedSVD.mqh
│ │ └── base.mqh
│ ├── Ensemble/
│ │ ├── AdaBoost.mqh
│ │ ├── README.md
│ │ └── Random Forest.mqh
│ ├── Linear Models/
│ │ ├── Linear Regression.mqh
│ │ ├── Logistic Regression.mqh
│ │ ├── README.md
│ │ └── Ridge.mqh
│ ├── Naive Bayes/
│ │ ├── Naive Bayes.mqh
│ │ ├── README.md
│ │ └── naive bayes visuals.py
│ ├── Neighbors/
│ │ └── KNN_nearest_neighbors.mqh
│ ├── Tree/
│ │ ├── README.md
│ │ └── tree.mqh
│ ├── metrics.mqh
│ └── preprocessing.mqh
├── Stats Models/
│ ├── ADF.mqh
│ ├── ARIMA.mqh
│ └── OLS.mqh
├── Tensors.mqh
├── Utils.mqh
└── requirements.txt
================================================
FILE CONTENTS
================================================
================================================
FILE: .github/FUNDING.yml
================================================
# These are supported funding model platforms
ko_fi: omegajoctan
custom: ['https://www.mql5.com/en/users/omegajoctan/seller', 'https://www.buymeacoffee.com/omegajoctan']
================================================
FILE: .gitignore
================================================
*.ex5
*.psd
*.zip
*.rar
*.xlsx
Todo's.txt
logisticwiki.txt
/venv
/Neural Nets Pro
================================================
FILE: Examples/Classifier Model Example.mq5
================================================
//+------------------------------------------------------------------+
//| Classifier Model Sample.mq5 |
//| Copyright 2023, Omega Joctan |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2023, Omega Joctan"
#property link "https://www.mql5.com/en/users/omegajoctan"
#property version "1.00"
#include
#include
#include //helper functions for data manipulations
#include //for measuring the performance
StandardizationScaler scaler; //standardization scaler from preprocessing.mqh
CDecisionTreeClassifier *decision_tree; //a decision tree classifier model
MqlRates rates[];
//+------------------------------------------------------------------+
//| Expert initialization function |
//+------------------------------------------------------------------+
int OnInit()
  {
//--- Model selection: a decision tree classifier from the DecisionTree class
   decision_tree = new CDecisionTreeClassifier(2, 5);

//--- Collect the training data
   vector open, high, low, close;
   int data_size = 1000;

//--- Getting the open, high, low and close values for the past 1000 bars,
//    starting from the most recent closed bar (shift 1)
   open.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_OPEN, 1, data_size);
   high.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_HIGH, 1, data_size);
   low.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_LOW, 1, data_size);
   close.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_CLOSE, 1, data_size);

   matrix X(data_size, 3); //feature matrix: one column each for open, high and low

//--- Assigning the open, high, and low price values to the x matrix
   X.Col(open, 0);
   X.Col(high, 1);
   X.Col(low, 2);

//--- Target variable: 1 (buy) when the candle closed bullish, 0 (sell) otherwise.
//    NOTE(review): this loop was reconstructed from a truncated source line —
//    confirm against the upstream repository.
   vector y(data_size);
   for (int i=0; i<data_size; i++)
     {
      if (close[i]>open[i]) //a bullish candle appeared
         y[i] = 1;          //buy signal
      else
         y[i] = 0;          //sell signal
     }

//--- We split the data into training and testing samples for training and evaluation
   matrix X_train, X_test;
   vector y_train, y_test;
   double train_size = 0.7; //70% of the data for training, the rest for testing
   int random_state = 42;   //fixed seed: shuffles the rows reproducibly so the model learns patterns, not the order of the dataset
   MatrixExtend::TrainTestSplitMatrices(X, y, X_train, y_train, X_test, y_test, train_size, random_state);

//--- Normalizing the independent variables: fit the scaler on the training
//    sample only, then transform both samples with the fitted parameters
   X_train = scaler.fit_transform(X_train);
   X_test = scaler.transform(X_test);

//--- Training the model
   decision_tree.fit(X_train, y_train);

//--- Measuring predictive accuracy on the training sample
   vector train_predictions = decision_tree.predict_bin(X_train);
   Print("Training results classification report");
   Metrics::classification_report(y_train, train_predictions);

//--- Evaluating the model on out-of-sample predictions
   vector test_predictions = decision_tree.predict_bin(X_test);
   Print("Testing results classification report");
   Metrics::classification_report(y_test, test_predictions);

//--- rates[] is read in OnTick with index 0 meaning the most recent bar
   ArraySetAsSeries(rates, true);
   return(INIT_SUCCEEDED);
  }
//+------------------------------------------------------------------+
//| Expert deinitialization function |
//+------------------------------------------------------------------+
void OnDeinit(const int reason)
  {
//--- Free the AI model object; guard the pointer the same way the library
//    destructors do (see CRegressorNets::~CRegressorNets) so an invalid
//    pointer is never deleted
   if (CheckPointer(decision_tree) != POINTER_INVALID)
      delete decision_tree;
  }
//+------------------------------------------------------------------+
//| Expert tick function |
//+------------------------------------------------------------------+
void OnTick()
  {
//--- Build the feature vector from the most recent closed daily candle,
//    mirroring the column layout used during training (open, high, low)
   CopyRates(Symbol(), PERIOD_D1, 1, 3, rates);

   vector features = {rates[0].open, rates[0].high, rates[0].low};
   features = scaler.transform(features); //apply the scaler fitted on the training data

//--- Classify the candle and display the resulting trade signal on the chart
   int signal = (int)decision_tree.predict_bin(features);
   string direction = (signal == 1) ? "BUY" : "SELL";
   Comment("Signal = ", direction);
  }
//+------------------------------------------------------------------+
================================================
FILE: Examples/Regressor Model Example.mq5
================================================
//+------------------------------------------------------------------+
//| Regressor Model sample.mq5 |
//| Copyright 2023, Omega Joctan |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2023, Omega Joctan"
#property link "https://www.mql5.com/en/users/omegajoctan"
#property version "1.00"
#include
#include
#include //helper functions for data manipulations
#include //for measuring the performance
StandardizationScaler scaler; //standardization scaler from preprocessing.mqh
CDecisionTreeRegressor *decision_tree; //a decision tree classifier model
MqlRates rates[];
//+------------------------------------------------------------------+
//| Expert initialization function |
//+------------------------------------------------------------------+
int OnInit()
  {
//--- Model selection: a decision tree regressor from the DecisionTree class
   decision_tree = new CDecisionTreeRegressor(2, 5);

   vector open, high, low, close;
   int data_size = 1000; //bars

//--- Getting the open, high, low and close values for the past 1000 bars,
//    starting from the most recent closed bar (shift 1)
   open.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_OPEN, 1, data_size);
   high.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_HIGH, 1, data_size);
   low.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_LOW, 1, data_size);
   close.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_CLOSE, 1, data_size);

   matrix X(data_size, 3); //feature matrix: one column each for open, high and low

//--- Assigning the open, high, and low price values to the x matrix
   X.Col(open, 0);
   X.Col(high, 1);
   X.Col(low, 2);

   vector y = close; //The target variable is the close price: given open, high and low we want to predict the closing price

//--- We split the data into training and testing samples for training and evaluation
   matrix X_train, X_test;
   vector y_train, y_test;
   double train_size = 0.7; //70% of the data for training, the remaining 30% for testing
   int random_state = 42;   //fixed seed: shuffles the rows reproducibly so the model learns patterns, not the order of the dataset
   MatrixExtend::TrainTestSplitMatrices(X, y, X_train, y_train, X_test, y_test, train_size, random_state);

//--- Normalizing the independent variables: fit the scaler on the training
//    sample only, then transform both samples with the fitted parameters
   X_train = scaler.fit_transform(X_train);
   X_test = scaler.transform(X_test);

//--- Training the model
   decision_tree.fit(X_train, y_train);

//--- Measuring predictive accuracy; the same Metrics::r_squared call is used
//    for both samples (the original mixed two different metric APIs)
   vector train_predictions = decision_tree.predict(X_train);
   printf("Decision tree training r2_score = %.3f ", Metrics::r_squared(y_train, train_predictions));

//--- Evaluating the model on out-of-sample predictions
   vector test_predictions = decision_tree.predict(X_test);
   printf("Decision tree out-of-sample r2_score = %.3f ", Metrics::r_squared(y_test, test_predictions));

//--- OnTick reads rates[0] expecting the most recent closed bar; without this
//    call CopyRates fills the array oldest-first (the classifier example sets it)
   ArraySetAsSeries(rates, true);

   return(INIT_SUCCEEDED);
  }
//+------------------------------------------------------------------+
//| Expert deinitialization function |
//+------------------------------------------------------------------+
void OnDeinit(const int reason)
  {
//--- Free the AI model object; guard the pointer the same way the library
//    destructors do (see CRegressorNets::~CRegressorNets) so an invalid
//    pointer is never deleted
   if (CheckPointer(decision_tree) != POINTER_INVALID)
      delete decision_tree;
  }
//+------------------------------------------------------------------+
//| Expert tick function |
//+------------------------------------------------------------------+
//--- Makes a live forecast of the next closing price on every incoming tick.
void OnTick()
{
//--- Making predictions live from the market
CopyRates(Symbol(), PERIOD_D1, 1, 3, rates); //Get the very recent information from the market
// NOTE(review): rates[] is not set as a series array in this example (the
// classifier example calls ArraySetAsSeries), so rates[0] may be the oldest
// of the 3 copied bars rather than the most recent — confirm intended indexing.
vector x = {rates[0].open, rates[0].high, rates[0].low}; //Assigning data from the recent candle in a similar way to the training data
x = scaler.transform(x); //apply the scaler fitted on the training data; never re-fit on live data
double predicted_close_price = decision_tree.predict(x); //regression output: the forecast close price
Comment("Next closing price predicted is = ",predicted_close_price);
}
//+------------------------------------------------------------------+
================================================
FILE: LICENSE
================================================
MIT License
Copyright (c) 2023 Omega Joctan
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
================================================
FILE: MqPlotLib/plots.mqh
================================================
//+------------------------------------------------------------------+
//| plots.mqh |
//| Copyright 2022, Fxalgebra.com |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2022, Fxalgebra.com"
#property link "https://www.mql5.com/en/users/omegajoctan"
//+------------------------------------------------------------------+
//| defines |
//+------------------------------------------------------------------+
#include
#include
//--- Thin wrapper around the standard-library CGraphic object for drawing
//    curve plots inside a chart window.
class CPlots
{
protected:
CGraphic *graph; //underlying graphic object, allocated in the constructor
long m_chart_id; //target chart id (0 = current chart)
int m_subwin; //chart sub-window index the plot is drawn in
int m_x1, m_x2; //left/right pixel bounds of the plot area
int m_y1, m_y2; //top/bottom pixel bounds of the plot area
string m_font_family; //font used for plot text (default "Consolas")
bool m_chart_show; //whether the plot should be displayed on the chart
string m_plot_names[]; //presumably the names of plots created so far — confirm against GraphCreate
ENUM_CURVE_TYPE m_curve_type; //curve style used by the most recent Plot call
bool GraphCreate(string plot_name); //builds the CGraphic canvas for a named plot
vector m_x, m_y; //data series of the most recent plot
string x_label, y_label; //axis labels of the most recent plot
public:
CPlots(long chart_id=0, int sub_win=0 ,int x1=30, int y1=40, int x2=550, int y2=310, string font_family="Consolas", bool chart_show=true);
~CPlots(void);
bool Plot(string plot_name, vector& x, vector& y, string x_axis_label, string y_axis_label, string label, ENUM_CURVE_TYPE curve_type=CURVE_POINTS_AND_LINES,color clr = clrDodgerBlue, bool points_fill = true); //draws y against x as a named curve; returns false on failure
bool AddPlot(vector &v,string label="plt",color clr=clrOrange); //adds another curve to the existing plot; returns false on failure
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Constructor: stores the chart placement/appearance settings,     |
//| allocates the graphic object and refreshes the target chart.     |
//+------------------------------------------------------------------+
CPlots::CPlots(long chart_id=0, int sub_win=0 ,int x1=30, int y1=40, int x2=550, int y2=310, string font_family="Consolas", bool chart_show=true)
  {
//--- cache the configuration supplied by the caller
   m_chart_id    = chart_id;
   m_subwin      = sub_win;
   m_x1          = x1;
   m_y1          = y1;
   m_x2          = x2;
   m_y2          = y2;
   m_font_family = font_family;
   m_chart_show  = chart_show;

//--- allocate the drawing surface and repaint the chart it targets
   graph = new CGraphic();
   ChartRedraw(m_chart_id);
  }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CPlots::~CPlots(void)
{
for (int i=0; i
#include
#ifndef RANDOM_STATE
#define RANDOM_STATE 42
#endif
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Bounded (squashing) activation functions exposed for pattern/classification
//    networks. Each enumerator aliases the corresponding built-in
//    ENUM_ACTIVATION_FUNCTION constant, so a value can be cast directly when
//    calling matrix/vector Activation().
enum activation
{
AF_HARD_SIGMOID_ = AF_HARD_SIGMOID,
AF_SIGMOID_ = AF_SIGMOID,
AF_SWISH_ = AF_SWISH,
AF_SOFTSIGN_ = AF_SOFTSIGN,
AF_TANH_ = AF_TANH
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Feed-forward neural network for pattern recognition (classification).
//    Weights and biases are generated at construction; the class exposes only
//    forward passes — no training method is declared here.
class CPatternNets
{
private:
vector W_CONFIG; //number of weights per layer (filled by the constructor)
vector W; //Weights vector — all layers flattened end-to-end
vector B; //Bias vector — all layers flattened end-to-end
activation A_FX; //activation function applied in every layer
protected:
ulong inputs; //number of input features (columns of the x matrix)
ulong outputs; //number of output nodes = number of unique classes in y
ulong rows; //number of rows in the training matrix
vector HL_CONFIG; //nodes per hidden layer, with the output layer appended
bool SoftMaxLayer; //if true, the last layer applies SoftMax instead of A_FX
vector classes; //unique class labels found in the target vector
void SoftMaxLayerFX(matrix &mat); //applies SoftMax to the output-layer matrix
public:
CPatternNets(matrix &xmatrix, vector &yvector,vector &HL_NODES, activation ActivationFx, bool SoftMaxLyr=false);
~CPatternNets(void);
int PatternNetFF(vector &in_vector); //forward pass: predicted class label for one sample
vector PatternNetFF(matrix &xmatrix); //forward pass: predicted labels, one per row
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CPatternNets::CPatternNets(matrix &xmatrix, vector &yvector,vector &HL_NODES, activation ActivationFx, bool SoftMaxLyr=false)
{
A_FX = ActivationFx;
inputs = xmatrix.Cols();
rows = xmatrix.Rows();
SoftMaxLayer = SoftMaxLyr;
//--- Normalize data
if (rows != yvector.Size())
{
Print(__FUNCTION__," FATAL | Number of rows in the x matrix is not the same the y vector size ");
return;
}
classes = MatrixExtend::Unique(yvector);
outputs = classes.Size();
HL_CONFIG.Copy(HL_NODES);
HL_CONFIG.Resize(HL_CONFIG.Size()+1); //Add the output layer
HL_CONFIG[HL_CONFIG.Size()-1] = (int)outputs; //Append one node to the output layer
//---
W_CONFIG.Resize(HL_CONFIG.Size());
B.Resize((ulong)HL_CONFIG.Sum());
//--- GENERATE WEIGHTS
ulong layer_input = inputs;
for (ulong i=0; i\n",
"HIDDEN LAYERS + OUTPUT ",HL_CONFIG,"\n",
"INPUTS ",inputs," | OUTPUTS ",outputs," W CONFIG ",W_CONFIG,"\n",
"activation ",EnumToString(A_FX)," SoftMaxLayer = ",bool(SoftMaxLayer)
);
Print("WEIGHTS ",W,"\nBIAS ",B);
#endif
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Destructor: discards the network parameters held by this instance.
CPatternNets::~CPatternNets(void)
{
ZeroMemory(W); //clear the flattened weights vector
ZeroMemory(B); //clear the flattened bias vector
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
int CPatternNets::PatternNetFF(vector &in_vector)
{
matrix L_INPUT = {}, L_OUTPUT={}, L_WEIGHTS = {};
vector v_weights ={};
ulong w_start = 0;
L_INPUT = MatrixExtend::VectorToMatrix(in_vector);
vector L_BIAS_VECTOR = {};
matrix L_BIAS_MATRIX = {};
ulong b_start = 0;
for (ulong i=0; i ",i);
Print("L_WEIGHTS\n",L_WEIGHTS,"\nL_INPUT\n",L_INPUT,"\nL_BIAS\n",L_BIAS_MATRIX);
#endif
L_OUTPUT = L_WEIGHTS.MatMul(L_INPUT);
L_OUTPUT = L_OUTPUT+L_BIAS_MATRIX; //Add bias
//---
if (i==W_CONFIG.Size()-1) //Last layer
{
if (SoftMaxLayer)
{
Print("Before softmax\n",L_OUTPUT);
SoftMaxLayerFX(L_OUTPUT);
Print("After\n",L_OUTPUT);
}
else
L_OUTPUT.Activation(L_OUTPUT, ENUM_ACTIVATION_FUNCTION(A_FX));
}
else
L_OUTPUT.Activation(L_OUTPUT, ENUM_ACTIVATION_FUNCTION(A_FX));
//---
L_INPUT.Copy(L_OUTPUT); //Assign outputs to the inputs
w_start += (ulong)W_CONFIG[i]; //New weights copy
b_start += (ulong)HL_CONFIG[i];
}
#ifdef DEBUG_MODE
Print("--> outputs\n ",L_OUTPUT);
#endif
vector v_out = MatrixExtend::MatrixToVector(L_OUTPUT);
return((int)classes[v_out.ArgMax()]);
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Applies the SoftMax function to a layer-output matrix in place,  |
//| so the resulting values sum to 1 (class probabilities).          |
//+------------------------------------------------------------------+
void CPatternNets::SoftMaxLayerFX(matrix &mat)
  {
//--- flatten, activate with SoftMax, then restore the original column count
   ulong cols = mat.Cols();
   vector flat = MatrixExtend::MatrixToVector(mat);
   flat.Activation(flat, AF_SOFTMAX);
   mat = MatrixExtend::VectorToMatrix(flat, cols);
  }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
vector CPatternNets::PatternNetFF(matrix &xmatrix)
{
vector v(xmatrix.Rows());
for (ulong i=0; i &mat)`: Applies the SoftMax function to a matrix (used for the output layer if `SoftMaxLyr` is True).
**III. Class Functionality:**
1. **Initialization:**
* The constructor validates data dimensions and parses user-defined hyperparameters.
* The network architecture (number of layers and neurons) is determined based on the provided configuration.
* Weights (connections between neurons) and biases (individual offsets for each neuron) are randomly initialized.
2. **Forward Pass:**
* The provided input vector is fed into the first layer.
* Each layer performs the following steps:
* Calculates the weighted sum of the previous layer's outputs.
* Adds the bias term to the weighted sum.
* Applies the chosen activation function to the result.
* This process continues through all layers until the final output layer is reached.
3. **SoftMax Layer (Optional)**
* If the `SoftMaxLyr` flag is True, the output layer uses the SoftMax function to ensure the output values sum to 1 and represent class probabilities.
4. **Prediction:**
* For single-sample prediction (`PatternNetFF(vector &in_vector)`), the class label with the **highest output value** is returned.
* For batch prediction (`PatternNetFF(matrix &xmatrix)`), a vector containing the predicted class label for each sample in the input matrix is returned.
**IV. Additional Notes:**
* The class provides several debug statements (disabled by default) to print intermediate calculations for debugging purposes.
* The code uses helper functions from the `MatrixExtend` class (not documented here) for matrix and vector operations.
* Choosing the appropriate network architecture, activation function, and learning approach (not implemented in this class) is crucial for optimal performance on specific tasks.
By understanding the theoretical foundation and functionalities of the `CPatternNets` class, MQL5 users can leverage neural networks for various pattern recognition tasks, including:
* **Classification:** Classifying data points into predefined categories based on their features.
* **Anomaly detection:** Identifying data points that deviate significantly from the expected patterns.
* **Feature learning:** Extracting hidden patterns or representations from the data.
## Regression Neural Network
This documentation explains the `CRegressorNets` class in MQL5, which implements a **Multi-Layer Perceptron (MLP)** for regression tasks.
**I. Regression vs. Classification:**
* **Regression:** Predicts continuous output values.
* **Classification:** Assigns data points to predefined categories.
**II. MLP Neural Network:**
An MLP is a type of **feed-forward neural network** used for supervised learning tasks like regression. It consists of:
* **Input layer:** Receives the input data.
* **Hidden layers:** Process and transform the information.
* **Output layer:** Produces the final prediction (continuous value in regression).
**III. CRegressorNets Class:**
The `CRegressorNets` class provides functionalities for training and using an MLP for regression in MQL5:
**Public Functions:**
* `CRegressorNets(vector &HL_NODES, activation ActivationFX=AF_RELU_)` Constructor:
* `HL_NODES`: Vector specifying the number of neurons in each hidden layer.
* `ActivationFX`: Activation function (enum specifying the type of activation function).
* `~CRegressorNets(void)` Destructor.
* `void fit(matrix &x, vector &y)` Trains the model on the provided data (`x` - features, `y` - target values).
* `double predict(vector &x)` Predicts the output value for a single input vector.
* `vector predict(matrix &x)` Predicts output values for all rows in the input matrix.
**Internal Functions (not directly accessible)**
* `CalcTimeElapsed(double seconds)`: Calculates and returns a string representing the elapsed time in a human-readable format (not relevant for core functionality).
* `RegressorNetsBackProp(matrix& x, vector &y, uint epochs, double alpha, loss LossFx=LOSS_MSE_, optimizer OPTIMIZER=OPTIMIZER_ADAM)`: Performs backpropagation for training (details not provided but likely involve calculating gradients and updating weights and biases).
* Optimizer functions (e.g., `AdamOptimizerW`, `AdamOptimizerB`) Implement specific optimization algorithms like Adam for updating weights and biases during training.
**Other Class Members:**
* `mlp_struct mlp`: Stores information about the network architecture (inputs, hidden layers, and outputs).
* `CTensors*` pointers: Represent tensors holding weights, biases, and other internal calculations (specific implementation likely relies on a custom tensor library).
* `matrix` variables: Used for calculations during training and may hold temporary data (e.g., `W_MATRIX`, `B_MATRIX`).
* `vector` variables: Store network configuration details (e.g., `W_CONFIG`, `HL_CONFIG`).
* `bool isBackProp`: Flag indicating if backpropagation is being performed (private).
* `matrix` variables: Used for storing intermediate results during backpropagation (e.g., `ACTIVATIONS`, `Partial_Derivatives`).
**IV. Additional Notes:**
* The class provides various activation function options and supports different loss functions (e.g., Mean Squared Error, Mean Absolute Error) for selecting the appropriate evaluation metric during training.
* The class implements the Adam optimizer, one of several optimization algorithms used for efficient training of neural networks.
* Detailed implementation of the backpropagation algorithm is not provided but is likely the core functionality for training the network.
**Reference**
* [Data Science and Machine Learning (Part 12): Can Self-Training Neural Networks Help You Outsmart the Stock Market?](https://www.mql5.com/en/articles/12209)
* [Data Science and Machine Learning — Neural Network (Part 01): Feed Forward Neural Network demystified](https://www.mql5.com/en/articles/11275)
* [Data Science and Machine Learning — Neural Network (Part 02): Feed forward NN Architectures Design](https://www.mql5.com/en/articles/11334)
================================================
FILE: Neural Networks/Regressor Nets.mqh
================================================
//+------------------------------------------------------------------+
//| neural_nn_lib.mqh |
//| Copyright 2022, Omega Joctan. |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2022, Omega Joctan."
#property link "https://www.mql5.com/en/users/omegajoctan"
//+------------------------------------------------------------------+
//| Regressor Neural Networks | Neural Networks for solving |
//| regression problems in contrast to classification problems, |
//| here we deal with continuous variables |
//+------------------------------------------------------------------+
#include ;
#include ;
#include
#include
#include
#include "optimizers.mqh"
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Unbounded / ReLU-family activation functions exposed for regression
//    networks. Each enumerator aliases the corresponding built-in
//    ENUM_ACTIVATION_FUNCTION constant, so a value can be cast directly when
//    calling matrix/vector Activation().
enum activation
{
AF_ELU_ = AF_ELU,
AF_EXP_ = AF_EXP,
AF_GELU_ = AF_GELU,
AF_LINEAR_ = AF_LINEAR,
AF_LRELU_ = AF_LRELU,
AF_RELU_ = AF_RELU,
AF_SELU_ = AF_SELU,
AF_TRELU_ = AF_TRELU,
AF_SOFTPLUS_ = AF_SOFTPLUS
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Loss functions available for training. Each enumerator aliases the
//    built-in ENUM_LOSS_FUNCTION constant so it can be cast directly when
//    computing loss gradients.
enum loss
{
LOSS_MSE_ = LOSS_MSE, // Mean Squared Error
LOSS_MAE_ = LOSS_MAE, // Mean Absolute Error
LOSS_MSLE_ = LOSS_MSLE, // Mean Squared Logarithmic Error
LOSS_POISSON_ = LOSS_POISSON // Poisson Loss
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
struct backprop //This structure returns the loss information obtained from the backpropagation function
{
vector training_loss, //loss on the training data, one entry per epoch
validation_loss; //loss on the held-out validation data, one entry per epoch
// Pre-allocates one slot per epoch in both loss vectors.
void Init(ulong epochs)
{
training_loss.Resize(epochs);
validation_loss.Resize(epochs);
}
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
struct mlp_struct //multi layer perceptron information structure
{
ulong inputs; //number of input features (columns of the x matrix)
ulong hidden_layers; //number of layers, including the appended output layer
ulong outputs; //number of output nodes (1 for regression)
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Multi-layer perceptron for regression. Architecture is fixed at
//    construction (hidden-layer sizes), parameters are learned by the
//    optimizer-specific fit/backpropagation overloads.
class CRegressorNets
  {
   mlp_struct mlp;              //inputs / hidden-layers / outputs summary
   CTensors *Weights_tensor;    //Weight Tensor — one weight matrix per layer
   CTensors *Bias_tensor;       //one bias matrix per layer
   CTensors *Input_tensor;      //per-layer inputs cached for backpropagation
   CTensors *Output_tensor;     //per-layer outputs cached for backpropagation

protected:
   activation A_FX;             //activation function applied in every layer
   loss m_loss_function;        //loss function minimized during training
   bool trained;                //true once fit() has completed; predict() checks it
   string ConvertTime(double seconds); //formats a duration as a readable string

//-- for backpropn
   vector W_CONFIG;             //number of weights per layer
   vector HL_CONFIG;            //nodes per hidden layer (+ appended output layer)
   bool isBackProp;             //true while backpropagation is running
   matrix ACTIVATIONS;          //intermediate activations (backprop scratch)
   matrix Partial_Derivatives;  //activation derivatives (backprop scratch)
   int m_random_state;          //seed for reproducible weight initialization

private:
//--- One backpropagation overload per supported optimizer type
   virtual backprop backpropagation(const matrix& x, const vector &y, OptimizerSGD *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual backprop backpropagation(const matrix& x, const vector &y, OptimizerAdaDelta *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual backprop backpropagation(const matrix& x, const vector &y, OptimizerAdaGrad *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual backprop backpropagation(const matrix& x, const vector &y, OptimizerAdam *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual backprop backpropagation(const matrix& x, const vector &y, OptimizerNadam *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual backprop backpropagation(const matrix& x, const vector &y, OptimizerRMSprop *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);

public:
//--- The loss parameter is named LOSS_ to match the out-of-class definition
//    and to avoid shadowing the m_loss_function member (it was previously
//    declared here as "loss m_loss_function")
   CRegressorNets(vector &HL_NODES, activation AF_=AF_RELU_, loss LOSS_=LOSS_MSE_, int random_state=42);
   ~CRegressorNets(void);

//--- Train with the chosen optimizer (one overload per optimizer type)
   virtual void fit(const matrix &x, const vector &y, OptimizerSGD *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual void fit(const matrix &x, const vector &y, OptimizerAdaDelta *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual void fit(const matrix &x, const vector &y, OptimizerAdaGrad *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual void fit(const matrix &x, const vector &y, OptimizerAdam *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual void fit(const matrix &x, const vector &y, OptimizerNadam *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);
   virtual void fit(const matrix &x, const vector &y, OptimizerRMSprop *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false);

   virtual double predict(const vector &x); //single-sample prediction
   virtual vector predict(const matrix &x); //row-wise batch prediction
  };
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Constructor: stores the hyperparameters only; weight/bias tensors are
//    allocated later (during backpropagation) once the input and output
//    dimensions are known from the data.
CRegressorNets::CRegressorNets(vector &HL_NODES, activation AF_=AF_RELU_, loss LOSS_=LOSS_MSE_, int random_state=42)
:A_FX(AF_),
m_loss_function(LOSS_),
isBackProp(false),
m_random_state(random_state)
{
HL_CONFIG.Copy(HL_NODES); //nodes per hidden layer; the output layer is appended during training
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Destructor: frees the tensors allocated during training. The
//    CheckPointer guards make destruction safe even if fit() was never
//    called and the pointers were never assigned.
CRegressorNets::~CRegressorNets(void)
{
if (CheckPointer(this.Weights_tensor) != POINTER_INVALID) delete(this.Weights_tensor);
if (CheckPointer(this.Bias_tensor) != POINTER_INVALID) delete(this.Bias_tensor);
if (CheckPointer(this.Input_tensor) != POINTER_INVALID) delete(this.Input_tensor);
if (CheckPointer(this.Output_tensor) != POINTER_INVALID) delete(this.Output_tensor);
isBackProp = false; //no backpropagation can be in progress after teardown
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
double CRegressorNets::predict(const vector &x)
{
if (!trained)
{
printf("%s Train the model first before using it to make predictions | call the fit function first",__FUNCTION__);
return 0;
}
matrix L_INPUT = MatrixExtend::VectorToMatrix(x);
matrix L_OUTPUT ={};
for(ulong i=0; i= 60)
{
minutes = (uint)(seconds / 60.0) ;
seconds = fmod(seconds, 1.0) * 60;
time_str = StringFormat("%d Minutes and %.3f Seconds", minutes, seconds);
}
if (minutes >= 60)
{
hours = (uint)(minutes / 60.0);
minutes = minutes % 60;
time_str = StringFormat("%d Hours and %d Minutes", hours, minutes);
}
if (time_str == "")
{
time_str = StringFormat("%.3f Seconds", seconds);
}
return time_str;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| backpropagation (OptimizerSGD overload).                         |
//| Trains the regressor MLP on (x, y) for `epochs` passes and       |
//| returns a `backprop` struct holding per-epoch training and       |
//| validation losses. batch_size==0 takes the stochastic path,      |
//| otherwise the mini-batch path; show_batch_progress prints        |
//| per-batch loss/R^2 lines.                                        |
//| Ownership: `optimizer` is deleted before returning — the caller  |
//| must not reuse the pointer after this call.                      |
//| NOTE(extraction): several for-loop headers below were mangled by |
//| angle-bracket stripping in the archive (e.g. "for (ulong i=0;    |
//| i\n"), so the original loop bounds and parts of the bodies —     |
//| including declarations of pred_v/actual_v/LossGradient/          |
//| Partial_Derivatives — are not visible in this chunk.             |
//| NOTE(review): this overload duplicates the other optimizer       |
//| overloads line-for-line except for the optimizer type; a single  |
//| templated helper would remove the quintuplication.               |
//+------------------------------------------------------------------+
backprop CRegressorNets::backpropagation(const matrix& x, const vector &y, OptimizerSGD *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false)
{
isBackProp = true; // set for the duration of training, cleared before returning
//---
backprop backprop_struct;
backprop_struct.Init(epochs);
ulong rows = x.Rows();
mlp.inputs = x.Cols();
mlp.outputs = 1; // regression: single output neuron
//---
vector v2 = {(double)mlp.outputs}; //Adding the output layer to the mix of hidden layers
HL_CONFIG = MatrixExtend::concatenate(HL_CONFIG, v2);
mlp.hidden_layers = HL_CONFIG.Size();
W_CONFIG.Resize(HL_CONFIG.Size());
//---
if (y.Size() != rows)
{
Print(__FUNCTION__," FATAL | Number of rows in the x matrix is not the same the y vector size ");
return backprop_struct; // losses left as initialized by Init()
}
matrix W, B;
//--- GENERATE WEIGHTS
// NOTE(review): calling this function more than once re-news these tensors over the
// previous pointers with no delete here — confirm the old ones are freed elsewhere.
this.Weights_tensor = new CTensors((uint)mlp.hidden_layers);
this.Bias_tensor = new CTensors((uint)mlp.hidden_layers);
this.Input_tensor = new CTensors((uint)mlp.hidden_layers);
this.Output_tensor = new CTensors((uint)mlp.hidden_layers);
ulong layer_input = mlp.inputs;
// NOTE(extraction): garbled loop header — weight/bias initialization body is missing here.
for (ulong i=0; i\n",
"HL_CONFIG ",HL_CONFIG," TOTAL HL(S) ",mlp.hidden_layers,"\n",
"W_CONFIG ",W_CONFIG," ACTIVATION ",EnumToString(A_FX),"\n",
"NN INPUTS ",mlp.inputs," OUTPUT ",mlp.outputs
);
//--- Optimizer
// Two independent copies of the caller's optimizer state: one for weights, one for biases.
// NOTE(review): `optimizer` is a pointer copied into object values — verify MQL5 copy
// semantics preserve the optimizer's internal state as intended.
OptimizerSGD optimizer_weights = optimizer;
OptimizerSGD optimizer_bias = optimizer;
if (batch_size>0)
{
// NOTE(review): these block-locals shadow the outer optimizers and are destroyed at the
// closing brace below — they appear to have no effect, so mini-batch mode still trains
// with the SGD optimizers declared above. Looks like a bug; confirm intent upstream.
OptimizerMinBGD optimizer_weights;
OptimizerMinBGD optimizer_bias;
}
//--- Cross validation
CCrossValidation cross_validation;
CTensors *cv_tensor;
matrix validation_data = MatrixExtend::concatenate(x, y);
matrix validation_x;
vector validation_y;
cv_tensor = cross_validation.KFoldCV(validation_data, 10); //k-fold cross validation | 10 folds selected
//---
matrix DELTA = {};
double actual=0, pred=0;
matrix temp_inputs ={};
matrix dB = {}; //Bias Derivatives
matrix dW = {}; //Weight Derivatives
// NOTE(extraction): garbled header — the epoch loop (and, in stochastic mode, the per-sample
// loop) was fused with the backward layer-loop condition "...=0 && !IsStopped(); layer--".
for (ulong epoch=0; epoch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
// Propagate the error backward through the next layer's weights.
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
}
else //Batch Gradient Descent
{
// NOTE(extraction): garbled header — the batch loop and per-sample loop were fused with
// the backward layer-loop condition; batch_x/batch_y/num_batches declarations are missing.
for (uint batch=0, batch_start=0, batch_end=batch_size; batch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
pred_v = predict(batch_x);
batch_loss[batch] = pred_v.Loss(batch_y, ENUM_LOSS_FUNCTION(m_loss_function));
batch_loss[batch] = MathIsValidNumber(batch_loss[batch]) ? (batch_loss[batch]>1e6 ? 1e6 : batch_loss[batch]) : 1e6; //Check for nan and return some large value if it is nan
batch_accuracy[batch] = Metrics::r_squared(batch_y, pred_v);
if (show_batch_progress)
printf("----> batch[%d/%d] batch-loss %.5f accuracy %.3f",batch+1,num_batches,batch_loss[batch], batch_accuracy[batch]);
}
}
//--- End of an epoch
// Per-fold validation metrics for this epoch (10-fold CV tensor built above).
vector validation_loss(cv_tensor.SIZE);
vector validation_acc(cv_tensor.SIZE);
// NOTE(extraction): garbled — the fold loop and the stochastic-path training-loss
// assignment were fused here; both loss series are clamped to 1e6 and NaN-guarded.
for (ulong i=0; i1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
else
{
backprop_struct.training_loss[epoch] = batch_loss.Mean();
backprop_struct.training_loss[epoch] = MathIsValidNumber(backprop_struct.training_loss[epoch]) ? (backprop_struct.training_loss[epoch]>1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
double epoch_stop = GetTickCount();
printf("--> Epoch [%d/%d] training -> loss %.8f accuracy %.3f validation -> loss %.5f accuracy %.3f | Elapsed %s ",epoch+1,epochs,backprop_struct.training_loss[epoch],Metrics::r_squared(y, pred_v),backprop_struct.validation_loss[epoch],validation_acc.Mean(),this.ConvertTime((epoch_stop-epoch_start)/1000.0));
}
isBackProp = false;
//--- Activation caches are only needed during training; Weights/Bias tensors are kept for
//--- prediction — presumably freed in the destructor (not visible here); confirm.
if (CheckPointer(this.Input_tensor) != POINTER_INVALID) delete(this.Input_tensor);
if (CheckPointer(this.Output_tensor) != POINTER_INVALID) delete(this.Output_tensor);
//--- Takes ownership: the caller's optimizer instance is destroyed here.
if (CheckPointer(optimizer)!=POINTER_INVALID)
delete optimizer;
return backprop_struct;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| backpropagation (OptimizerAdaDelta overload).                    |
//| Trains the regressor MLP on (x, y) for `epochs` passes and       |
//| returns a `backprop` struct holding per-epoch training and       |
//| validation losses. batch_size==0 takes the stochastic path,      |
//| otherwise the mini-batch path; show_batch_progress prints        |
//| per-batch loss/R^2 lines.                                        |
//| Ownership: `optimizer` is deleted before returning — the caller  |
//| must not reuse the pointer after this call.                      |
//| NOTE(extraction): several for-loop headers below were mangled by |
//| angle-bracket stripping in the archive, so the original loop     |
//| bounds and parts of the bodies are not visible in this chunk.    |
//| NOTE(review): line-for-line duplicate of the other optimizer     |
//| overloads except for the optimizer type; a templated helper      |
//| would remove the duplication.                                    |
//+------------------------------------------------------------------+
backprop CRegressorNets::backpropagation(const matrix& x, const vector &y, OptimizerAdaDelta *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false)
{
isBackProp = true; // set for the duration of training, cleared before returning
//---
backprop backprop_struct;
backprop_struct.Init(epochs);
ulong rows = x.Rows();
mlp.inputs = x.Cols();
mlp.outputs = 1; // regression: single output neuron
//---
vector v2 = {(double)mlp.outputs}; //Adding the output layer to the mix of hidden layers
HL_CONFIG = MatrixExtend::concatenate(HL_CONFIG, v2);
mlp.hidden_layers = HL_CONFIG.Size();
W_CONFIG.Resize(HL_CONFIG.Size());
//---
if (y.Size() != rows)
{
Print(__FUNCTION__," FATAL | Number of rows in the x matrix is not the same the y vector size ");
return backprop_struct; // losses left as initialized by Init()
}
matrix W, B;
//--- GENERATE WEIGHTS
// NOTE(review): repeated calls re-new these tensors over the previous pointers with no
// delete here — confirm the old ones are freed elsewhere.
this.Weights_tensor = new CTensors((uint)mlp.hidden_layers);
this.Bias_tensor = new CTensors((uint)mlp.hidden_layers);
this.Input_tensor = new CTensors((uint)mlp.hidden_layers);
this.Output_tensor = new CTensors((uint)mlp.hidden_layers);
ulong layer_input = mlp.inputs;
// NOTE(extraction): garbled loop header — weight/bias initialization body is missing here.
for (ulong i=0; i\n",
"HL_CONFIG ",HL_CONFIG," TOTAL HL(S) ",mlp.hidden_layers,"\n",
"W_CONFIG ",W_CONFIG," ACTIVATION ",EnumToString(A_FX),"\n",
"NN INPUTS ",mlp.inputs," OUTPUT ",mlp.outputs
);
//--- Optimizer
// Two independent copies of the caller's optimizer state: one for weights, one for biases.
OptimizerAdaDelta optimizer_weights = optimizer;
OptimizerAdaDelta optimizer_bias = optimizer;
if (batch_size>0)
{
// NOTE(review): these block-locals shadow the outer optimizers and die at the closing
// brace — they appear to have no effect on the training below; likely a bug.
OptimizerMinBGD optimizer_weights;
OptimizerMinBGD optimizer_bias;
}
//--- Cross validation
CCrossValidation cross_validation;
CTensors *cv_tensor;
matrix validation_data = MatrixExtend::concatenate(x, y);
matrix validation_x;
vector validation_y;
cv_tensor = cross_validation.KFoldCV(validation_data, 10); //k-fold cross validation | 10 folds selected
//---
matrix DELTA = {};
double actual=0, pred=0;
matrix temp_inputs ={};
matrix dB = {}; //Bias Derivatives
matrix dW = {}; //Weight Derivatives
// NOTE(extraction): garbled header — the epoch/sample loops were fused with the backward
// layer-loop condition "...=0 && !IsStopped(); layer--".
for (ulong epoch=0; epoch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
// Propagate the error backward through the next layer's weights.
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
}
else //Batch Gradient Descent
{
// NOTE(extraction): garbled header — batch_x/batch_y/num_batches declarations are missing.
for (uint batch=0, batch_start=0, batch_end=batch_size; batch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
pred_v = predict(batch_x);
batch_loss[batch] = pred_v.Loss(batch_y, ENUM_LOSS_FUNCTION(m_loss_function));
batch_loss[batch] = MathIsValidNumber(batch_loss[batch]) ? (batch_loss[batch]>1e6 ? 1e6 : batch_loss[batch]) : 1e6; //Check for nan and return some large value if it is nan
batch_accuracy[batch] = Metrics::r_squared(batch_y, pred_v);
if (show_batch_progress)
printf("----> batch[%d/%d] batch-loss %.5f accuracy %.3f",batch+1,num_batches,batch_loss[batch], batch_accuracy[batch]);
}
}
//--- End of an epoch
// Per-fold validation metrics for this epoch (10-fold CV tensor built above).
vector validation_loss(cv_tensor.SIZE);
vector validation_acc(cv_tensor.SIZE);
// NOTE(extraction): garbled — fold loop fused with the stochastic-path loss assignment.
for (ulong i=0; i1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
else
{
backprop_struct.training_loss[epoch] = batch_loss.Mean();
backprop_struct.training_loss[epoch] = MathIsValidNumber(backprop_struct.training_loss[epoch]) ? (backprop_struct.training_loss[epoch]>1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
double epoch_stop = GetTickCount();
printf("--> Epoch [%d/%d] training -> loss %.8f accuracy %.3f validation -> loss %.5f accuracy %.3f | Elapsed %s ",epoch+1,epochs,backprop_struct.training_loss[epoch],Metrics::r_squared(y, pred_v),backprop_struct.validation_loss[epoch],validation_acc.Mean(),this.ConvertTime((epoch_stop-epoch_start)/1000.0));
}
isBackProp = false;
//--- Free training-only activation caches; Weights/Bias tensors are kept for prediction.
if (CheckPointer(this.Input_tensor) != POINTER_INVALID) delete(this.Input_tensor);
if (CheckPointer(this.Output_tensor) != POINTER_INVALID) delete(this.Output_tensor);
//--- Takes ownership: the caller's optimizer instance is destroyed here.
if (CheckPointer(optimizer)!=POINTER_INVALID)
delete optimizer;
return backprop_struct;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| backpropagation (OptimizerAdaGrad overload).                     |
//| Trains the regressor MLP on (x, y) for `epochs` passes and       |
//| returns a `backprop` struct holding per-epoch training and       |
//| validation losses. batch_size==0 takes the stochastic path,      |
//| otherwise the mini-batch path; show_batch_progress prints        |
//| per-batch loss/R^2 lines.                                        |
//| Ownership: `optimizer` is deleted before returning — the caller  |
//| must not reuse the pointer after this call.                      |
//| NOTE(extraction): several for-loop headers below were mangled by |
//| angle-bracket stripping in the archive, so the original loop     |
//| bounds and parts of the bodies are not visible in this chunk.    |
//| NOTE(review): line-for-line duplicate of the other optimizer     |
//| overloads except for the optimizer type; a templated helper      |
//| would remove the duplication.                                    |
//+------------------------------------------------------------------+
backprop CRegressorNets::backpropagation(const matrix& x, const vector &y, OptimizerAdaGrad *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false)
{
isBackProp = true; // set for the duration of training, cleared before returning
//---
backprop backprop_struct;
backprop_struct.Init(epochs);
ulong rows = x.Rows();
mlp.inputs = x.Cols();
mlp.outputs = 1; // regression: single output neuron
//---
vector v2 = {(double)mlp.outputs}; //Adding the output layer to the mix of hidden layers
HL_CONFIG = MatrixExtend::concatenate(HL_CONFIG, v2);
mlp.hidden_layers = HL_CONFIG.Size();
W_CONFIG.Resize(HL_CONFIG.Size());
//---
if (y.Size() != rows)
{
Print(__FUNCTION__," FATAL | Number of rows in the x matrix is not the same the y vector size ");
return backprop_struct; // losses left as initialized by Init()
}
matrix W, B;
//--- GENERATE WEIGHTS
// NOTE(review): repeated calls re-new these tensors over the previous pointers with no
// delete here — confirm the old ones are freed elsewhere.
this.Weights_tensor = new CTensors((uint)mlp.hidden_layers);
this.Bias_tensor = new CTensors((uint)mlp.hidden_layers);
this.Input_tensor = new CTensors((uint)mlp.hidden_layers);
this.Output_tensor = new CTensors((uint)mlp.hidden_layers);
ulong layer_input = mlp.inputs;
// NOTE(extraction): garbled loop header — weight/bias initialization body is missing here.
for (ulong i=0; i\n",
"HL_CONFIG ",HL_CONFIG," TOTAL HL(S) ",mlp.hidden_layers,"\n",
"W_CONFIG ",W_CONFIG," ACTIVATION ",EnumToString(A_FX),"\n",
"NN INPUTS ",mlp.inputs," OUTPUT ",mlp.outputs
);
//--- Optimizer
// Two independent copies of the caller's optimizer state: one for weights, one for biases.
OptimizerAdaGrad optimizer_weights = optimizer;
OptimizerAdaGrad optimizer_bias = optimizer;
if (batch_size>0)
{
// NOTE(review): these block-locals shadow the outer optimizers and die at the closing
// brace — they appear to have no effect on the training below; likely a bug.
OptimizerMinBGD optimizer_weights;
OptimizerMinBGD optimizer_bias;
}
//--- Cross validation
CCrossValidation cross_validation;
CTensors *cv_tensor;
matrix validation_data = MatrixExtend::concatenate(x, y);
matrix validation_x;
vector validation_y;
cv_tensor = cross_validation.KFoldCV(validation_data, 10); //k-fold cross validation | 10 folds selected
//---
matrix DELTA = {};
double actual=0, pred=0;
matrix temp_inputs ={};
matrix dB = {}; //Bias Derivatives
matrix dW = {}; //Weight Derivatives
// NOTE(extraction): garbled header — the epoch/sample loops were fused with the backward
// layer-loop condition "...=0 && !IsStopped(); layer--".
for (ulong epoch=0; epoch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
// Propagate the error backward through the next layer's weights.
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
}
else //Batch Gradient Descent
{
// NOTE(extraction): garbled header — batch_x/batch_y/num_batches declarations are missing.
for (uint batch=0, batch_start=0, batch_end=batch_size; batch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
pred_v = predict(batch_x);
batch_loss[batch] = pred_v.Loss(batch_y, ENUM_LOSS_FUNCTION(m_loss_function));
batch_loss[batch] = MathIsValidNumber(batch_loss[batch]) ? (batch_loss[batch]>1e6 ? 1e6 : batch_loss[batch]) : 1e6; //Check for nan and return some large value if it is nan
batch_accuracy[batch] = Metrics::r_squared(batch_y, pred_v);
if (show_batch_progress)
printf("----> batch[%d/%d] batch-loss %.5f accuracy %.3f",batch+1,num_batches,batch_loss[batch], batch_accuracy[batch]);
}
}
//--- End of an epoch
// Per-fold validation metrics for this epoch (10-fold CV tensor built above).
vector validation_loss(cv_tensor.SIZE);
vector validation_acc(cv_tensor.SIZE);
// NOTE(extraction): garbled — fold loop fused with the stochastic-path loss assignment.
for (ulong i=0; i1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
else
{
backprop_struct.training_loss[epoch] = batch_loss.Mean();
backprop_struct.training_loss[epoch] = MathIsValidNumber(backprop_struct.training_loss[epoch]) ? (backprop_struct.training_loss[epoch]>1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
double epoch_stop = GetTickCount();
printf("--> Epoch [%d/%d] training -> loss %.8f accuracy %.3f validation -> loss %.5f accuracy %.3f | Elapsed %s ",epoch+1,epochs,backprop_struct.training_loss[epoch],Metrics::r_squared(y, pred_v),backprop_struct.validation_loss[epoch],validation_acc.Mean(),this.ConvertTime((epoch_stop-epoch_start)/1000.0));
}
isBackProp = false;
//--- Free training-only activation caches; Weights/Bias tensors are kept for prediction.
if (CheckPointer(this.Input_tensor) != POINTER_INVALID) delete(this.Input_tensor);
if (CheckPointer(this.Output_tensor) != POINTER_INVALID) delete(this.Output_tensor);
//--- Takes ownership: the caller's optimizer instance is destroyed here.
if (CheckPointer(optimizer)!=POINTER_INVALID)
delete optimizer;
return backprop_struct;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| backpropagation (OptimizerAdam overload).                        |
//| Trains the regressor MLP on (x, y) for `epochs` passes and       |
//| returns a `backprop` struct holding per-epoch training and       |
//| validation losses. batch_size==0 takes the stochastic path,      |
//| otherwise the mini-batch path; show_batch_progress prints        |
//| per-batch loss/R^2 lines.                                        |
//| Ownership: `optimizer` is deleted before returning — the caller  |
//| must not reuse the pointer after this call.                      |
//| NOTE(extraction): several for-loop headers below were mangled by |
//| angle-bracket stripping in the archive, so the original loop     |
//| bounds and parts of the bodies are not visible in this chunk.    |
//| NOTE(review): line-for-line duplicate of the other optimizer     |
//| overloads except for the optimizer type; a templated helper      |
//| would remove the duplication.                                    |
//+------------------------------------------------------------------+
backprop CRegressorNets::backpropagation(const matrix& x, const vector &y, OptimizerAdam *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false)
{
isBackProp = true; // set for the duration of training, cleared before returning
//---
backprop backprop_struct;
backprop_struct.Init(epochs);
ulong rows = x.Rows();
mlp.inputs = x.Cols();
mlp.outputs = 1; // regression: single output neuron
//---
vector v2 = {(double)mlp.outputs}; //Adding the output layer to the mix of hidden layers
HL_CONFIG = MatrixExtend::concatenate(HL_CONFIG, v2);
mlp.hidden_layers = HL_CONFIG.Size();
W_CONFIG.Resize(HL_CONFIG.Size());
//---
if (y.Size() != rows)
{
Print(__FUNCTION__," FATAL | Number of rows in the x matrix is not the same the y vector size ");
return backprop_struct; // losses left as initialized by Init()
}
matrix W, B;
//--- GENERATE WEIGHTS
// NOTE(review): repeated calls re-new these tensors over the previous pointers with no
// delete here — confirm the old ones are freed elsewhere.
this.Weights_tensor = new CTensors((uint)mlp.hidden_layers);
this.Bias_tensor = new CTensors((uint)mlp.hidden_layers);
this.Input_tensor = new CTensors((uint)mlp.hidden_layers);
this.Output_tensor = new CTensors((uint)mlp.hidden_layers);
ulong layer_input = mlp.inputs;
// NOTE(extraction): garbled loop header — weight/bias initialization body is missing here.
for (ulong i=0; i\n",
"HL_CONFIG ",HL_CONFIG," TOTAL HL(S) ",mlp.hidden_layers,"\n",
"W_CONFIG ",W_CONFIG," ACTIVATION ",EnumToString(A_FX),"\n",
"NN INPUTS ",mlp.inputs," OUTPUT ",mlp.outputs
);
//--- Optimizer
// Two independent copies of the caller's optimizer state: one for weights, one for biases.
OptimizerAdam optimizer_weights = optimizer;
OptimizerAdam optimizer_bias = optimizer;
if (batch_size>0)
{
// NOTE(review): these block-locals shadow the outer optimizers and die at the closing
// brace — they appear to have no effect on the training below; likely a bug.
OptimizerMinBGD optimizer_weights;
OptimizerMinBGD optimizer_bias;
}
//--- Cross validation
CCrossValidation cross_validation;
CTensors *cv_tensor;
matrix validation_data = MatrixExtend::concatenate(x, y);
matrix validation_x;
vector validation_y;
cv_tensor = cross_validation.KFoldCV(validation_data, 10); //k-fold cross validation | 10 folds selected
//---
matrix DELTA = {};
double actual=0, pred=0;
matrix temp_inputs ={};
matrix dB = {}; //Bias Derivatives
matrix dW = {}; //Weight Derivatives
// NOTE(extraction): garbled header — the epoch/sample loops were fused with the backward
// layer-loop condition "...=0 && !IsStopped(); layer--".
for (ulong epoch=0; epoch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
// Propagate the error backward through the next layer's weights.
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
}
else //Batch Gradient Descent
{
// NOTE(extraction): garbled header — batch_x/batch_y/num_batches declarations are missing.
for (uint batch=0, batch_start=0, batch_end=batch_size; batch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
pred_v = predict(batch_x);
batch_loss[batch] = pred_v.Loss(batch_y, ENUM_LOSS_FUNCTION(m_loss_function));
batch_loss[batch] = MathIsValidNumber(batch_loss[batch]) ? (batch_loss[batch]>1e6 ? 1e6 : batch_loss[batch]) : 1e6; //Check for nan and return some large value if it is nan
batch_accuracy[batch] = Metrics::r_squared(batch_y, pred_v);
if (show_batch_progress)
printf("----> batch[%d/%d] batch-loss %.5f accuracy %.3f",batch+1,num_batches,batch_loss[batch], batch_accuracy[batch]);
}
}
//--- End of an epoch
// Per-fold validation metrics for this epoch (10-fold CV tensor built above).
vector validation_loss(cv_tensor.SIZE);
vector validation_acc(cv_tensor.SIZE);
// NOTE(extraction): garbled — fold loop fused with the stochastic-path loss assignment.
for (ulong i=0; i1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
else
{
backprop_struct.training_loss[epoch] = batch_loss.Mean();
backprop_struct.training_loss[epoch] = MathIsValidNumber(backprop_struct.training_loss[epoch]) ? (backprop_struct.training_loss[epoch]>1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
double epoch_stop = GetTickCount();
printf("--> Epoch [%d/%d] training -> loss %.8f accuracy %.3f validation -> loss %.5f accuracy %.3f | Elapsed %s ",epoch+1,epochs,backprop_struct.training_loss[epoch],Metrics::r_squared(y, pred_v),backprop_struct.validation_loss[epoch],validation_acc.Mean(),this.ConvertTime((epoch_stop-epoch_start)/1000.0));
}
isBackProp = false;
//--- Free training-only activation caches; Weights/Bias tensors are kept for prediction.
if (CheckPointer(this.Input_tensor) != POINTER_INVALID) delete(this.Input_tensor);
if (CheckPointer(this.Output_tensor) != POINTER_INVALID) delete(this.Output_tensor);
//--- Takes ownership: the caller's optimizer instance is destroyed here.
if (CheckPointer(optimizer)!=POINTER_INVALID)
delete optimizer;
return backprop_struct;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| backpropagation (OptimizerNadam overload).                       |
//| Trains the regressor MLP on (x, y) for `epochs` passes and       |
//| returns a `backprop` struct holding per-epoch training and       |
//| validation losses. batch_size==0 takes the stochastic path,      |
//| otherwise the mini-batch path; show_batch_progress prints        |
//| per-batch loss/R^2 lines.                                        |
//| Ownership: `optimizer` is deleted before returning — the caller  |
//| must not reuse the pointer after this call.                      |
//| NOTE(extraction): several for-loop headers below were mangled by |
//| angle-bracket stripping in the archive, so the original loop     |
//| bounds and parts of the bodies are not visible in this chunk.    |
//| NOTE(review): line-for-line duplicate of the other optimizer     |
//| overloads except for the optimizer type; a templated helper      |
//| would remove the duplication.                                    |
//+------------------------------------------------------------------+
backprop CRegressorNets::backpropagation(const matrix& x, const vector &y, OptimizerNadam *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false)
{
isBackProp = true; // set for the duration of training, cleared before returning
//---
backprop backprop_struct;
backprop_struct.Init(epochs);
ulong rows = x.Rows();
mlp.inputs = x.Cols();
mlp.outputs = 1; // regression: single output neuron
//---
vector v2 = {(double)mlp.outputs}; //Adding the output layer to the mix of hidden layers
HL_CONFIG = MatrixExtend::concatenate(HL_CONFIG, v2);
mlp.hidden_layers = HL_CONFIG.Size();
W_CONFIG.Resize(HL_CONFIG.Size());
//---
if (y.Size() != rows)
{
Print(__FUNCTION__," FATAL | Number of rows in the x matrix is not the same the y vector size ");
return backprop_struct; // losses left as initialized by Init()
}
matrix W, B;
//--- GENERATE WEIGHTS
// NOTE(review): repeated calls re-new these tensors over the previous pointers with no
// delete here — confirm the old ones are freed elsewhere.
this.Weights_tensor = new CTensors((uint)mlp.hidden_layers);
this.Bias_tensor = new CTensors((uint)mlp.hidden_layers);
this.Input_tensor = new CTensors((uint)mlp.hidden_layers);
this.Output_tensor = new CTensors((uint)mlp.hidden_layers);
ulong layer_input = mlp.inputs;
// NOTE(extraction): garbled loop header — weight/bias initialization body is missing here.
for (ulong i=0; i\n",
"HL_CONFIG ",HL_CONFIG," TOTAL HL(S) ",mlp.hidden_layers,"\n",
"W_CONFIG ",W_CONFIG," ACTIVATION ",EnumToString(A_FX),"\n",
"NN INPUTS ",mlp.inputs," OUTPUT ",mlp.outputs
);
//--- Optimizer
// Two independent copies of the caller's optimizer state: one for weights, one for biases.
OptimizerNadam optimizer_weights = optimizer;
OptimizerNadam optimizer_bias = optimizer;
if (batch_size>0)
{
// NOTE(review): these block-locals shadow the outer optimizers and die at the closing
// brace — they appear to have no effect on the training below; likely a bug.
OptimizerMinBGD optimizer_weights;
OptimizerMinBGD optimizer_bias;
}
//--- Cross validation
CCrossValidation cross_validation;
CTensors *cv_tensor;
matrix validation_data = MatrixExtend::concatenate(x, y);
matrix validation_x;
vector validation_y;
cv_tensor = cross_validation.KFoldCV(validation_data, 10); //k-fold cross validation | 10 folds selected
//---
matrix DELTA = {};
double actual=0, pred=0;
matrix temp_inputs ={};
matrix dB = {}; //Bias Derivatives
matrix dW = {}; //Weight Derivatives
// NOTE(extraction): garbled header — the epoch/sample loops were fused with the backward
// layer-loop condition "...=0 && !IsStopped(); layer--".
for (ulong epoch=0; epoch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
// Propagate the error backward through the next layer's weights.
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
}
else //Batch Gradient Descent
{
// NOTE(extraction): garbled header — batch_x/batch_y/num_batches declarations are missing.
for (uint batch=0, batch_start=0, batch_end=batch_size; batch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
pred_v = predict(batch_x);
batch_loss[batch] = pred_v.Loss(batch_y, ENUM_LOSS_FUNCTION(m_loss_function));
batch_loss[batch] = MathIsValidNumber(batch_loss[batch]) ? (batch_loss[batch]>1e6 ? 1e6 : batch_loss[batch]) : 1e6; //Check for nan and return some large value if it is nan
batch_accuracy[batch] = Metrics::r_squared(batch_y, pred_v);
if (show_batch_progress)
printf("----> batch[%d/%d] batch-loss %.5f accuracy %.3f",batch+1,num_batches,batch_loss[batch], batch_accuracy[batch]);
}
}
//--- End of an epoch
// Per-fold validation metrics for this epoch (10-fold CV tensor built above).
vector validation_loss(cv_tensor.SIZE);
vector validation_acc(cv_tensor.SIZE);
// NOTE(extraction): garbled — fold loop fused with the stochastic-path loss assignment.
for (ulong i=0; i1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
else
{
backprop_struct.training_loss[epoch] = batch_loss.Mean();
backprop_struct.training_loss[epoch] = MathIsValidNumber(backprop_struct.training_loss[epoch]) ? (backprop_struct.training_loss[epoch]>1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
double epoch_stop = GetTickCount();
printf("--> Epoch [%d/%d] training -> loss %.8f accuracy %.3f validation -> loss %.5f accuracy %.3f | Elapsed %s ",epoch+1,epochs,backprop_struct.training_loss[epoch],Metrics::r_squared(y, pred_v),backprop_struct.validation_loss[epoch],validation_acc.Mean(),this.ConvertTime((epoch_stop-epoch_start)/1000.0));
}
isBackProp = false;
//--- Free training-only activation caches; Weights/Bias tensors are kept for prediction.
if (CheckPointer(this.Input_tensor) != POINTER_INVALID) delete(this.Input_tensor);
if (CheckPointer(this.Output_tensor) != POINTER_INVALID) delete(this.Output_tensor);
//--- Takes ownership: the caller's optimizer instance is destroyed here.
if (CheckPointer(optimizer)!=POINTER_INVALID)
delete optimizer;
return backprop_struct;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Trains the regressor network with backpropagation using the given
//--- RMSprop optimizer; returns per-epoch training/validation losses.
//--- NOTE(review): several lines in this routine appear mangled by text
//--- extraction (loop headers fused with later statements); verify
//--- against the original repository file before changing any logic.
backprop CRegressorNets::backpropagation(const matrix& x, const vector &y, OptimizerRMSprop *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false)
{
isBackProp = true;
//--- prepare the per-epoch loss containers
backprop backprop_struct;
backprop_struct.Init(epochs);
ulong rows = x.Rows();
mlp.inputs = x.Cols();
mlp.outputs = 1; //regressor network: one continuous output
//---
vector v2 = {(double)mlp.outputs}; //Adding the output layer to the mix of hidden layers
HL_CONFIG = MatrixExtend::concatenate(HL_CONFIG, v2);
mlp.hidden_layers = HL_CONFIG.Size();
W_CONFIG.Resize(HL_CONFIG.Size());
//--- x and y must describe the same number of samples
if (y.Size() != rows)
{
Print(__FUNCTION__," FATAL | Number of rows in the x matrix is not the same the y vector size ");
return backprop_struct;
}
matrix W, B;
//--- GENERATE WEIGHTS
this.Weights_tensor = new CTensors((uint)mlp.hidden_layers);
this.Bias_tensor = new CTensors((uint)mlp.hidden_layers);
this.Input_tensor = new CTensors((uint)mlp.hidden_layers);
this.Output_tensor = new CTensors((uint)mlp.hidden_layers);
ulong layer_input = mlp.inputs;
//--- NOTE(review): the loop body that fills the weight/bias tensors is
//--- missing here (extraction artifact) -- the next line fuses the loop
//--- header with a later Print statement.
for (ulong i=0; i\n",
"HL_CONFIG ",HL_CONFIG," TOTAL HL(S) ",mlp.hidden_layers,"\n",
"W_CONFIG ",W_CONFIG," ACTIVATION ",EnumToString(A_FX),"\n",
"NN INPUTS ",mlp.inputs," OUTPUT ",mlp.outputs
);
//--- Optimizer
//--- NOTE(review): optimizer_weights/optimizer_bias are object copies
//--- built from the caller's pointer; the OptimizerMinBGD objects
//--- declared inside the if-block SHADOW them and are destroyed at the
//--- closing brace, so the batch path still updates with the RMSprop
//--- copies -- this looks like a bug worth confirming upstream.
OptimizerRMSprop optimizer_weights = optimizer;
OptimizerRMSprop optimizer_bias = optimizer;
if (batch_size>0)
{
OptimizerMinBGD optimizer_weights;
OptimizerMinBGD optimizer_bias;
}
//--- Cross validation: 10 folds feed the per-epoch validation loss
CCrossValidation cross_validation;
CTensors *cv_tensor;
matrix validation_data = MatrixExtend::concatenate(x, y);
matrix validation_x;
vector validation_y;
cv_tensor = cross_validation.KFoldCV(validation_data, 10); //k-fold cross validation | 10 folds selected
//---
matrix DELTA = {};
double actual=0, pred=0;
matrix temp_inputs ={};
matrix dB = {}; //Bias Derivatives
matrix dW = {}; //Weight Derivatives
//--- NOTE(review): the epoch loop header below is fused with the
//--- backward layer loop (extraction artifact).
for (ulong epoch=0; epoch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
}
else //Batch Gradient Descent
{
//--- Same backward pass as above, run once per mini-batch.
//--- NOTE(review): batch loop header fused with the layer loop
//--- (extraction artifact).
for (uint batch=0, batch_start=0, batch_end=batch_size; batch=0 && !IsStopped(); layer--) //Loop through the network backward from last to first layer
{
Partial_Derivatives = this.Output_tensor.Get(int(layer));
temp_inputs = this.Input_tensor.Get(int(layer));
Partial_Derivatives.Derivative(Partial_Derivatives, ENUM_ACTIVATION_FUNCTION(A_FX));
if (mlp.hidden_layers-1 == layer) //Last layer
{
LossGradient = pred_v.LossGradient(actual_v, ENUM_LOSS_FUNCTION(m_loss_function));
DELTA.Col(LossGradient, 0);
}
else
{
W = this.Weights_tensor.Get(layer+1);
DELTA = (W.Transpose().MatMul(DELTA)) * Partial_Derivatives;
}
//-- Observation | DeLTA matrix is same size as the bias matrix
W = this.Weights_tensor.Get(layer);
B = this.Bias_tensor.Get(layer);
//--- Derivatives wrt weights and bias
dB = DELTA;
dW = DELTA.MatMul(temp_inputs.Transpose());
//--- Weights updates
optimizer_weights.update(W, dW);
optimizer_bias.update(B, dB);
this.Weights_tensor.Add(W, layer);
this.Bias_tensor.Add(B, layer);
}
}
pred_v = predict(batch_x);
batch_loss[batch] = pred_v.Loss(batch_y, ENUM_LOSS_FUNCTION(m_loss_function));
batch_loss[batch] = MathIsValidNumber(batch_loss[batch]) ? (batch_loss[batch]>1e6 ? 1e6 : batch_loss[batch]) : 1e6; //Check for nan and return some large value if it is nan
batch_accuracy[batch] = Metrics::r_squared(batch_y, pred_v);
if (show_batch_progress)
printf("----> batch[%d/%d] batch-loss %.5f accuracy %.3f",batch+1,num_batches,batch_loss[batch], batch_accuracy[batch]);
}
}
//--- End of an epoch
vector validation_loss(cv_tensor.SIZE);
vector validation_acc(cv_tensor.SIZE);
//--- NOTE(review): the validation loop below is fused with the loss
//--- clamping (extraction artifact). NaN/oversized losses clamp to 1e6.
for (ulong i=0; i1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
else
{
backprop_struct.training_loss[epoch] = batch_loss.Mean();
backprop_struct.training_loss[epoch] = MathIsValidNumber(backprop_struct.training_loss[epoch]) ? (backprop_struct.training_loss[epoch]>1e6 ? 1e6 : backprop_struct.training_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
backprop_struct.validation_loss[epoch] = validation_loss.Mean();
backprop_struct.validation_loss[epoch] = MathIsValidNumber(backprop_struct.validation_loss[epoch]) ? (backprop_struct.validation_loss[epoch]>1e6 ? 1e6 : backprop_struct.validation_loss[epoch]) : 1e6; //Check for nan and return some large value if it is nan
}
double epoch_stop = GetTickCount();
printf("--> Epoch [%d/%d] training -> loss %.8f accuracy %.3f validation -> loss %.5f accuracy %.3f | Elapsed %s ",epoch+1,epochs,backprop_struct.training_loss[epoch],Metrics::r_squared(y, pred_v),backprop_struct.validation_loss[epoch],validation_acc.Mean(),this.ConvertTime((epoch_stop-epoch_start)/1000.0));
}
isBackProp = false;
//--- free the forward-pass tensors; weights/biases are kept for predict()
if (CheckPointer(this.Input_tensor) != POINTER_INVALID) delete(this.Input_tensor);
if (CheckPointer(this.Output_tensor) != POINTER_INVALID) delete(this.Output_tensor);
//--- NOTE(review): the caller-supplied optimizer is deleted here, i.e.
//--- this function takes ownership of the pointer.
if (CheckPointer(optimizer)!=POINTER_INVALID)
delete optimizer;
return backprop_struct;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
void CRegressorNets::fit(const matrix &x, const vector &y, OptimizerSGD *optimizer, const uint epochs, uint batch_size=0, bool show_batch_progress=false)
{
trained = true; //The fit method has been called
vector epochs_vector(epochs); for (uint i=0; i
//--- Weight-initialization schemes selectable for network layers.
//--- NOTE(review): "INTIALIZER" is a typo of "INITIALIZER", but the
//--- identifiers are public API and are therefore kept as-is.
enum enum_weight_initializers
{
WEIGHT_INTIALIZER_XAVIER, //Xavier weights
WEIGHT_INTIALIZER_HE, //He weights
WEIGHT_INTIALIZER_RANDOM //Random weights
};
//+------------------------------------------------------------------+
//| defines |
//+------------------------------------------------------------------+
class CWeightsInitializers
{
protected:
static double random() //Generates a random float between 0 (inclusive) and 1 (exclusive)
{
return 0 + double((MathRand() / 32767.0) * (0.9 - 0));
}
static double uniform(double low, double high)
{
return low + (high - low) * random();
}
static matrix uniform(double low, double high, ulong rows, ulong cols)
{
matrix return_matrix(rows, cols);
for (ulong i=0; i
#include
#include
#include
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Self-Organizing (Kohonen) Map clusterer.
//--- Usage: construct with hyperparameters, call fit(x), then predict().
class CKohonenMaps
{
protected:
C2DTensor *cluster_tensor; //per-cluster storage, allocated in fit()
CPlots plt; //plotting helper
double Euclidean_distance(const vector &v1, const vector &v2);
string CalcTimeElapsed(double seconds);
matrix c_matrix; //Clusters
matrix w_matrix; //Weights matrix (features x clusters, random-initialized in fit)
vector w_vector; //weights vector
matrix o_matrix; //Output layer matrix
uint m_clusters; //requested number of clusters
double m_alpha; //learning rate
uint m_epochs; //training passes over the data
int m_random_state; //seed for reproducible weight initialization
ulong n, m; //n = number of features (set in fit); m = clusters (set in ctor)
public:
CKohonenMaps(uint clusters=2, double alpha=0.01, uint epochs=100, int random_state=42);
~CKohonenMaps(void);
void fit(const matrix &x); //learn the weight map from the dataset
int predict(const vector &x); //cluster assignment for one sample -- TODO confirm return semantics
vector predict(const matrix &x); //cluster assignments for many samples
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CKohonenMaps::CKohonenMaps(uint clusters=2, double alpha=0.01, uint epochs=100, int random_state=42)
{
//--- Store the hyperparameters; no training happens until fit() is called.
this.m_clusters = clusters;
this.m = clusters; //m mirrors the cluster count used to size the weight matrix in fit()
this.m_alpha = alpha; //learning rate
this.m_epochs = epochs; //training passes
this.m_random_state = random_state; //seed for reproducible weight initialization
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
void CKohonenMaps::fit(const matrix &x)
{
n = (uint)x.Cols(); //number of features
ulong rows = x.Rows();
cluster_tensor = new C2DTensor();
cluster_tensor.Init((int)m);
w_matrix =MatrixExtend::Random(0.0, 1.0, n, m, m_random_state);
#ifdef DEBUG_MODE
Print("w x\n",w_matrix,"\nMatrix\n",x);
#endif
vector D(m); //Euclidean distance btn clusters
for (uint epoch=0; epoch= 60)
time_str = StringFormat("%d Minutes and %.3f Seconds ",minutes=(int)round(seconds/60.0), ((int)seconds % 60));
if (minutes >= 60)
time_str = StringFormat("%d Hours %d Minutes and %.3f Seconds ",hours=(int)round(minutes/60.0), minutes, ((int)seconds % 60));
else
time_str = StringFormat("%.3f Seconds ",seconds);
return time_str;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
================================================
FILE: Neural Networks/optimizers.mqh
================================================
//+------------------------------------------------------------------+
//| optimizers.mqh |
//| Copyright 2023, Omega Joctan |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2023, Omega Joctan"
#property link "https://www.mql5.com/en/users/omegajoctan"
//+------------------------------------------------------------------+
//|Class containing optimizers for updating neural network parameters|
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| |
//| Adam (Adaptive Moment Estimation): Adam is an adaptive learning |
//| rate optimizer that maintains learning rates for each parameter |
//| and adapts them based on the first and second moments of the |
//| gradients. It's known for its fast convergence and robustness to |
//| noisy gradients |
//| |
//+------------------------------------------------------------------+
/*enum Optimizer {
OPTIMIZER_SGD, //Stochastic Gradient Descent
OPTIMIZER_MiniBatchGD, //Mini-Batch Gradiend Descent
OPTIMIZER_Adam, //Adaptive Moment Estimation
OPTIMIZER_RMSprop, //Root Mean Square Propagation
OPTIMIZER_Adagrad, //Adaptive Gradient Descent
OPTIMIZER_Adadelta, //Adadelta
OPTIMIZER_Nadam //Nesterov-accelerated Adaptive Moment Estimation
};
*/
//--- Adam optimizer: per-parameter adaptive learning rates built from
//--- exponential moving averages of gradients and squared gradients.
class OptimizerAdam
{
protected:
int time_step; //number of update() calls so far; drives bias correction
double m_learning_rate; //base step size
double m_beta1; //decay rate of the first moment estimate
double m_beta2; //decay rate of the second moment estimate
double m_epsilon; //small constant guarding against division by zero
matrix moment; //first moment estimate (moving average of gradients)
matrix cache; //second moment estimate (moving average of squared gradients)
public:
OptimizerAdam(double learning_rate=0.01, double beta1=0.9, double beta2=0.999, double epsilon=1e-8);
~OptimizerAdam(void);
//--- NOTE(review): "¶meters" looks like an encoding artifact of
//--- "&parameters" introduced during extraction -- confirm upstream.
virtual void update(matrix ¶meters, matrix &gradients);
};
//+------------------------------------------------------------------+
//| Initializes the Adam optimizer with hyperparameters. |
//| |
//| learning_rate: Step size for parameter updates |
//| beta1: Decay rate for the first moment estimate |
//| (moving average of gradients). |
//| beta2: Decay rate for the second moment estimate |
//| (moving average of squared gradients). |
//| epsilon: Small value for numerical stability. |
//+------------------------------------------------------------------+
OptimizerAdam::OptimizerAdam(double learning_rate=0.010000, double beta1=0.9, double beta2=0.999, double epsilon=1e-8)
{
//--- Hyperparameters are fixed at construction time; the moment and
//--- cache matrices are sized lazily on the first call to update().
this.time_step = 0; //counts update() calls, used for bias correction
this.m_learning_rate = learning_rate;
this.m_beta1 = beta1; //first-moment decay rate
this.m_beta2 = beta2; //second-moment decay rate
this.m_epsilon = epsilon; //numerical-stability constant
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
OptimizerAdam::~OptimizerAdam(void)
{
//--- nothing to release: all optimizer state is held by value
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Applies one Adam step to `parameters` in place, using `gradients`
//--- and the internally kept first/second moment estimates.
void OptimizerAdam::update(matrix &parameters, matrix &gradients)
{
//--- Lazily (re)create the optimizer state whenever the parameter shape
//--- differs from the stored state (covers the very first call too).
const ulong n_rows = parameters.Rows();
const ulong n_cols = parameters.Cols();
if (this.moment.Rows() != n_rows || this.moment.Cols() != n_cols)
{
this.moment.Resize(n_rows, n_cols);
this.moment.Fill(0.0);
}
if (this.cache.Rows() != n_rows || this.cache.Cols() != n_cols)
{
this.cache.Resize(n_rows, n_cols);
this.cache.Fill(0.0);
}
//--- Advance the step counter consumed by the bias correction below
this.time_step++;
//--- Exponential moving averages of the gradients and squared gradients
this.moment = this.m_beta1 * this.moment + (1 - this.m_beta1) * gradients;
this.cache = this.m_beta2 * this.cache + (1 - this.m_beta2) * MathPow(gradients, 2);
//--- Bias-corrected estimates (counteract the zero initialization)
matrix m_hat = this.moment / (1 - MathPow(this.m_beta1, this.time_step));
matrix v_hat = this.cache / (1 - MathPow(this.m_beta2, this.time_step));
//--- Parameter step: lr * m_hat / (sqrt(v_hat) + eps), element-wise
parameters -= (this.m_learning_rate * m_hat) / (MathPow(v_hat, 0.5) + this.m_epsilon);
}
//+------------------------------------------------------------------+
//| |
//| |
//| Stochastic Gradient Descent (SGD): |
//| |
//| This is the simplest optimizer |
//| It updates the parameters using the gradients of the loss |
//| function computed on individual training samples or mini-batches.|
//| |
//| |
//+------------------------------------------------------------------+
//--- Plain gradient descent: parameters -= learning_rate * gradients.
class OptimizerSGD
{
protected:
double m_learning_rate; //fixed step size applied on every update
public:
OptimizerSGD(double learning_rate=0.01);
~OptimizerSGD(void);
//--- NOTE(review): "¶meters" appears to be mojibake of "&parameters"
//--- introduced during extraction -- confirm upstream.
virtual void update(matrix ¶meters, matrix &gradients);
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
OptimizerSGD::OptimizerSGD(double learning_rate=0.01)
{
//--- the only state SGD needs is its step size
this.m_learning_rate = learning_rate;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
OptimizerSGD::~OptimizerSGD(void)
{
//--- no resources to release
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- One vanilla gradient-descent step, applied to `parameters` in place.
void OptimizerSGD::update(matrix &parameters, matrix &gradients)
{
//--- move each parameter against its gradient, scaled by the
//--- learning rate (element-wise matrix arithmetic)
parameters = parameters - (this.m_learning_rate * gradients);
}
//+------------------------------------------------------------------+
//| Batch Gradient Descent (BGD): This optimizer computes the |
//| gradients of the loss function on the entire training dataset |
//| and updates the parameters accordingly. It can be slow and |
//| memory-intensive for large datasets but tends to provide a |
//| stable convergence. |
//+------------------------------------------------------------------+
//--- Marker subclass used for mini-batch training; it adds no state and
//--- inherits update() unchanged from OptimizerSGD. Batching itself is
//--- presumably handled by the caller -- TODO confirm against trainers.
class OptimizerMinBGD: public OptimizerSGD
{
public:
OptimizerMinBGD(double learning_rate=0.01);
~OptimizerMinBGD(void);
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
OptimizerMinBGD::OptimizerMinBGD(double learning_rate=0.010000): OptimizerSGD(learning_rate)
{
//--- forwards the learning rate to the OptimizerSGD base; no extra state
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
OptimizerMinBGD::~OptimizerMinBGD(void)
{
//--- no resources to release
}
//+------------------------------------------------------------------+
//| |
//| |
//| |
//| RMSprop (Root Mean Square Propagation): RMSprop is similar to    |
//| Adam but adapts the learning rates using only a moving average   |
//| of the squared gradients (the second moment), with no momentum   |
//| term. It's effective in handling non-stationary objectives and   |
//| can converge quickly for many problems.                          |
//| |
//| |
//+------------------------------------------------------------------+
class OptimizerRMSprop
{
protected:
double m_learning_rate;
double m_decay_rate;
double m_epsilon;
matrix cache;
//Dividing double/matrix causes compilation error | this is the fix to the issue
matrix divide(const double numerator, const matrix &denominator)
{
matrix res = denominator;
for (ulong i=0; i
M A L E 5
A python-like Machine Learning Library for MQL5
English | Russian
## About the Project
MALE5 is a machine-learning repository for creating trading systems in the c++ like, MQL5 programming language.
It was developed to help build machine learning-based trading robots, effortlessly in the [MetaTrader5](https://www.metatrader5.com/en/automated-trading/metaeditor) platform
**My goal is to make the library**
- **Python-Like, Simple to use**
- **Flexible:** To be usable within a Trading Robot(EA), Custom Indicator, and Scripts.
- **Resource-efficient:** To make it not consume a lot of resources and memory.
**Disclaimer**
*This project is not for MQL5 programming language beginners. Those with prior experience of machine learning using python might find this project easy to understand*
## Installing
Download the zip file from the releases section extract the library. Go under MQL5 folder in your MetaEditor, from there paste the MALE5 directory you extracted under the Include folder.

## Getting Started with the Library
In this project, machine learning models can be placed into three categories. *See the tables below*.
## 01: Predictive Models
Unlike others which are mostly used for analysis and data processing. These AI models when given an inputs (predictors) in matrices or vectors they provide predictions. Currently Available models include.
| **Model Type** | **Models** |
|------------------------------|----------------------------------|
| **Linear Models** | - Linear regression |
| | - Logistic regression |
| | - Ridge regression |
| | - Polynomial regression |
| **Decision Trees** | - Decision tree |
| **Ensemble Models** | - AdaBoost tree |
| | - Random forest |
| **Support Vector Machine** | - SVM |
| **Neural Networks** | - Regressor Neural Networks |
| | - Pattern Recognition Neural Networks |
| | - Kohonen Maps |
| **Naïve Bayes** | - Naïve Bayes models |
### Training the predictive models
All the predictive models' functions for training and deployment follow similar patterns.
[](https://www.youtube.com/watch?v=wKk85PZ2ra8&t=1s)
#### For Regression Problems
A regression problem is a type of predictive modeling problem where the goal is to predict a continuous output variable based on one or more input features. In other words, given input data, the model aims to determine a continuous value. For example, predicting the next closing price of a financial instrument.
**How Regression Models Work**
Firstly, we import the necessary libraries we need. In this example, we will be using the Decision Tree Regressor.
```MQL5
#include
#include
#include //helper functions for data manipulations
#include //for measuring the performance
StandardizationScaler scaler; //standardization scaler from preprocessing.mqh
CDecisionTreeRegressor *decision_tree; //a decision tree regressor model
```
1. **Data Collection**
Gather a dataset with input features (also called predictors or attributes) and the corresponding target variable (the output).
```MQL5
vector open, high, low, close;
int data_size = 1000;
//--- Getting the open, high, low, and close values for the past 1000 bars, starting from the recent closed bar of 1
open.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_OPEN, 1, data_size);
high.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_HIGH, 1, data_size);
low.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_LOW, 1, data_size);
close.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_CLOSE, 1, data_size);
matrix X(data_size, 3); //creating the X matrix
//--- Assigning the open, high, and low price values to the X matrix
X.Col(open, 0);
X.Col(high, 1);
X.Col(low, 2);
vector y = close; // The target variable is the close price
```
2. **Preprocessing**
This involves cleaning and preprocessing the data, which might involve handling missing values, normalizing the data, and encoding categorical variables if possible in the data.
```MQL5
//--- We split the data into training and testing samples for training and evaluation
matrix X_train, X_test;
vector y_train, y_test;
double train_size = 0.7; //70% of the data should be used for training, the rest for testing
int random_state = 42; //we put a random state to shuffle the data
MatrixExtend::TrainTestSplitMatrices(X, y, X_train, y_train, X_test, y_test, train_size, random_state); // we split the X and y data into training and testing samples
//--- Normalizing the independent variables
X_train = scaler.fit_transform(X_train); // fit the scaler on the training data and transform the data
X_test = scaler.transform(X_test); // transform the test data
// Print the processed data for verification
//Print("X_train\n",X_train,"\nX_test\n",X_test,"\ny_train\n",y_train,"\ny_test\n",y_test);
```
3. **Model Selection**
Choose a regression algorithm. Common algorithms for this type of problem include linear regression, decision trees, support vector regression (SVR), k-nearest neighbors (K-NN), and neural networks.
```MQL5
//--- Model selection
decision_tree = new CDecisionTreeRegressor(2, 5); //a decision tree regressor from DecisionTree class
```
4. **Training**
Use the training data to teach the model how to map input features to the correct continuous output values. During training, the model learns patterns in the data.
```MQL5
//--- Training the model
decision_tree.fit(X_train, y_train); // The training function
```
5. **Evaluation**
Assess the model's performance on a separate test dataset to ensure it can generalize well to new, unseen data. Metrics like R-squared (R²) score, mean absolute error (MAE), and root mean squared error (RMSE) are often used to evaluate the model.
```MQL5
//--- Measuring predictive accuracy
vector train_predictions = decision_tree.predict(X_train);
printf("Decision Tree training R² score = %.3f ", Metrics::r_squared(y_train, train_predictions));
//--- Evaluating the model on out-of-sample predictions
vector test_predictions = decision_tree.predict(X_test);
printf("Decision Tree out-of-sample R² score = %.3f ", Metrics::r_squared(y_test, test_predictions));
```
6. **Prediction**
Once trained and evaluated, the model can be used to predict the continuous values of new, unseen data points.
```MQL5
void OnTick()
{
//--- Making predictions live from the market
CopyRates(Symbol(), PERIOD_D1, 1, 1, rates); // Get the very recent information from the market
vector x = {rates[0].open, rates[0].high, rates[0].low}; // Assigning data from the recent candle in a similar way to the training data
double predicted_close_price = decision_tree.predict(x);
Comment("Next closing price predicted is = ", predicted_close_price);
}
```
**Types of Regression**
- **Simple Linear Regression:** Predicting a continuous target variable based on a single input feature.
- **Multiple Linear Regression:** Predicting a continuous target variable based on multiple input features.
- **Polynomial Regression:** Predicting a continuous target variable using polynomial terms of the input features.
- **Non-Linear Regression:** Predicting a continuous target variable using non-linear relationships between input features and the target variable.
#### For Classification Problems
A classification problem is a type of predictive modeling problem where the goal is to predict the category or class that a given data point belongs to. In other words, given input data, the model aims to determine which of the predefined classes the input belongs to. For example, predicting whether the next candle will be bullish or bearish.
**How Classification Models Work**
Firstly, we import the necessary libraries we need. In this example we will be using the Decision Tree Classifier.
```MQL5
#include
#include
#include //helper functions for data manipulations
#include //fo measuring the performance
StandardizationScaler scaler; //standardization scaler from preprocessing.mqh
CDecisionTreeClassifier *decision_tree; //a decision tree classifier model
```
1. **Data Collection**
Gather a dataset with input features (also called predictors or attributes) and the corresponding class labels (the output).
>
```MQL5
vector open, high, low, close;
int data_size = 1000;
//--- Getting the open, high, low and close values for the past 1000 bars, starting from the recent closed bar of 1
open.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_OPEN, 1, data_size);
high.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_HIGH, 1, data_size);
low.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_LOW, 1, data_size);
close.CopyRates(Symbol(), PERIOD_D1, COPY_RATES_CLOSE, 1, data_size);
decision_tree = new CDecisionTreeClassifier(2, 5);
matrix X(data_size, 3); //creating the x matrix
//--- Assigning the open, high, and low price values to the x matrix
X.Col(open, 0);
X.Col(high, 1);
X.Col(low, 2);
```
2. **Preprocessing**
This involves cleaning and preprocessing the data, which might include techniques such as handling missing values, **normalizing the data**, and encoding categorical variables.
```MQL5
//--- We split the data into training and testing samples for training and evaluation
matrix X_train, X_test;
vector y_train, y_test;
double train_size = 0.7; //70% of the data should be used for training the rest for testing
int random_state = 42; //we put a random state to shuffle the data so that a machine learning model understands the patterns and not the order of the dataset, this makes the model durable
MatrixExtend::TrainTestSplitMatrices(X, y, X_train, y_train, X_test, y_test, train_size, random_state); // we split the x and y data into training and testing samples
//--- Normalizing the independent variables
X_train = scaler.fit_transform(X_train); // we fit the scaler on the training data and transform the data alltogether
X_test = scaler.transform(X_test); // we transform the new data this way
//Print("X_train\n",X_train,"\nX_test\n",X_test,"\ny_train\n",y_train,"\ny_test\n",y_test);
```
3. **Model Selection**
Choose a classification algorithm. Common algorithms for this type of problem include; logistic regression, decision trees, support vector machines (SVM), k-nearest neighbors (K-NN), and neural networks.
```MQL5
//--- Model selection
decision_tree = new CDecisionTreeClassifier(2, 5); //a decision tree classifier from DecisionTree class
```
4. **Training**
Use the training data to teach the model how to map input features to the correct class labels. During training, the model learns patterns in the data.
```MQL5
//--- Training the model
decision_tree.fit(X_train, y_train); //The training function
```
5. **Evaluation**
Assess the model's performance on a separate test dataset to ensure it can generalize well to new, unseen data. Metrics like accuracy score, precision, recall, and F1 score are often used to evaluate the model.
```MQL5
//--- Measuring predictive accuracy
vector train_predictions = decision_tree.predict_bin(X_train);
printf("Decision decision_tree training accuracy = %.3f ",Metrics::accuracy_score(y_train, train_predictions));
//--- Evaluating the model on out-of-sample predictions
vector test_predictions = decision_tree.predict_bin(X_test);
printf("Decision decision_tree out-of-sample accuracy = %.3f ",Metrics::accuracy_score(y_test, test_predictions));
```
6. **Prediction**
Once trained and evaluated, the model can be used to predict the class labels of new, unseen data points.
Unlike the `predict` function, which is used to obtain predictions from regressors, the predictive functions for classifiers have slightly different names, each starting with the word predict.
- **predict_bin** - Predicts the classes as integer values for classification models. For example: the next candle will be ***bullish*** or ***bearish***
- **predict_proba** - Predicts the probabilities of the classes as double values, from 0 (a 0% chance) to 1 (a 100% chance). For example: [0.64, 0.36] means the probability that the next candle will be bullish is 64%, while the probability that it will be bearish is 36%
```
void OnTick()
{
//--- Making predictions live from the market
CopyRates(Symbol(), PERIOD_D1, 1, 1, rates); //Get the very recent information from the market
vector x = {rates[0].open, rates[0].high, rates[0].low}; //Assigning data from the recent candle in a similar way to the training data
double predicted_close_price = decision_tree.predict_bin(x);
Comment("Next closing price predicted is = ",predicted_close_price);
}
```
**Types of Classification**
- **Binary Classification:** There are only two classes. For example, classifying emails as spam or not spam.
- **Multiclass Classification:** There are more than two classes. For example, classifying types of animals in an image (e.g., cats, dogs, birds).
- **Multilabel Classification:** Each instance can be assigned multiple classes. For example, tagging a photo with multiple labels like "beach", "sunset", and "vacation".
## 02: Clustering Algorithms
These algorithms serve the special purpose of classifying and grouping data with similar patterns and contents together; they excel in data-mining situations.
| **Model Type** | **Models** |
|------------------------------|----------------------------------|
| **Nearest Neighbors** | - KNN nearest neighbors |
| **K-Means Clustering** | - k-Means clustering algorithm |
| **Neural Networks** | - Kohonen Maps |
## 03: Dimensionality Reduction Algorithms
These algorithms are widely used in situations where the dataset is huge and needs adjustment. They excel at reducing the size of datasets without losing much information. Consider them the algorithms that zip and shred information in the proper way.
| **Model Type** | **Models** |
|----------------------------------------|-------------------------------------|
| **Dimensionality Reduction Algorithms**| - Linear Discriminant Analysis (LDA)|
| | - Non Negative Matrix Factorization (NMF) |
| | - Principal Component Analysis (PCA) |
| | - Truncated SVD |
## Basic Library functionality & helpers
* [MatrixExtend (MatrixExtend.mqh)](https://github.com/MegaJoctan/MALE5/wiki#matrixextendmatrixextendmqh)
* [Cross Validation Library (cross_validation.mqh)](https://github.com/MegaJoctan/MALE5/wiki/Cross-Validation-Library)
* [Linear Algebra Library (linalg.mqh)](https://github.com/MegaJoctan/MALE5/wiki/Linear-Algebra-Library)
* [Kernels library (kernels.mqh)](https://github.com/MegaJoctan/MALE5/wiki/Kernels-Library)
* [Metrics library (metrics.mqh)](https://github.com/MegaJoctan/MALE5/wiki/Metrics-library)
* [Pre-processing library (preprocessing.mqh)](https://github.com/MegaJoctan/MALE5/wiki/Pre-processing-library)
* [Tensor library (Tensor.mqh)](https://github.com/MegaJoctan/MALE5/wiki/Tensor-Library)
## Opening an issue
You can also post bug reports and feature requests (only) in [GitHub issues](https://github.com/MegaJoctan/MALE5/issues).
## Support the Project
If you find this project helpful, Support us by taking one or more of the actions
[BuyMeCoffee](https://www.buymeacoffee.com/omegajoctan)
[OurProducts](https://www.mql5.com/en/users/omegajoctan/seller)
Register to our recommended broker:
[ICMarkets](https://icmarkets.com/?camp=74639)
## Let's work together
[HIRE ME on MQL5.com by clicking on this link](https://www.mql5.com/en/job/new?prefered=omegajoctan)
================================================
FILE: Sklearn/Cluster/DBSCAN.mqh
================================================
//+------------------------------------------------------------------+
//| DBSCAN.mqh |
//| Copyright 2023, Omega Joctan |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2023, Omega Joctan"
#property link "https://www.mql5.com/en/users/omegajoctan"
#include
#include
//+------------------------------------------------------------------+
//| defines |
//+------------------------------------------------------------------+
//--- DBSCAN density-based clustering.
//--- epsilon: neighborhood radius (presumably consumed by get_neighbors;
//--- its body is garbled in this extract -- TODO confirm);
//--- min_samples: minimum neighbor count needed to grow a cluster
//--- (compared against neighbor counts in expand_cluster).
class CDBSCAN
{
protected:
double m_epsilon; //neighborhood radius
uint m_minsamples; //density threshold for expanding clusters
vector labels; //per-row labels filled by fit_predict (0 = unvisited; -1 apparently noise -- TODO confirm)
vector get_neighbors(matrix &x, ulong point_index);
bool expand_cluster(matrix &x, ulong point_index, ulong cluster_id, const vector &neighbors, const vector &cluster_labels);
public:
CDBSCAN(double epsilon, uint min_samples);
~CDBSCAN(void);
vector fit_predict(matrix &x);
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CDBSCAN::CDBSCAN(double epsilon, uint min_samples)
{
//--- epsilon: neighborhood radius; min_samples: density threshold
this.m_epsilon = epsilon;
this.m_minsamples = min_samples;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CDBSCAN::~CDBSCAN(void)
{
//--- no dynamically allocated members to release
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
vector CDBSCAN::get_neighbors(matrix &x, ulong point_index)
{
vector neighbors = {};
for (ulong i=0, count=0; i0)
{
vector current_point = {points_to_explore[0]};
points_to_explore.Resize(0);
Print("current point: ", current_point);
vector current_neighbors = this.get_neighbors(x, (int)current_point[0]);
if (current_neighbors.Size() >= this.m_minsamples)
for (int neighbor_index=0; neighbor_index<(int)current_neighbors.Size(); neighbor_index++)
{
if (this.labels[neighbor_index] == 0 || this.labels[neighbor_index] == -1)
{
if (this.labels[neighbor_index] == 0)
{
points_to_explore.Resize(1);
points_to_explore[0] = neighbor_index;
Print("points to explore: ",points_to_explore);
}
this.labels[neighbor_index] = (int)cluster_id;
}
}
}
return true;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- NOTE(review): truncated during extraction — the loop body and the
//--- return statement were lost where '<'...'>' text was stripped.
//--- Kept byte-identical; restore from the original repository.
vector CDBSCAN::fit_predict(matrix &x)
{
//--- label 0 means "not yet visited"
this.labels.Resize(x.Rows()); labels.Fill(0);
ulong cluster_id = 0;
for (ulong i=0; i
CGraphic graph;
#include
//+------------------------------------------------------------------+
//--- error codes reported by CKMeans::ErrMsg
enum errors
{
KM_ERR001, //clusters not matching in size Error
KM_ERR002  //unspecified/reserved error code (no message defined in ErrMsg)
};
//+------------------------------------------------------------------+
//--- K-Means clustering over the rows of a data matrix.
class CKMeans
{
private:
ulong n; //number of samples
uint m_clusters;          //number of clusters k
ulong m_cols;             //number of features (matrix columns)
matrix InitialCentroids;  //current centroid matrix [k x m_cols]
vector cluster_assign;    //per-sample cluster index
protected:
matrix Matrix;            //private copy of the training data
bool ErrMsg(errors err);
//--- draws a scatter/curve plot of the clustered data
bool ScatterCurvePlots(
string obj_name,
double &x[],
double &y[],
double &curveArr[],
string legend,
string x_axis_label = "x-axis",
string y_axis_label = "y-axis",
color clr = clrDodgerBlue,
bool points_fill = true
);
public:
CKMeans(const matrix &_Matrix, int clusters=3);
~CKMeans(void);
//--- runs k-means; outputs the clustered data and the final centroids
//--- fixed mojibake: "&cent" had been corrupted to the cent sign (¢)
void KMeansClustering(matrix &clustered_matrix, matrix &centroids, int iterations = 1, bool rand_cluster =false);
//--- plots WCSS for k = initial_k..total_k to pick the elbow
void ElbowMethod(const int initial_k=1, int total_k=10, bool showPlot = true);
void FilterZero(vector &vec);
void matrixtoArray(matrix &mat, double &Array[]);
};
//+------------------------------------------------------------------+
CKMeans::CKMeans(const matrix &_Matrix, int clusters=3)
{
//--- keep a private copy so later calls are unaffected by changes
//--- to the caller's matrix
Matrix.Copy(_Matrix);
//--- cache the dataset dimensions
n = Matrix.Rows();      //number of samples
m_cols = Matrix.Cols(); //number of features
m_clusters = clusters;  //requested number of clusters
}
//+------------------------------------------------------------------+
CKMeans::~CKMeans(void)
{
//--- reset internal state; ZeroMemory on value members is harmless
ZeroMemory(m_clusters);
ZeroMemory(InitialCentroids);
ZeroMemory(cluster_assign);
}
//+------------------------------------------------------------------+
//--- NOTE(review): damaged during extraction — "&centroids" was corrupted
//--- to "¢roids" and the main iteration body was lost where '<'...'>'
//--- text was stripped. Kept byte-identical; restore from the repo.
void CKMeans::KMeansClustering(matrix &clustered_matrix, matrix ¢roids, int iterations = 1, bool rand_cluster =false)
{
//--- allocate outputs and working buffers
InitialCentroids.Resize(m_clusters, m_cols);
cluster_assign.Resize(n);
clustered_matrix.Resize(m_clusters, m_cols*n);
clustered_matrix.Fill(NULL);
vector cluster_comb_v = {};
matrix cluster_comb_m = {};
vector rand_v = {};
ulong rand_ = 0;
for(ulong i=0; i= m_clusters)
break;
}
} //end of iterations
//--- publish the final centroids to the caller
ZeroMemory(centroids);
centroids.Copy(InitialCentroids);
}
//+------------------------------------------------------------------+
bool CKMeans::ErrMsg(errors err)
{
//--- print a human-readable message for the known error codes;
//--- unknown codes are silently ignored
if (err == KM_ERR001)
printf("%s Clusters not matching in Size ", EnumToString(KM_ERR001));
//--- always reports success, matching the original contract
return(true);
}
//+------------------------------------------------------------------+
//--- NOTE(review): truncated during extraction — the k-loop body and the
//--- plotting code were lost. Kept byte-identical; restore from the repo.
void CKMeans::ElbowMethod(const int initial_k=1, int total_k=10, bool showPlot = true)
{
matrix clustered_mat, _centroids = {};
//--- k can never exceed the number of samples
if(total_k > (int)n)
total_k = (int)n; //k should always be less than n
vector centroid_v= {}, x_y_z= {};
vector short_v = {}; //vector for each point
vector minus_v = {}; //vector to store the minus operation output
double wcss = 0;
double WCSS[];
ArrayResize(WCSS, total_k);
double kArray[];
ArrayResize(kArray, total_k);
for(int k=initial_k, count_k=0; k
#include
#include
//+------------------------------------------------------------------+
//| defines |
//+------------------------------------------------------------------+
//--- shared helpers for the clustering classes
class BaseClustering
{
public:
BaseClustering(void);
~BaseClustering(void);
//--- selects rows (axis=0) or columns (axis=1) of X by the given indices
static matrix Get(matrix &X, vector &index, int axis=0);
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
matrix BaseClustering::Get(matrix &X, vector &index, int axis=0)
{
matrix ret_matrix = {};
ulong row_col=0;
bool isRows = true;
//--- decide whether the indices address rows or columns
switch(axis)
{
case 0:
row_col = X.Rows();
isRows = true;
break;
case 1:
row_col = X.Cols();
isRows = false;
break;
default:
printf("%s Invalid axis %d ",__FUNCTION__,axis);
return ret_matrix;
break;
}
//---
//--- output keeps the non-indexed dimension of X unchanged
ret_matrix.Resize(isRows?index.Size():X.Rows(), isRows?X.Cols(): index.Size());
//--- NOTE(review): the copy loop below was truncated during extraction
//--- (text between '<' and '>' stripped); restore from the repo.
for (ulong i=0, count=0; i
#include
enum lda_criterion //selecting best components criteria selection
{
CRITERION_VARIANCE,   //keep components explaining a cumulative-variance threshold
CRITERION_KAISER,     //keep components with eigenvalue >= 1
CRITERION_SCREE_PLOT  //choose the count visually from a scree plot
};
//--- Linear Discriminant Analysis: supervised dimensionality reduction
//--- that maximizes between-class separation.
class CLDA
{
CPlots plt;
CNumpy np;
protected:
uint m_components;          //number of discriminant components kept
lda_criterion m_criterion;  //rule for choosing m_components when k==0/NULL
matrix projection_matrix;   //learned projection [num_features x m_components]
ulong num_features;         //columns of the training matrix
double m_regparam;          //ridge added to the within-class scatter for stability
vector mean;                //per-column mean used for centering
uint calculate_variance(vector &eigen_values, double threshold=0.95);
uint calculate_kaiser(vector &eigen_values);
//--- fixed: the declaration was class-qualified ("CLDA::") inside the
//--- class body, which is invalid/redundant
uint extract_components(vector &eigen_values, double threshold=0.95);
public:
CLDA(uint k=NULL, lda_criterion CRITERION_=CRITERION_SCREE_PLOT, double reg_param =1e-6);
~CLDA(void);
//--- learns the projection from (x, y) and returns the projected data
matrix fit_transform(const matrix &x, const vector &y);
matrix transform(const matrix &x);
vector transform(const vector &x);
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CLDA::CLDA(uint k=NULL, lda_criterion CRITERION_=CRITERION_SCREE_PLOT, double reg_param=1e-6)
{
//--- k==NULL(0) defers component selection to the chosen criterion
this.m_components = k;
this.m_criterion = CRITERION_;
this.m_regparam = reg_param;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- nothing to release: members clean themselves up
CLDA::~CLDA(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- NOTE(review): damaged during extraction — the scatter-matrix /
//--- eigen-decomposition body of fit_transform was lost and the span is
//--- fused with the tail of calculate_variance. Kept byte-identical;
//--- restore from the original repository.
matrix CLDA::fit_transform(const matrix &x, const vector &y)
{
vector classes = np.unique(y).unique;
ulong num_classes = classes.Size();
num_features = x.Cols();
//--- center the data around the global mean
this.mean = x.Mean(0);
matrix x_centered = BaseDimRed::subtract(x, this.mean);
matrix class_means(classes.Size(), x.Cols());
class_means.Fill(0.0);
for (ulong i=0; i= threshold);
k = (uint)v.ArgMax() + 1;
return k;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Kaiser criterion: the number of components to keep is the count  |
//| of eigenvalues >= 1. The for-line had been corrupted during      |
//| extraction (text between '<' and '>' stripped) and is restored   |
//| here from the surrounding logic (flag vector + Sum()).           |
//+------------------------------------------------------------------+
uint CLDA::calculate_kaiser(vector &eigen_values)
{
vector v(eigen_values.Size()); v.Fill(0.0);
for (ulong i=0; i<eigen_values.Size(); i++)
v[i] = (eigen_values[i] >= 1); //flag = 1 when the eigenvalue passes Kaiser's bar
//--- number of flags set == number of components to keep
return uint(v.Sum());
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- dispatches to the criterion chosen at construction time
//--- NOTE(review): the CRITERION_SCREE_PLOT branch below was truncated
//--- during extraction; restore from the original repository.
uint CLDA::extract_components(vector &eigen_values, double threshold=0.95)
{
uint k = 0;
switch(m_criterion)
{
case CRITERION_VARIANCE:
k = calculate_variance(eigen_values, threshold);
break;
case CRITERION_KAISER:
k = calculate_kaiser(eigen_values);
break;
case CRITERION_SCREE_PLOT:
{
vector v_cols(eigen_values.Size());
for (ulong i=0; i
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Non-negative Matrix Factorization: X ≈ W * H with W, H >= 0
class CNMF
{
protected:
CNumpy np;
uint m_components;  //number of latent components k
uint m_max_iter;    //maximum multiplicative-update iterations
int m_randseed;     //seed for the random initialization (-1 = random)
ulong n_features;   //columns of the fitted matrix
matrix W; //Basic matrix
matrix H; //coefficient matrix
double m_tol; //loss tolerance
public:
CNMF(uint max_iter=100, double tol=1e-4, int random_state=-1);
~CNMF(void);
//--- fits W and H to X and returns the transformed data
matrix fit_transform(matrix &X, uint k=2);
matrix transform(matrix &X);
vector transform(vector &X);
//--- heuristic for picking k from the data
uint select_best_components(matrix &X);
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CNMF::CNMF(uint max_iter=100, double tol=1e-4,int random_state=-1)
{
//--- optimization settings; the number of components is chosen at fit time
this.m_max_iter = max_iter;
this.m_tol = tol;
this.m_randseed = random_state;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- nothing to release: members clean themselves up
CNMF::~CNMF(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Projects new data onto the fitted coefficient matrix H.
matrix CNMF::transform(matrix &X)
{
//--- remember the input width and clamp k to it when necessary
n_features = X.Cols();
if (m_components > n_features)
{
printf("%s Number of dimensions K[%d] is supposed to be <= number of features %d",__FUNCTION__,m_components,n_features);
this.m_components = (uint)n_features;
}
//--- a model that was never fitted has empty factor matrices
bool fitted = (this.W.Rows()!=0 && this.H.Rows()!=0);
if (!fitted)
{
Print(__FUNCTION__," Model not fitted. Call fit method first.");
matrix empty={};
return empty;
}
//--- project the samples: X [m x n] times H' [n x k]
return X.MatMul(this.H.Transpose());
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Single-sample overload: lift to a 1-row matrix, project, flatten.
vector CNMF::transform(vector &X)
{
matrix input_row = np.expand_dims(X, 0);
matrix projected = transform(input_row);
return np.flatten(projected);
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- NOTE(review): truncated during extraction — the multiplicative-update
//--- loop body was lost. Kept byte-identical; restore from the repo.
matrix CNMF::fit_transform(matrix &X, uint k=2)
{
ulong m = X.Rows(), n = X.Cols();
//--- NOTE(review): DBL_MIN here looks suspicious for a "best norm"
//--- tracker — confirm against the original whether -DBL_MAX/DBL_MAX
//--- was intended.
double best_frobenius_norm = DBL_MIN;
m_components = m_components == 0 ? (uint)n : k;
//--- Initialize Random values
np.random.seed(this.m_randseed);
this.W = np.random.randn((uint)m, this.m_components);
this.H = np.random.randn(this.m_components, (uint)n);
//--- Update factors
vector loss(this.m_max_iter);
for (uint i=0; i
#include
//+------------------------------------------------------------------+
//| Principal Component Analysis Class |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Principal Component Analysis: unsupervised projection onto the   |
//| directions of maximum variance.                                  |
//+------------------------------------------------------------------+
class CPCA
{
enum criterion //rule used to pick the number of components when k==0
{
CRITERION_VARIANCE,
CRITERION_KAISER,
CRITERION_SCREE_PLOT
};
CPlots plt;
CNumpy np;
protected:
uint m_components;        //number of principal components kept
criterion m_criterion;    //selection rule used when m_components==0
matrix components_matrix; //learned projection matrix
vector mean;              //per-column mean used for centering
uint n_features;          //columns of the fitted matrix
uint extract_components(vector &eigen_values, double threshold=0.95);
public:
CPCA(int k=0, criterion CRITERION_=CRITERION_SCREE_PLOT);
~CPCA(void);
matrix fit_transform(matrix &X);
matrix transform(matrix &X);
vector transform(vector &X);
//--- persistence: CSV files written/read under the given directory
bool save(string dir);
bool load(string dir);
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CPCA::CPCA(int k=0, criterion CRITERION_=CRITERION_SCREE_PLOT)
{
//--- k==0 defers component selection to the chosen criterion
this.m_components = k;
this.m_criterion = CRITERION_;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- nothing to release: members clean themselves up
CPCA::~CPCA(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Learns the PCA projection from X and returns the PCA scores.     |
//| Fixes: removed a leftover debug Print(__LINE__), fixed the       |
//| "caculate" typo in the error message, used a uint cast for the   |
//| uint member, and dropped dead commented-out code.                |
//+------------------------------------------------------------------+
matrix CPCA::fit_transform(matrix &X)
{
n_features = (uint)X.Cols();
//--- k can never exceed the number of features: clamp and warn
if (m_components>n_features)
{
printf("%s Number of dimensions K[%d] is supposed to be <= number of features %d",__FUNCTION__,m_components,n_features);
this.m_components = (uint)n_features; //was (int): keep the cast consistent with the uint member
}
//--- center the data around the per-column mean
this.mean = X.Mean(0);
matrix X_centered = BaseDimRed::subtract(X, this.mean);
BaseDimRed::ReplaceNaN(X_centered);
matrix cov_matrix = cova(X_centered, false);
matrix eigen_vectors;
vector eigen_values;
BaseDimRed::ReplaceNaN(cov_matrix);
if (!cov_matrix.Eig(eigen_vectors, eigen_values))
printf("Failed to calculate Eigen matrix and vectors Err=%d",GetLastError());
//--- Sort eigenvectors by decreasing eigenvalues
vector args = np.argsort(eigen_values);
args = np.reverse(args);
eigen_values = BaseDimRed::Sort(eigen_values, args);
eigen_vectors = BaseDimRed::Sort(eigen_vectors, args);
//---
if (MQLInfoInteger(MQL_DEBUG))
Print("Eigen values: ",eigen_values);
//--- choose k automatically when the user left it at zero; otherwise the
//--- criterion is still evaluated (for its side effects, e.g. the plot)
if (m_components==0)
m_components = this.extract_components(eigen_values);
else
this.extract_components(eigen_values);
if (MQLInfoInteger(MQL_DEBUG))
printf("%s Selected components %d",__FUNCTION__,m_components);
this.components_matrix = BaseDimRed::Slice(eigen_vectors, m_components, 1); //Get the components matrix
this.components_matrix = this.components_matrix.Transpose();
if (MQLInfoInteger(MQL_DEBUG))
Print("components_matrix\n",components_matrix);
//---
return X_centered.MatMul(components_matrix.Transpose()); //return the pca scores
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Projects new data using the projection learned by fit_transform. |
//| Fix: on a column-count mismatch the old code overwrote           |
//| m_components (corrupting the model) and then proceeded with a    |
//| shape-incompatible MatMul; now it warns and returns an empty     |
//| matrix so the caller can detect the failure.                     |
//+------------------------------------------------------------------+
matrix CPCA::transform(matrix &X)
{
if (X.Cols()!=this.n_features)
{
printf("%s Inconsistent input X matrix size, It is supposed to be of size %d same as the matrix used under fit_transform",__FUNCTION__,n_features);
matrix empty = {};
return empty;
}
matrix X_centered = BaseDimRed::subtract(X, this.mean);
return X_centered.MatMul(this.components_matrix.Transpose()); //return the pca scores
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Single-sample overload: wrap into a 1-row matrix, project, unwrap.
vector CPCA::transform(vector &X)
{
matrix input_row = np.expand_dims(X, 0);
matrix scores = transform(input_row);
return np.flatten(scores);
}
//+------------------------------------------------------------------+
//| Select the number of components based on some criterion |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Select the number of components based on some criterion          |
//+------------------------------------------------------------------+
//--- NOTE(review): the three for-lines below were corrupted during
//--- extraction (text between '<' and '>' stripped). Kept byte-identical;
//--- restore from the original repository.
uint CPCA::extract_components(vector &eigen_values, double threshold=0.95)
{
uint k = 0;
//--- variance explained per component (proportional to squared eigenvalues)
vector eigen_pow = MathPow(eigen_values, 2);
vector cum_sum = eigen_pow.CumSum();
double sum = eigen_pow.Sum();
switch(m_criterion)
{
case CRITERION_VARIANCE:
{
//--- keep the smallest k whose cumulative variance reaches the threshold
vector cumulative_variance = cum_sum / sum;
if (MQLInfoInteger(MQL_DEBUG))
Print("Cummulative variance: ",cumulative_variance);
vector v(cumulative_variance.Size()); v.Fill(0.0);
for (ulong i=0; i= threshold);
k = (uint)v.ArgMax() + 1;
}
break;
case CRITERION_KAISER:
{
//--- keep components with eigenvalue >= 1
vector v(eigen_values.Size()); v.Fill(0.0);
for (ulong i=0; i= 1);
k = uint(v.Sum());
}
break;
case CRITERION_SCREE_PLOT:
{
vector v_cols(eigen_values.Size());
for (ulong i=0; i= 1);
k = uint(v.Sum());
}
break;
}
return (k);
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Persists the fitted model (mean vector + components matrix) as CSV.
bool CPCA::save(string dir)
{
//--- the centering vector is stored as a 1-column matrix
matrix m = CUtils::VectorToMatrix(this.mean, this.mean.Size());
bool mean_saved = CUtils::WriteCsv(dir+"\\PCA-Mean.csv",m,NULL,false,8);
if (!mean_saved)
{
Print("Failed to Save PCA-Mean information to ",dir);
return false;
}
//--- the projection matrix
bool components_saved = CUtils::WriteCsv(dir+"\\PCA-ComponentsMatrix.csv",this.components_matrix,NULL,false,8);
if (!components_saved)
{
Print("Failed to Save PCA-ComponentsMatrix information to ",dir);
return false;
}
return true;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Restores a model previously written by save(); returns false when
//--- either CSV file cannot be read.
bool CPCA::load(string dir)
{
string header;
//--- restore the centering vector; an empty matrix signals a read failure
matrix mean_mat = CUtils::ReadCsv(dir+"\\PCA-Mean.csv",header);
if (mean_mat.Rows()==0)
return false;
this.mean = CUtils::MatrixToVector(mean_mat);
this.n_features = (uint)this.mean.Size();
//--- restore the projection matrix
this.components_matrix = CUtils::ReadCsv(dir+"\\PCA-ComponentsMatrix.csv",header);
return (components_matrix.Rows()!=0);
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Computes the sample covariance matrix of `data`.                 |
//| row_var=true means each row is a variable (so the data is        |
//| transposed first). Fix: the old code transposed `data` IN PLACE, |
//| silently mutating the caller's matrix; we now work on a local    |
//| copy so the argument is left untouched.                          |
//+------------------------------------------------------------------+
matrix cova(matrix &data, bool row_var=true)
{
//--- local working copy — never modify the caller's matrix
matrix d = row_var ? data.Transpose() : data;
//--- Step 1: Center the data
matrix centered_data = BaseDimRed::subtract(d, d.Mean(0));
//--- Step 2: Calculate the covariance matrix (unbiased, divide by n-1)
matrix covariance_matrix = centered_data.Transpose().MatMul(centered_data) / (d.Rows() - 1);
return covariance_matrix;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
================================================
FILE: Sklearn/Decomposition/README.md
================================================
## Linear Discriminant Analysis (LDA)
This documentation explains the `CLDA` class in MQL5, which implements **Linear Discriminant Analysis (LDA)** for dimensionality reduction and classification tasks.
**I. LDA Theory:**
LDA is a supervised learning technique that aims to find **linear projections** of the data that **maximize the separation between different classes** while **minimizing variance within each class**. This makes it particularly useful for **classification** problems where the goal is to distinguish between distinct groups.
**II. CLDA Class:**
The `CLDA` class provides functionalities for performing LDA in MQL5:
**Public Functions:**
* `CLDA(uint k=NULL, lda_criterion CRITERION_=CRITERION_SCREE_PLOT, double reg_param =1e-6)` Constructor, allows setting hyperparameters:
* `k`: Number of components to extract (default: None, determined automatically).
* `CRITERION_`: Criterion for selecting the best components (default: CRITERION_SCREE_PLOT).
* `reg_param`: Regularization parameter to prevent overfitting (default: 1e-6).
* `~CLDA(void)`: Destructor.
* `matrix fit_transform(const matrix &x, const vector &y):` Trains the model on the provided data (`x` - independent variables, `y` - class labels) and returns the transformed data.
* `matrix transform(const matrix &x):` Transforms new data (`x`) using the trained model.
* `vector transform(const vector &x):` Transforms a single new data point (`x`) using the trained model.
**Internal Functions:**
* `calculate_variance(vector &eigen_values, double threshold=0.95)`: Calculates the number of components based on explained variance (optional).
* `calculate_kaiser(vector &eigen_values)`: Calculates the number of components based on Kaiser's criterion (optional).
* `extract_components(vector &eigen_values, double threshold=0.95)`: Extracts the selected number of components based on the chosen criterion.
**III. Additional Notes:**
* The `m_criterion` member variable allows choosing the criterion for selecting the number of components:
* **CRITERION_VARIANCE:** Retains components that explain a specific percentage of variance (set by `threshold`).
* **CRITERION_KAISER:** Retains components with eigenvalues greater than 1.
* **CRITERION_SCREE_PLOT:** Analyzes the scree plot to visually determine the number of components with significant eigenvalues.
* The `m_regparam` member variable allows for regularization to prevent overfitting.
* The class internally uses the `CPlots` class (not documented here) for potential visualization purposes (e.g., scree plot).
## Principal Component Analysis (PCA)
This documentation explains the `CPCA` class in MQL5, which implements **Principal Component Analysis (PCA)** for dimensionality reduction and data visualization tasks.
**I. PCA Theory:**
PCA is an unsupervised learning technique that aims to find a **linear transformation** of the data that captures the most **variance** in a **reduced number of dimensions**. This allows for:
* **Dimensionality reduction:** Reduce the number of features while retaining most of the information in the data.
* **Data visualization:** Project high-dimensional data onto a lower-dimensional space for easier visualization.
**II. CPCA Class:**
The `CPCA` class provides functionalities for performing PCA in MQL5:
**Public Functions:**
* `CPCA(int k=0, criterion CRITERION_=CRITERION_SCREE_PLOT)` Constructor, allows setting hyperparameters:
* `k`: Number of components to extract (default: 0, determined automatically using the chosen criterion).
* `CRITERION_`: Criterion for selecting the best components (default: CRITERION_SCREE_PLOT).
* `~CPCA(void)` Destructor.
* `matrix fit_transform(matrix &X)` Trains the model on the provided data (`X`) and returns the transformed data.
* `matrix transform(matrix &X)` Transforms new data (`X`) using the trained model.
* `vector transform(vector &X)` Transforms a single new data point (`X`) using the trained model.
* `bool save(string dir)` Saves the model parameters to a specified directory (`dir`).
* `bool load(string dir)` Loads the model parameters from a specified directory (`dir`).
**Internal Functions:**
* `extract_components(vector &eigen_values, double threshold=0.95)`: Extracts the selected number of components based on the chosen criterion (similar to the `CLDA` class).
**III. Additional Notes:**
* The `m_criterion` member variable allows choosing the criterion for selecting the number of components (same options as in `CLDA`).
* The class internally uses the `CPlots` class (not documented here) for potential visualization purposes.
* Saving and loading functionalities allow for model persistence and reusability.
## Non-Negative Matrix Factorization (NMF)
This documentation explains the `CNMF` class in MQL5, which implements **Non-Negative Matrix Factorization (NMF)** for data decomposition and feature extraction tasks.
**I. NMF Theory:**
NMF is a dimensionality reduction technique that decomposes a **non-negative matrix** `V` into two **non-negative matrices** `W` and `H`:
* `V` (shape: `m x n`): The input data matrix, where `m` is the number of data points and `n` is the number of features.
* `W` (shape: `m x k`): The **basis matrix**, where `k` is the number of chosen components and each row represents a **basis vector**.
* `H` (shape: `k x n`): The **coefficient matrix**, where each row corresponds to a basis vector and each element represents the **contribution** of that basis vector to a specific feature in the original data.
By finding a suitable factorization, NMF aims to represent the original data as a **linear combination** of basis vectors while preserving the non-negative nature of the input data. This allows for:
* **Dimensionality reduction:** Reduce the number of features while still capturing essential information.
* **Feature extraction:** Identify underlying factors or patterns in the data through the basis vectors.
* **Data interpretation:** Gain insights into the data by analyzing the non-negative contributions of basis vectors to each feature.
**II. CNMF Class:**
The `CNMF` class provides functionalities for performing NMF:
**Public Functions:**
* `CNMF(uint max_iter=100, double tol=1e-4, int random_state=-1)` Constructor, allows setting hyperparameters:
* `max_iter`: Maximum number of iterations for the NMF algorithm (default: 100).
* `tol`: Tolerance for convergence (default: 1e-4).
* `random_state`: Random seed for initialization (default: -1, uses random seed).
* `~CNMF(void)` Destructor.
* `matrix fit_transform(matrix &X, uint k=2)` Trains the model on the provided data (`X`) and returns the decomposed components (`W` and `H`).
* `k`: Number of components to extract (default: 2).
* `matrix transform(matrix &X)` Transforms new data (`X`) using the trained model.
* `vector transform(vector &X)` Transforms a single new data point (`X`) using the trained model.
* `uint select_best_components(matrix &X)` Analyzes the input data and suggests an appropriate number of components (implementation details might vary depending on the specific NMF algorithm used).
**III. Additional Notes:**
* The internal implementation details of the NMF algorithm might vary depending on the specific chosen library or technique.
* Choosing the appropriate number of components is crucial for optimal performance and avoiding overfitting. The `select_best_components` function is helpful as a starting point, but further evaluation and domain knowledge might be needed for optimal selection.
By understanding the theoretical foundation and functionalities of the `CNMF` class, MQL5 users can leverage NMF for various tasks, including:
* Dimensionality reduction for data visualization or machine learning algorithms that require lower-dimensional inputs.
* Feature extraction to identify underlying structure or patterns in non-negative data.
* Topic modeling for analyzing text data or other types of document collections.
## Truncated Singular Value Decomposition (Truncated SVD)
This documentation explains the `CTruncatedSVD` class in MQL5, which implements **Truncated Singular Value Decomposition (Truncated SVD)** for dimensionality reduction and data visualization tasks.
**I. Truncated SVD Theory:**
Truncated SVD is a dimensionality reduction technique based on **Singular Value Decomposition (SVD)**. SVD decomposes a matrix `X` into three matrices:
* `U`: A left singular vectors matrix.
* `Σ`: A diagonal matrix containing the singular values of `X`.
* `V^T`: A right singular vectors matrix (transposed).
Truncated SVD retains only **k** top singular values from `Σ` and their corresponding columns from `U` and `V^T`. This creates a lower-dimensional representation of the original data that captures most of the variance.
**II. CTruncatedSVD Class:**
The `CTruncatedSVD` class provides functionalities for performing Truncated SVD in MQL5:
**Public Functions:**
* `CTruncatedSVD(uint k=0):` Constructor, allows setting the number of components (`k`) to retain (default: 0, determined automatically).
* `~CTruncatedSVD(void):` Destructor.
* `matrix fit_transform(matrix& X):` Trains the model on the provided data (`X`) and returns the transformed data.
* `matrix transform(matrix &X):` Transforms new data (`X`) using the trained model.
* `vector transform(vector &X):` Transforms a single new data point (`X`) using the trained model.
* `ulong _select_n_components(vector &singular_values):` (Internal function, not directly exposed to users) Determines the number of components based on the explained variance ratio (implementation details may vary).
**III. Additional Notes:**
* The class internally uses the `CPlots` class (not documented here) for potential visualization purposes.
* Choosing the appropriate number of components (`k`) is crucial for balancing dimensionality reduction and information preservation. The `_select_n_components` function might use different criteria (e.g., explained variance ratio) for automatic selection, and user discretion might be needed depending on the specific task.
By understanding the theoretical foundation and functionalities of the `CTruncatedSVD` class, MQL5 users can leverage Truncated SVD for:
* **Dimensionality reduction:** Reduce the number of features while retaining most of the information.
* **Data visualization:** Project high-dimensional data onto a lower-dimensional space for easier visualization.
* **Feature extraction:** Identify underlying factors or patterns in the data through the singular vectors (although not explicitly mentioned in the class functionalities).
It's important to note that the specific implementation details of the `CTruncatedSVD` class and the `_select_n_components` function might vary depending on the chosen MQL5 library or framework. Refer to the specific documentation of your chosen library for the most accurate and up-to-date information.
**Reference:**
* [Data Science and Machine Learning (Part 18): The battle of Mastering Market Complexity, Truncated SVD Versus NMF](https://www.mql5.com/en/articles/13968)
* [Data Science and Machine Learning(Part 20) : Algorithmic Trading Insights, A Faceoff Between LDA and PCA in MQL5](https://www.mql5.com/en/articles/14128)
================================================
FILE: Sklearn/Decomposition/TruncatedSVD.mqh
================================================
//+------------------------------------------------------------------+
//| CTruncatedSVD.mqh |
//| Copyright 2023, Omega Joctan |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2023, Omega Joctan"
#property link "https://www.mql5.com/en/users/omegajoctan"
//+------------------------------------------------------------------+
//| defines |
//+------------------------------------------------------------------+
#include "base.mqh"
#include
//--- Truncated Singular Value Decomposition: keeps only the top-k
//--- singular directions of the (centered) data.
class CTruncatedSVD
{
CPlots plt;
uint m_components;          //number of singular components kept
ulong n_features;           //columns of the fitted matrix
matrix components_;         //projection matrix (top-k right singular vectors)
vector mean;                //per-column mean used for centering
vector explained_variance_; //variance explained by each kept component
public:
CTruncatedSVD(uint k=0);
~CTruncatedSVD(void);
matrix fit_transform(matrix& X);
matrix transform(matrix &X);
vector transform(vector &X);
//--- picks k from the explained-variance ratio when k was left at 0
ulong _select_n_components(vector &singular_values);
};
//+------------------------------------------------------------------+
//| Once the k value is left to default value of zero, the function |
//| _select_n_components will be used to find the best number of |
//| components to use |
//+------------------------------------------------------------------+
CTruncatedSVD::CTruncatedSVD(uint k=0)
{
//--- k==0 means "choose automatically" via _select_n_components
this.m_components = k;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- nothing to release: members clean themselves up
CTruncatedSVD::~CTruncatedSVD(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Learns the truncated-SVD projection from X and returns the scores.
//--- Kept byte-identical (the error print embeds __LINE__, so any
//--- restructuring would change its runtime output).
matrix CTruncatedSVD::fit_transform(matrix &X)
{
n_features = X.Cols();
//--- k can never exceed the number of features: clamp and warn
if (m_components>n_features)
{
printf("%s Number of dimensions K[%d] is supposed to be <= number of features %d",__FUNCTION__,m_components,n_features);
this.m_components = (uint)n_features;
}
//--- Center the data (subtract mean)
this.mean = X.Mean(0);
matrix X_centered = BaseDimRed::subtract(X, this.mean);
//--- Compute the covariance matrix
BaseDimRed::ReplaceNaN(X_centered);
matrix cov_matrix = X_centered.Cov(false);
//--- Perform SVD on the covariance matrix
matrix U={}, Vt={};
vector Sigma={};
BaseDimRed::ReplaceNaN(cov_matrix);
if (!cov_matrix.SVD(U,Vt,Sigma))
Print(__FUNCTION__," Line ",__LINE__," Failed to calculate SVD Err=",GetLastError());
//--- k==0: derive the component count from the singular values
if (m_components == 0)
{
m_components = (uint)this._select_n_components(Sigma);
Print(__FUNCTION__," Best value of K = ",m_components);
}
//--- keep the top-k right singular vectors as the projection
this.components_ = BaseDimRed::Slice(Vt, this.m_components).Transpose();
BaseDimRed::ReplaceNaN(this.components_);
if (MQLInfoInteger(MQL_DEBUG))
Print("components_T[",components_.Rows(),"X",components_.Cols(),"]\n",this.components_);
//--- per-component explained variance from the kept singular values
this.explained_variance_ = MathPow(BaseDimRed::Slice(Sigma, this.m_components), 2) / (X.Rows() - 1);
return X_centered.MatMul(components_);
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Projects new data using the projection learned by fit_transform. |
//| Fixes: validate the column count BEFORE doing any work, and on a |
//| mismatch return an empty matrix instead of overwriting           |
//| m_components (which corrupted the model) and proceeding with a   |
//| shape-incompatible MatMul.                                       |
//+------------------------------------------------------------------+
matrix CTruncatedSVD::transform(matrix &X)
{
if (X.Cols()!=this.n_features)
{
printf("%s Inconsistent input X matrix size, It is supposed to be of size %d same as the matrix used under fit_transform",__FUNCTION__,n_features);
matrix empty = {};
return empty;
}
matrix X_centered = BaseDimRed::subtract(X, this.mean);
return X_centered.MatMul(components_);
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- Single-sample overload: 1-row matrix in, flattened scores out.
vector CTruncatedSVD::transform(vector &X)
{
matrix input_row = MatrixExtend::VectorToMatrix(X, X.Size());
matrix scores = transform(input_row);
return MatrixExtend::MatrixToVector(scores);
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- NOTE(review): truncated during extraction — the selection loop and
//--- return were lost. Kept byte-identical; restore from the repo.
ulong CTruncatedSVD::_select_n_components(vector &singular_values)
{
//--- NOTE(review): MathPow(Sum(), 2) is the square of the sum; for an
//--- explained-variance ratio the denominator is usually the SUM of
//--- squares (MathPow(singular_values, 2).Sum()) — confirm against the
//--- original repository before relying on this ratio.
double total_variance = MathPow(singular_values.Sum(), 2);
vector explained_variance_ratio = MathPow(singular_values, 2).CumSum() / total_variance;
if (MQLInfoInteger(MQL_DEBUG))
Print(__FUNCTION__," Explained variance ratio ",explained_variance_ratio);
vector k(explained_variance_ratio.Size());
for (uint i=0; i
//--- shared static helpers for the decomposition classes (PCA/LDA/SVD)
class BaseDimRed
{
public:
BaseDimRed(void);
~BaseDimRed(void);
//--- first `from_0_to` rows (axis=0) or columns (axis=1) of mat
static matrix Slice(const matrix &mat, uint from_0_to, int axis=0);
static vector Slice(const vector &v, uint from_0_to);
//--- subtracts a row vector from every row of mat (mean-centering)
static matrix subtract(const matrix&mat, const vector &v);
static void ReplaceNaN(matrix &mat);
//--- reorders rows/elements according to the index vector args
static matrix Sort(matrix &mat, vector &args);
static vector Sort(vector &v, vector &args);
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//--- NOTE(review): truncated during extraction — the copy loop and the
//--- axis=1 branch were lost. Kept byte-identical; restore from the repo.
matrix BaseDimRed::Slice(const matrix &mat, uint from_0_to, int axis=0)
{
matrix ret = {};
//--- a zero-length slice is rejected; the input is returned unchanged
if (from_0_to==0)
{
printf("%s Cannot slice a vector from index 0 to 0",__FUNCTION__);
return mat;
}
switch(axis)
{
case 0:
ret.Resize(from_0_to, mat.Cols());
for (uint i=0; i
#include
//+------------------------------------------------------------------+
//| Model class |
//+------------------------------------------------------------------+
#include
#include
//+------------------------------------------------------------------+
//| AdaBoost class for Decision Tree |
//+------------------------------------------------------------------+
namespace DecisionTree
{
//+------------------------------------------------------------------+
//| AdaBoost ensemble built on decision-tree weak learners: each     |
//| boosting round fits a tree and stores its alpha (voting weight). |
//+------------------------------------------------------------------+
class AdaBoost
{
protected:
vector m_alphas; //voting weight of each weak learner
vector classes_in_data; //unique class labels seen during fit
int m_random_state; //seed for the weighted resampling
bool m_boostrapping; //whether to resample the data each round
uint m_min_split, m_max_depth; //hyper-parameters forwarded to every tree
CDecisionTreeClassifier *weak_learners[]; //store weak_learner pointers for memory allocation tracking
CDecisionTreeClassifier *weak_learner; //learner currently being fitted
uint m_estimators; //number of boosting rounds
public:
AdaBoost(uint min_split, uint max_split, uint n_estimators=50, int random_state=42, bool bootstrapping=true);
~AdaBoost(void);
void fit(matrix &x, vector &y); //train m_estimators weak learners
int predict(vector &x); //weighted-vote prediction for one sample
vector predict(matrix &x); //predictions for every row of x
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Stores the boosting hyper-parameters and pre-allocates one slot  |
//| per boosting round in the weak-learner container.                |
//+------------------------------------------------------------------+
AdaBoost::AdaBoost(uint min_split, uint max_split, uint n_estimators=50, int random_state=42, bool bootstrapping=true)
 {
   this.m_estimators   = n_estimators;
   this.m_random_state = random_state;
   this.m_boostrapping = bootstrapping;
   this.m_min_split    = min_split;
   this.m_max_depth    = max_split;
   ArrayResize(this.weak_learners, this.m_estimators); //one pointer slot per estimator
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
AdaBoost::~AdaBoost(void)
{
for (uint i=0; i
#include
//+------------------------------------------------------------------+
//| Error metrics available when evaluating classifier forests.      |
//+------------------------------------------------------------------+
enum errors_classifier
{
ERR_ACCURACY //fraction of correctly classified samples
};
//+------------------------------------------------------------------+
//| Random forest classifier: an ensemble of decision trees fitted   |
//| on (bootstrapped) subsets of the data whose predictions are      |
//| combined into a single class vote.                               |
//+------------------------------------------------------------------+
class CRandomForestClassifier
{
protected:
uint m_ntrees; //number of trees in the forest
uint m_maxdepth; //maximum depth of each tree
uint m_minsplit; //minimum samples required to split a node
int m_random_state; //seed for sampling (-1 = non-deterministic)
CDecisionTreeClassifier *forest[]; //the fitted trees
string ConvertTime(double seconds); //formats a duration for progress logs
double err_metric(errors_classifier err, vector &actual, vector &preds); //evaluation metric reported during fit
public:
CRandomForestClassifier(uint n_trees=100, uint minsplit=NULL, uint max_depth=NULL, int random_state=-1);
~CRandomForestClassifier(void);
void fit(matrix &x, vector &y, bool replace=true, errors_classifier err=ERR_ACCURACY); //train the forest; replace = sample with replacement
double predict(vector &x); //predicted class for a single sample
vector predict(matrix &x); //predicted classes for every row of x
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Records the forest hyper-parameters and reserves one array slot  |
//| per tree.                                                        |
//+------------------------------------------------------------------+
CRandomForestClassifier::CRandomForestClassifier(uint n_trees=100, uint minsplit=NULL, uint max_depth=NULL, int random_state=-1)
 {
   this.m_ntrees       = n_trees;
   this.m_maxdepth     = max_depth;
   this.m_minsplit     = minsplit;
   this.m_random_state = random_state;
   ArrayResize(this.forest, n_trees); //pointers are filled in by fit
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CRandomForestClassifier::~CRandomForestClassifier(void)
{
for (uint i=0; i Tree <%d> Rand Seed <%s> Accuracy Score: %.3f Time taken: %s",i+1,m_random_state==-1?"None":string(m_random_state),this.err_metric(err, y_subset, preds), ConvertTime((current_time - time_start) / 1000.0));
}
m_ntrees = ArraySize(forest); //The successfully build trees
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
double CRandomForestClassifier::predict(vector &x)
{
vector predictions(m_ntrees); //predictions from all the trees
for (uint i=0; i= 60)
{
minutes = (uint)(seconds / 60.0) ;
seconds = fmod(seconds, 1.0) * 60;
time_str = StringFormat("%d Minutes and %.3f Seconds", minutes, seconds);
}
if (minutes >= 60)
{
hours = (uint)(minutes / 60.0);
minutes = minutes % 60;
time_str = StringFormat("%d Hours and %d Minutes", hours, minutes);
}
if (time_str == "")
{
time_str = StringFormat("%.3f Seconds", seconds);
}
return time_str;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Maps the requested metric to a score. Accuracy is currently the  |
//| only metric defined for the classifier forest, so every value of |
//| err resolves to accuracy_score.                                  |
//+------------------------------------------------------------------+
double CRandomForestClassifier::err_metric(errors_classifier err, vector &actual, vector &preds)
 {
   switch(err)
    {
     case ERR_ACCURACY:
     default:
        return Metrics::accuracy_score(actual, preds);
    }
 }
//+------------------------------------------------------------------+
//| |
//| |
//| |
//| |
//| Random Forest for regression problems |
//| |
//| |
//| |
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Error metrics available when evaluating regressor forests.       |
//+------------------------------------------------------------------+
enum errors_regressor
{
ERR_R2_SCORE, //coefficient of determination (R^2)
ERR_ADJUSTED_R //adjusted R^2, penalizes additional regressors
};
//+------------------------------------------------------------------+
//| Random forest regressor: an ensemble of regression trees fitted  |
//| on (bootstrapped) subsets of the data whose outputs are combined |
//| into a single continuous prediction.                             |
//+------------------------------------------------------------------+
class CRandomForestRegressor
{
private:
uint m_ntrees; //number of trees in the forest
uint m_maxdepth; //maximum depth of each tree
uint m_minsplit; //minimum samples required to split a node
int m_random_state; //seed for sampling (-1 = non-deterministic)
CDecisionTreeRegressor *forest[]; //the fitted trees
string ConvertTime(double seconds); //formats a duration for progress logs
double err_metric(errors_regressor err,vector &actual,vector &preds); //evaluation metric reported during fit
public:
CRandomForestRegressor(uint n_trees=100, uint minsplit=NULL, uint max_depth=NULL, int random_state=-1);
~CRandomForestRegressor(void);
void fit(matrix &x, vector &y, bool replace=true, errors_regressor err=ERR_R2_SCORE); //train the forest; replace = sample with replacement
double predict(vector &x); //predicted value for a single sample
vector predict(matrix &x); //predicted values for every row of x
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Records the forest hyper-parameters and reserves one array slot  |
//| per tree.                                                        |
//+------------------------------------------------------------------+
CRandomForestRegressor::CRandomForestRegressor(uint n_trees=100, uint minsplit=NULL, uint max_depth=NULL, int random_state=-1)
 {
   this.m_ntrees       = n_trees;
   this.m_maxdepth     = max_depth;
   this.m_minsplit     = minsplit;
   this.m_random_state = random_state;
   ArrayResize(this.forest, n_trees); //pointers are filled in by fit
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
CRandomForestRegressor::~CRandomForestRegressor(void)
{
for (uint i=0; i= 60)
{
minutes = (uint)(seconds / 60.0) ;
seconds = fmod(seconds, 1.0) * 60;
time_str = StringFormat("%d Minutes and %.3f Seconds", minutes, seconds);
}
if (minutes >= 60)
{
hours = (uint)(minutes / 60.0);
minutes = minutes % 60;
time_str = StringFormat("%d Hours and %d Minutes", hours, minutes);
}
if (time_str == "")
{
time_str = StringFormat("%.3f Seconds", seconds);
}
return time_str;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
void CRandomForestRegressor::fit(matrix &x, vector &y, bool replace=true, errors_regressor err=ERR_R2_SCORE)
{
matrix x_subset;
vector y_subset;
matrix data = MatrixExtend::concatenate(x, y, 1);
matrix temp_data = data;
vector preds;
datetime time_start = GetTickCount(), current_time;
Print("[ Regressor Random Forest Building ]");
for (uint i=0; i Tree <%d> Rand Seed <%s> R_2 Score: %.3f Time taken: %s",i+1,m_random_state==-1?"None":string(m_random_state),this.err_metric(err, y_subset, preds), ConvertTime((current_time - time_start) / 1000.0));
}
m_ntrees = ArraySize(forest); //The successfully build trees
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
double CRandomForestRegressor::predict(vector &x)
{
vector predictions(m_ntrees); //predictions from all the trees
for (uint i=0; i
#include
#include
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Binary logistic-regression model trained with gradient descent. |
//+------------------------------------------------------------------+
class CLogisticRegression
{
private:
CNumpy np; //numpy-style helpers (random init, expand_dims, ...)
vector classes_in_data; //unique class labels seen during fit
bool istrained; //set by fit, guards the predict methods
//--- verifies the model has been trained before a prediction is made
bool checkIsTrained(string func)
{
if(!istrained)
{
Print(func," Model not trained, Call fit function first to train the model"); //fixed: message said "Tree not trained" (copy-paste from the tree class)
return false;
}
return (true);
}
//--- verifies a sample has the same number of features as the training data
//--- NOTE(review): m_features is only set inside fit, so this is meaningful only after training
bool CheckSamplesSize(string func, ulong size)
{
if(size != m_features)
{
printf("%s x sample size doesn't align with the training data m_features %d",func, size);
return false;
}
return true;
}
matrix weights; //model coefficients, one per feature (column matrix)
double bias; //intercept term
//---
uint m_epochs; //gradient-descent passes over the data
double m_alpha; //learning rate
double m_tol; //convergence tolerance on the cost change
ulong m_features; //number of features seen during fit
int m_random_seed; //seed for the random weight initialization
public:
CLogisticRegression(uint epochs=10, double alpha=0.01, double tol=1e-8, int random_seed = 0);
~CLogisticRegression(void);
void fit(matrix &x, vector &y); //train on x (samples x features) and binary labels y
int predict(vector &x); //predicted class (0 or 1) for one sample
vector predict(matrix &x); //predicted classes for every row of x
double predict_proba(vector &x); //probability of the positive class for one sample
vector predict_proba(matrix &x); //probabilities for every row of x
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Stores the gradient-descent hyper-parameters; the model stays    |
//| untrained until fit is called.                                   |
//+------------------------------------------------------------------+
CLogisticRegression::CLogisticRegression(uint epochs=10, double alpha=0.01, double tol=1e-8, int random_seed=0)
 {
   this.istrained     = false;
   this.m_epochs      = epochs;      //number of gradient-descent passes
   this.m_alpha       = alpha;       //learning rate
   this.m_tol         = tol;         //convergence tolerance on the cost change
   this.m_random_seed = random_seed; //seed for the weight initialization
 }
//+------------------------------------------------------------------+
//| This is where the logistic model gets trained |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Trains the model by gradient descent: weights are initialized    |
//| randomly, then updated each epoch until the cost change falls    |
//| below m_tol or m_epochs is reached.                              |
//| NOTE(review): the epoch loop line below appears truncated in     |
//| this extract — the cost/gradient computation is missing here.    |
//+------------------------------------------------------------------+
void CLogisticRegression::fit(matrix &x, vector &y)
{
ulong m = x.Rows(), n = x.Cols();
m_features = n; //remember the feature count for later sample-size checks
np.random.seed(m_random_seed); //deterministic weight init for a fixed seed
vector rand_v = np.random.uniform(-1, 1, (uint)n);
this.weights = np.expand_dims(rand_v, 1); //column matrix of weights
//---
matrix dw; //derivative wrt weights &
double db; //bias respectively
vector preds;
istrained = true; //mark trained so predict can be called after fit
double prev_cost = -DBL_MAX, cost =0;
for(ulong i=0; i Logistic regression build epoch [%d/%d] mse %.5f",i+1,m_epochs, cost);
this.weights -= this.m_alpha * dw; //gradient step on the weights
this.bias -= this.bias * db; //NOTE(review): likely a bug — should presumably be this.m_alpha * db; confirm intent
if(MathAbs(prev_cost - cost) < this.m_tol)
{
Print("Converged!!!");
break;
}
prev_cost = cost; //track the cost to detect convergence next epoch
}
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Destructor — no dynamic resources to release.                    |
//+------------------------------------------------------------------+
CLogisticRegression::~CLogisticRegression(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Predicts the binary class (0 or 1) of a single feature vector.   |
//| Returns 0 when the model is untrained or the input size is wrong.|
//+------------------------------------------------------------------+
int CLogisticRegression::predict(vector &x)
{
if(!checkIsTrained(__FUNCTION__))
return 0;
if(!CheckSamplesSize(__FUNCTION__,x.Size()))
return 0;
matrix x_mat = np.expand_dims(x, 1); //reshape the sample so it can be multiplied with the weights matrix
matrix preds = (x_mat.MatMul(this.weights) + this.bias); //linear score: x*w + b
preds.Activation(preds, AF_HARD_SIGMOID); //NOTE(review): hard sigmoid used here — confirm training used the same activation
if(preds.Rows()>1)
{
printf("%s The outcome from a sigmoid must be a scalar value",__FUNCTION__);
return 0;
}
return (int)(preds[0][0]>=0.5); //threshold the probability at 0.5
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
vector CLogisticRegression::predict(matrix &x)
{
vector v(x.Rows());
for(ulong i=0; i1)
{
printf("%s The outcome from a sigmoid must be a scalar value",__FUNCTION__);
return 0;
}
return preds[0][0];
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
vector CLogisticRegression::predict_proba(matrix &x)
{
vector v(x.Rows());
for(ulong i=0; i
#include
#include "Linear Regression.mqh"
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Ridge (L2-regularized) linear regression solved in closed form.  |
//+------------------------------------------------------------------+
class CRidgeregression
{
protected:
matrix XMatrix; //matrix of independent variables
matrix YMatrix; //target variable as a single-column matrix
vector yVector; // Vector of target variables
matrix Id_matrix; //Identity matrix
matrix Betas; //fitted coefficients
ulong n; //No of samples
ulong k; //No of regressors
public:
CRidgeregression(matrix &_matrix);
~CRidgeregression(void);
double RSS; //residual sum of squares
double Lr_accuracy; //accuracy of the underlying linear regression
vector L2Norm(double lambda); //Ridge regression
};
//+------------------------------------------------------------------+
/*
CRidgeregression::CRidgeregression(matrix &_matrix)
{
n = _matrix.Rows();
k = _matrix.Cols();
MatrixExtend::XandYSplitMatrices(_matrix,XMatrix,yVector);
YMatrix = MatrixExtend::VectorToMatrix(yVector);
//---
Id_matrix.Resize(k,k);
Id_matrix.Identity();
}
*/
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Releases the matrices and vectors held by the model.             |
//+------------------------------------------------------------------+
CRidgeregression::~CRidgeregression(void)
 {
   ZeroMemory(XMatrix);
   ZeroMemory(YMatrix); //fixed: was a duplicated ZeroMemory(yVector); YMatrix was never cleared
   ZeroMemory(yVector);
   ZeroMemory(Id_matrix);
 }
//+------------------------------------------------------------------+
/*
vector CRidgeregression::L2Norm(double lambda)
{
matrix design = MatrixExtend::DesignMatrix(XMatrix);
matrix XT = design.Transpose();
matrix XTX = XT.MatMul(design);
matrix lamdaxI = lambda * Id_matrix;
matrix sum_matrix = XTX + lamdaxI;
matrix Inverse_sum = sum_matrix.Inv();
matrix XTy = XT.MatMul(YMatrix);
Betas = Inverse_sum.MatMul(XTy);
#ifdef DEBUG_MODE
//Print("Betas\n",Betas);
#endif
return(MatrixExtend::MatrixToVector(Betas));
}
//+------------------------------------------------------------------+
*/
================================================
FILE: Sklearn/Naive Bayes/Naive Bayes.mqh
================================================
//+------------------------------------------------------------------+
//| Naive Bayes.mqh |
//| Copyright 2022, Fxalgebra.com |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2022, Fxalgebra.com"
#property link "https://www.mql5.com/en/users/omegajoctan"
//+------------------------------------------------------------------+
//| defines |
//+------------------------------------------------------------------+
#include
//+------------------------------------------------------------------+
//| N A I V E B A Y E S |
//| |
//| suitable for classification of discrete values, that have |
//| been load to a matrix using the method ReadCSVEncode from |
//| CUtils::mqh |
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Naive Bayes classifier for discrete feature values.              |
//+------------------------------------------------------------------+
class CNaiveBayes
{
protected:
uint n_features; //number of feature columns seen during fit
vector y_target; //training labels
vector class_proba; //prior class probability
vector features_proba; //features probability
vector c_prior_proba; //class prior probability
vector c_evidence; //class evidence
vector calcProba(vector &v_features); //per-class probability of a feature vector
public:
vector classes; //classes available
CNaiveBayes(void);
~CNaiveBayes(void);
void fit(matrix &x, vector &y); //estimate the class priors from the data
int predict(vector &x); //most probable class for one sample
vector predict(matrix &x); //predictions for every row of x
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Constructor — all estimation happens in fit.                     |
//+------------------------------------------------------------------+
CNaiveBayes::CNaiveBayes(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Estimates the prior probability of each class from the label     |
//| counts. NOTE(review): the feature-likelihood estimation below is |
//| commented out (and garbled in this extract), so only the class   |
//| priors are computed here — confirm predict relies on them alone. |
//+------------------------------------------------------------------+
void CNaiveBayes::fit(matrix &x, vector &y)
{
ulong samples = x.Rows(),
features = x.Cols();
vector unique = CUtils::Unique_count(y); //per-class sample counts
this.class_proba = unique / samples; //prior = count / total samples
if (MQLInfoInteger(MQL_DEBUG))
Print("class probabilities: ",class_proba);
/*
y_target = y;
n_features = x.Cols();
classes = CUtils::Unique(y);
c_evidence.Resize((ulong)classes.Size());
n = y.Size();
if (n==0) { Print("--> n == 0 | Naive Bayes class failed"); return; }
//---
vector v = {};
for (ulong i=0; i GROUPS ",classes);
Print("Prior Class Proba ",c_prior_proba,"\nEvidence ",c_evidence);
*/
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Destructor — no dynamic resources to release.                    |
//+------------------------------------------------------------------+
CNaiveBayes::~CNaiveBayes(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
int CNaiveBayes::predict(vector &x)
{
vector v = calcProba(x);
double sum = v.Sum();
for (ulong i=0; i n == 0 | Gaussian Naive Bayes class failed"); return; }
//---
vector v = {};
for (ulong i=0; i GROUPS ",classes);
Print("\n---> Prior_proba ",c_prior_proba," Evidence ",c_evidence);
//---
during_training = false;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Destructor — no dynamic resources to release.                    |
//+------------------------------------------------------------------+
CGaussianNaiveBayes::~CGaussianNaiveBayes(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Predicts the class of one sample: the class whose probability    |
//| (from calcProba) is highest. Returns -1 when the sample size     |
//| does not match the training data.                                |
//+------------------------------------------------------------------+
int CGaussianNaiveBayes::predict_bin(vector &x)
 {
   if (x.Size() != m_cols)
    {
      Print("CRITICAL | The given x have different size than the trained x");
      return (-1);
    }
   vector probas = calcProba(x);
   ulong best_class = probas.ArgMax(); //index of the most probable class
   return((int)classes[best_class]);
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Returns the per-class probabilities for one sample, or an empty  |
//| vector when the sample size does not match the training data.    |
//+------------------------------------------------------------------+
vector CGaussianNaiveBayes::predict_proba(vector &x)
 {
   //fixed: removed "vector x = x;" — a self-initializing shadow of the parameter
   vector ret_v = {};
   if (x.Size() != m_cols)
    {
      Print("CRITICAL | The given x have different size than the trained x");
      return (ret_v);
    }
   ret_v = calcProba(x);
   return (ret_v);
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
vector CGaussianNaiveBayes::predict_bin(matrix &x)
{
ulong rows = x.Rows();
vector v(rows), pred(rows);
for (ulong i=0; i> Proba ",proba," prior proba ",c_prior_proba);
#endif
}
//--- Normalize probabilities
proba_v = proba_v / proba_v.Sum();
return proba_v;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
*/
================================================
FILE: Sklearn/Naive Bayes/README.md
================================================
## Naive Bayes Classifier
This documentation explains the `CNaiveBayes` class in MQL5, which implements a **Naive Bayes classifier** for classification tasks.
**I. Naive Bayes Theory:**
Naive Bayes is a probabilistic classifier based on **Bayes' theorem**. It assumes that the features used for classification are **independent** of each other given the class label. This simplifies the calculations involved in making predictions.
**II. CNaiveBayes Class:**
The `CNaiveBayes` class provides functionalities for training and using a Naive Bayes classifier in MQL5:
**Public Functions:**
* **CNaiveBayes(void):** Constructor.
* **~CNaiveBayes(void):** Destructor.
* **void fit(matrix &x, vector &y):** Trains the model on the provided data (`x` - features, `y` - target labels).
* **int predict(vector &x):** Predicts the class label for a single input vector.
* **vector predict(matrix &x):** Predicts class labels for all rows in the input matrix.
**Internal Variables:**
* `n_features`: Number of features in the data.
* `y_target`: Vector of target labels used during training.
* `classes`: Vector containing the available class labels.
* `class_proba`: Vector storing the prior probability of each class.
* `features_proba`: Vector storing the conditional probability of each feature value given each class (declared as a `vector` in the class).
* `c_prior_proba`: Vector storing the calculated prior probability of each class after training.
* `c_evidence`: Vector storing the calculated class evidence for a new data point.
* `calcProba(vector &v_features)`: Internal function (not directly accessible) that likely calculates the class probabilities for a given feature vector.
**III. Class Functionality:**
1. **Training:**
* The `fit` function takes the input data (features and labels) and performs the following:
* Calculates the prior probability of each class (number of samples belonging to each class divided by the total number of samples).
* Estimates the conditional probability of each feature value given each class (using techniques like Laplace smoothing to handle unseen features).
* These probabilities are stored in the internal variables for later use in prediction.
2. **Prediction:**
* The `predict` functions take a new data point (feature vector) and:
* Calculate the class evidence for each class using Bayes' theorem, considering the prior probabilities and conditional probabilities of the features.
* The class with the **highest class evidence** is predicted as the most likely class for the new data point.
**IV. Additional Notes:**
* The class assumes the data is already preprocessed and ready for use.
**Reference**
* [Data Science and Machine Learning (Part 11): Naïve Bayes, Probability theory in Trading](https://www.mql5.com/en/articles/12184)
================================================
FILE: Sklearn/Naive Bayes/naive bayes visuals.py
================================================
# -*- coding: utf-8 -*-
"""
Created on Tue Feb 14 10:37:36 2023

@author: Omega Joctan

Plots the distribution of every variable exported by the Naive Bayes
MQL5 program, so the Gaussian assumption can be inspected visually.
"""
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Change this directory to be the one containing the Files
directory = r"C:\Users\Omega Joctan\AppData\Roaming\MetaQuotes\Terminal\F4F6C6D7A7155578A6DEA66D12B1D40D\MQL5\Files\NAIVE BAYES"

data = pd.read_csv(f"{directory}\\vars.csv")

for var in data:
    # sns.distplot was deprecated in seaborn 0.11 and later removed;
    # histplot with a KDE overlay on a density scale is its replacement.
    sns.histplot(data[var], kde=True, stat="density")
    plt.show()
================================================
FILE: Sklearn/Neighbors/KNN_nearest_neighbors.mqh
================================================
//+------------------------------------------------------------------+
//| KNN_nearest_neighbors.mqh |
//| Copyright 2022, Omega Joctan. |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2022, Omega Joctan."
#property link "https://www.mql5.com/en/users/omegajoctan"
//+------------------------------------------------------------------+
bool isdebug = true;
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| K-nearest-neighbors classifier over a data matrix whose last     |
//| column holds the target class.                                   |
//+------------------------------------------------------------------+
class CKNNNearestNeighbors
{
private:
uint k; //number of neighbors consulted (kept odd to avoid voting ties)
matrix Matrix; //training data, last column = target
ulong m_rows, m_cols; //training-matrix dimensions
vector m_target; //target column extracted from Matrix
vector m_classesVector; //unique class labels
matrix m_classesMatrix; //per-class storage used internally
double Euclidean_distance(const vector &v1, const vector &v2); //distance between two samples
vector ClassVector(); //global vector of target classes
void MatrixRemoveRow(matrix &mat, ulong row); //drop one row in-place
void VectorRemoveIndex(vector &v, ulong index); //drop one element in-place
double Mse(vector &A, vector &P); //mean squared error between actual and predicted
public:
CKNNNearestNeighbors(matrix &Matrix_, uint k_);
CKNNNearestNeighbors(matrix &Matrix_); //k defaults to the nearest odd number to sqrt(rows)
~CKNNNearestNeighbors(void);
int KNNAlgorithm(vector &vector_); //classify one sample by majority vote of the k neighbors
vector CrossValidation_LOOCV(uint initial_k = 0, uint final_k=1); //Leave One out Cross Validation (LOOCV)
matrix ConfusionMatrix(vector &A,vector &P); //confusion matrix between actual and predicted labels
float TrainTest(double train_size = 0.7); //returns accuracy of the tested dataset
};
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Builds the classifier from the data matrix (last column = target)|
//| with an explicit k; an even k is bumped to the next odd number   |
//| so majority voting cannot tie.                                   |
//+------------------------------------------------------------------+
CKNNNearestNeighbors::CKNNNearestNeighbors(matrix &Matrix_, uint k_)
 {
   k = (k_ % 2 == 0) ? k_ + 1 : k_;
   if (k != k_ && isdebug)
      printf("K = %d is an even number, It will be added by One so it becomes an odd Number %d", k_, k);
   Matrix.Copy(Matrix_);
   m_rows   = Matrix.Rows();
   m_cols   = Matrix.Cols();
   m_target = Matrix.Col(m_cols-1); //last column holds the class labels
   m_classesVector = ClassVector();
   if (isdebug)
      Print("classes vector | Neighbors ", m_classesVector);
 }
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Builds the classifier choosing k automatically: the rule of      |
//| thumb k = sqrt(n), bumped to the next odd number to avoid ties.  |
//+------------------------------------------------------------------+
CKNNNearestNeighbors::CKNNNearestNeighbors(matrix &Matrix_)
 {
   Matrix.Copy(Matrix_);
   uint root = (uint)round(MathSqrt(Matrix.Rows()));
   k = (root % 2 == 0) ? root + 1 : root; //make sure the value of k is an odd number
   m_rows   = Matrix.Rows();
   m_cols   = Matrix.Cols();
   m_target = Matrix.Col(m_cols-1); //last column holds the class labels
   m_classesVector = ClassVector();
   Print("classes vector | Neighbors ", m_classesVector);
 }
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Clears the stored state (Matrix and m_target are left to their   |
//| own destructors).                                                |
//+------------------------------------------------------------------+
CKNNNearestNeighbors::~CKNNNearestNeighbors(void)
{
ZeroMemory(k);
ZeroMemory(m_classesVector);
ZeroMemory(m_classesMatrix);
}
//+------------------------------------------------------------------+
int CKNNNearestNeighbors::KNNAlgorithm(vector &vector_)
{
vector vector_2 = {};
vector euc_dist;
euc_dist.Resize(m_rows);
//matrix temp_matrix = Matrix;
//temp_matrix.Resize(Matrix.Rows(), Matrix.Cols()-1); //remove the last column of independent variables
for(ulong i=0; i (int)k)
{
max = ArrayMaximum(eucArray);
ArrayRemove(eucArray, max, 1);
ArrayRemove(track, max, 1);
}
}
ArrayCopy(NN, eucArray);
/*
Print("NN ");
ArrayPrint(NN);
Print("Track ");
ArrayPrint(track);
*/
//--- Voting process
vector votes(m_classesVector.Size());
for(ulong i=0; i1) k = z;
double sum_mse = 0;
for (ulong i=0; i ",acc,"%");
return(acc);
}
//+------------------------------------------------------------------+
================================================
FILE: Sklearn/Tree/README.md
================================================
## Decision Trees in MQL5: Classification and Regression
Decision trees are powerful machine learning algorithms that use a tree-like structure to make predictions. They work by splitting the data based on features (independent variables) into increasingly homogeneous subsets, ultimately reaching leaves representing the final prediction. MQL5 offers functionalities for implementing both **classification** and **regression** decision trees through the `tree.mqh` library.
**Decision Tree Theory (Basic Overview):**
1. **Start with the entire dataset at the root node.**
2. **Choose the feature and threshold that best splits the data into two subsets such that each subset is more homogeneous concerning the target variable (dependent variable).**
* For classification, this often involves maximizing information gain or minimizing Gini impurity.
* For regression, it involves maximizing variance reduction between the parent node and child nodes.
3. **Repeat step 2 for each child node recursively until a stopping criterion is met (e.g., reaching a maximum depth, minimum samples per node, or sufficient homogeneity).**
4. **Assign a prediction value to each leaf node.**
* For classification, this is the most frequent class in the leaf node.
* For regression, this is the average value of the target variable in the leaf node.
**CDecisionTreeClassifier Class:**
This class implements a decision tree for classification tasks. It offers the following functionalities:
* `CDecisionTreeClassifier(uint min_samples_split=2, uint max_depth=2, mode mode_=MODE_GINI)` Constructor, allows setting hyperparameters (minimum samples per split, maximum tree depth, and splitting criterion).
* `~CDecisionTreeClassifier(void)` Destructor.
* `void fit(const matrix &x, const vector &y)` Trains the model on the provided data (`x` - independent variables, `y` - class labels).
* `void print_tree(Node *tree, string indent=" ", string padl="")` Prints the tree structure in a readable format.
* `double predict(const vector &x)` Predicts the class label for a new data point (`x`).
* `vector predict(const matrix &x)` Predicts class labels for multiple new data points (`x`).
**CDecisionTreeRegressor Class:**
This class inherits from `CDecisionTreeClassifier` and specializes in regression tasks. It overrides specific functions and implements different splitting criteria:
* `CDecisionTreeRegressor(uint min_samples_split=2, uint max_depth=2):` Constructor, allows setting hyperparameters (minimum samples per split and maximum tree depth).
* `~CDecisionTreeRegressor(void):` Destructor.
* `void fit(matrix &x, vector &y):` Trains the model on the provided data (`x` - independent variables, `y` - continuous values).
* `double predict(const vector &x)` Predicts the continuous value for a new data point (`x`).
**Additional Notes:**
* Both classes use internal helper functions for building the tree, calculating splitting criteria (information gain, Gini impurity, variance reduction), and making predictions.
* The `check_is_fitted` function ensures the model is trained before allowing predictions.
* Choosing appropriate hyperparameters (especially maximum depth) is crucial to avoid overfitting the model.
**Reference**
[Data Science and Machine Learning (Part 16): A Refreshing Look at Decision Trees](https://www.mql5.com/en/articles/13862)
================================================
FILE: Sklearn/Tree/tree.mqh
================================================
//+------------------------------------------------------------------+
//| tree.mqh |
//| Copyright 2023, Omega Joctan |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2023, Omega Joctan"
#property link "https://www.mql5.com/en/users/omegajoctan"
//+------------------------------------------------------------------+
//| defines |
//+------------------------------------------------------------------+
#include
#define log2(leaf_value) MathLog(leaf_value) / MathLog(2)
//+------------------------------------------------------------------+
//| A single node of a decision tree: either a decision node (split  |
//| on feature_index/threshold) or a leaf (leaf_value set).          |
//+------------------------------------------------------------------+
class Node
{
public:
// for decision node
uint feature_index; //column the node splits on
double threshold; //split threshold for that column
double info_gain; //information gain achieved by the split
// for leaf node
double leaf_value; //value held by a leaf; NULL (0) marks a decision node
Node *left_child; //left child Node
Node *right_child; //right child Node
// default constructor: zero every field — the scalar members were previously
// left uninitialized, making the leaf/decision check in print_tree unreliable
Node() : feature_index(0), threshold(0.0), info_gain(NULL), leaf_value(NULL), left_child(NULL), right_child(NULL) {}
Node(int feature_index_, double threshold_=0.0, Node *left_=NULL, Node *right_=NULL, double info_gain_=NULL, double value_=NULL)
: left_child(left_), right_child(right_)
{
this.feature_index = feature_index_;
this.threshold = threshold_;
this.info_gain = info_gain_;
this.leaf_value = value_;
}
//--- dumps the node fields for debugging
void __Print__()
{
printf("feature_index: %d \nthreshold: %f \ninfo_gain: %f \nleaf_value: %f",feature_index,threshold, info_gain, leaf_value);
}
};
//+------------------------------------------------------------------+
//| Result of splitting a dataset at a (feature, threshold) pair.    |
//+------------------------------------------------------------------+
struct split_info
{
uint feature_index; //column the split was made on
double threshold; //threshold value used for the split
matrix dataset_left, //rows on the low side of the threshold — confirm <= vs < against split_data
dataset_right; //rows on the high side of the threshold
double info_gain; //information gain achieved by this split
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
enum mode {MODE_ENTROPY, MODE_GINI};
//+------------------------------------------------------------------+
//| CART-style decision-tree classifier supporting gini or entropy   |
//| splitting criteria.                                              |
//+------------------------------------------------------------------+
class CDecisionTreeClassifier
{
protected:
Node *build_tree(matrix &data, uint curr_depth=0); //recursively grows the tree from the [x|y] data matrix
double calculate_leaf_value(vector &Y); //label assigned to a leaf — presumably the majority class; confirm in implementation
bool is_fitted; //set once a tree has been built
//--- guards predictions requested before the model has been trained
bool check_is_fitted(string func)
{
if (!is_fitted)
{
Print(func," Tree not trained, Call fit function first to train the model");
return false;
}
return (true);
}
//---
uint m_max_depth; //maximum tree depth
uint m_min_samples_split; //minimum samples required to split a node
mode m_mode; //splitting criterion (gini | entropy)
double gini_index(vector &y); //gini impurity of a label vector
double entropy(vector &y); //entropy of a label vector
double information_gain(vector &parent, vector &l_child, vector &r_child); //criterion reduction achieved by a split
split_info get_best_split(const matrix &data, uint num_features); //best (feature, threshold) over all candidates
split_info split_data(const matrix &data, uint feature_index, double threshold=0.5); //partition rows on one feature
double make_predictions(const vector &x, const Node &tree); //walk the tree for a single sample
void delete_tree(Node* node); //recursively free a subtree
Node *nodes[]; //Keeping track of all the nodes in a tree
public:
Node *root; //root of the fitted tree
CDecisionTreeClassifier(uint min_samples_split=2, uint max_depth=2, mode mode_=MODE_GINI);
~CDecisionTreeClassifier(void);
void fit(const matrix &x, const vector &y); //train on features x and labels y
void print_tree(Node *tree, string indent=" ",string padl=""); //pretty-print the fitted tree
double predict(const vector &x); //predicted class for one sample
vector predict(const matrix &x); //predicted classes for every row of x
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Stores the tree hyper-parameters; the model is untrained until   |
//| fit is called.                                                   |
//+------------------------------------------------------------------+
CDecisionTreeClassifier::CDecisionTreeClassifier(uint min_samples_split=2, uint max_depth=2, mode mode_=MODE_GINI)
 {
   m_min_samples_split = min_samples_split;
   m_max_depth = max_depth;
   m_mode = mode_;
   is_fitted = false; //fixed: was left uninitialized, so check_is_fitted read an indeterminate value before the first fit
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Frees the fitted tree and every tracked node. delete_tree's      |
//| CheckPointer guard skips pointers already invalidated by an      |
//| earlier delete, which prevents double-deletes when a node is     |
//| reachable both from root and from the nodes[] array.             |
//+------------------------------------------------------------------+
CDecisionTreeClassifier::~CDecisionTreeClassifier(void)
{
#ifdef DEBUG_MODE
Print(__FUNCTION__," Deleting Tree nodes =",nodes.Size());
#endif
this.delete_tree(root); //free the tree reachable from the root
for (int i=0; i<(int)nodes.Size(); i++)
this.delete_tree(nodes[i]); //sweep any node not reachable from root (e.g. from an aborted build)
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Recursively frees a subtree. Invalid (or already freed) pointers |
//| are skipped, so the traversal is safe on partially built trees.  |
//+------------------------------------------------------------------+
void CDecisionTreeClassifier::delete_tree(Node* node)
 {
   if (CheckPointer(node) == POINTER_INVALID)
      return; //nothing to free
//--- post-order: release both subtrees before the node itself
   delete_tree(node.left_child);
   delete_tree(node.right_child);
   delete node;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Gini impurity of a label vector: 1 - sum(p_i^2) over the class   |
//| proportions p_i. 0 means a pure node.                            |
//+------------------------------------------------------------------+
double CDecisionTreeClassifier::gini_index(vector &y)
 {
   vector counts = CUtils::Unique_count(y);       //samples per class
   vector p = counts / (double)y.Size();          //class proportions
   double sum_of_squares = MathPow(p, 2).Sum();
   return 1.0 - sum_of_squares;
 }
//+------------------------------------------------------------------+
//| function to compute entropy |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Shannon entropy (base 2) of a label vector:                      |
//| -sum(p_i * log2(p_i)) over the class proportions p_i.            |
//+------------------------------------------------------------------+
double CDecisionTreeClassifier::entropy(vector &y)
 {
   vector counts = CUtils::Unique_count(y);   //samples per class (all > 0)
   vector p_cls = counts / double(y.Size());  //class proportions
   vector terms = (-1 * p_cls) * log2(p_cls); //per-class entropy contribution
   return terms.Sum();
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
//+------------------------------------------------------------------+
//| Information gain of a split: parent impurity minus the size-     |
//| weighted impurity of the two children, using the configured      |
//| criterion (gini or entropy).                                     |
//+------------------------------------------------------------------+
double CDecisionTreeClassifier::information_gain(vector &parent, vector &l_child, vector &r_child)
 {
   double w_left  = l_child.Size() / (double)parent.Size();
   double w_right = r_child.Size() / (double)parent.Size();
   if (m_mode == MODE_GINI)
      return gini_index(parent) - ( (w_left*gini_index(l_child)) + (w_right*gini_index(r_child)) );
   if (m_mode == MODE_ENTROPY)
      return entropy(parent) - ( (w_left*entropy(l_child)) + (w_right*entropy(r_child)) );
   return 0; //unknown mode: no gain
 }
//+------------------------------------------------------------------+
//| function to print the tree |
//+------------------------------------------------------------------+
// Recursively prints the fitted tree in a human-readable indented form.
// `indent` labels the branch ("left"/"right"); `padl` accumulates the
// visual padding for the current depth.
// Fix: guard against invalid/NULL pointers — build_tree can legitimately
// return NULL children, and the original dereferenced them unconditionally.
void CDecisionTreeClassifier::print_tree(Node *tree, string indent=" ",string padl="")
 {
   if (CheckPointer(tree) == POINTER_INVALID)
      return; // nothing to print for a missing subtree
   // NOTE(review): NULL compares as 0 for doubles in MQL5, so a genuine
   // leaf value of 0 would be treated as "not a leaf" here — confirm the
   // sentinel used by the Node class before relying on class label 0.
   if (tree.leaf_value != NULL)
      Print((padl+indent+": "),tree.leaf_value);
   else //if we havent' reached the leaf node keep printing child trees
     {
      padl += " ";
      Print((padl+indent)+": X_",tree.feature_index, "<=", tree.threshold, "?", tree.info_gain);
      print_tree(tree.left_child, "left","--->"+padl);
      print_tree(tree.right_child, "right","--->"+padl);
     }
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Trains the classifier: appends the target vector y as the last column of
// the feature matrix x, then grows the tree from the combined dataset.
void CDecisionTreeClassifier::fit(const matrix &x, const vector &y)
 {
   matrix train_data = CUtils::concatenate(x, y, 1); // axis=1: y becomes the last column
   this.root = this.build_tree(train_data);
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// split_data: partitions `data` row-wise on `feature_index` against
// `threshold` — rows whose feature value is <= threshold go left, the
// rest go right — returning both halves in a split_info struct.
//
// NOTE(review): the text below appears TRUNCATED by extraction — the row
// loop at "for (ulong i=0; i0 && ..." has lost its condition and several
// statements, and the declaration/opening of get_best_split (whose body
// this text falls through into) is missing entirely. Code is left
// byte-identical; restore from the upstream repository before compiling.
split_info CDecisionTreeClassifier::split_data(const matrix &data, uint feature_index, double threshold=0.5)
{
int left_size=0, right_size =0;
vector row = {};
split_info split;
ulong cols = data.Cols(),
rows = data.Rows();
// start both output matrices empty, with the same column count as `data`
split.dataset_left.Resize(0, cols);
split.dataset_right.Resize(0, cols);
for (ulong i=0; i0 && split.dataset_right.Rows() > 0)
{
// (from here on the text belongs to get_best_split: evaluate the
// candidate split's information gain and keep it if it beats the best
// split found so far)
y_v = data.Col(data.Cols()-1);
right_v = split.dataset_right.Col(split.dataset_right.Cols()-1);
left_v = split.dataset_left.Col(split.dataset_left.Cols()-1);
double curr_info_gain = this.information_gain(y_v, left_v, right_v);
if (curr_info_gain > max_info_gain)
{
#ifdef DEBUG_MODE
printf(" split left: [%dx%d] split right: [%dx%d] curr_info_gain: %f max_info_gain: %f",split.dataset_left.Rows(),split.dataset_left.Cols(),split.dataset_right.Rows(),split.dataset_right.Cols(),curr_info_gain,max_info_gain);
#endif
best_split.feature_index = i;
best_split.threshold = possible_thresholds[j];
best_split.dataset_left = split.dataset_left;
best_split.dataset_right = split.dataset_right;
best_split.info_gain = curr_info_gain;
max_info_gain = curr_info_gain;
}
}
}
}
return best_split;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Recursively grows the decision tree from `data` (features + target as
// the last column). Returns the subtree's root node, or NULL when the
// input cannot be split into X and Y.
// Fix: the original indexed the tracking array with nodes.Size()-1 AFTER
// the recursive calls, but those calls resize `nodes`, so each parent
// overwrote a descendant's slot and left its own slot empty (NULL).
// The slot index is now captured immediately after ArrayResize.
Node *CDecisionTreeClassifier::build_tree(matrix &data, uint curr_depth=0)
 {
   matrix X;
   vector Y;
   if (!CUtils::XandYSplitMatrices(data,X,Y)) //Split the input matrix into feature matrix X and target vector Y.
     {
      #ifdef DEBUG_MODE
      printf("%s Line %d Failed to build a tree Data Empty",__FUNCTION__,__LINE__);
      #endif
      return NULL; //return null pointer
     }
   is_fitted = true;
   ulong samples = X.Rows(), features = X.Cols(); //Get the number of samples and features in the dataset.
   ArrayResize(nodes, nodes.Size()+1);            //Append a tracking slot for this call's node
   uint node_index = nodes.Size()-1;              //remember it: recursion below grows `nodes`
   Node *left_child, *right_child;
   if (samples >= m_min_samples_split && curr_depth<=m_max_depth)
     {
      split_info best_split = this.get_best_split(data, (uint)features);
      #ifdef DEBUG_MODE
      Print(__FUNCTION__," | ",__LINE__,"\nbest_split left: [",best_split.dataset_left.Rows(),"x",best_split.dataset_left.Cols(),"]\nbest_split right: [",best_split.dataset_right.Rows(),"x",best_split.dataset_right.Cols(),"]\nfeature_index: ",best_split.feature_index,"\nInfo gain: ",best_split.info_gain,"\nThreshold: ",best_split.threshold);
      #endif
      if (best_split.info_gain > 0) //a useful split exists: make a decision node
        {
         left_child = this.build_tree(best_split.dataset_left, curr_depth+1);
         right_child = this.build_tree(best_split.dataset_right, curr_depth+1);
         nodes[node_index] = new Node(best_split.feature_index,best_split.threshold,left_child,right_child,best_split.info_gain);
         return nodes[node_index];
        }
     }
   //--- stopping condition reached: create a leaf holding the majority class
   nodes[node_index] = new Node();
   nodes[node_index].leaf_value = this.calculate_leaf_value(Y);
   return nodes[node_index];
 }
//+------------------------------------------------------------------+
//| returns the element from Y that has the highest count, |
//| effectively finding the most common element in the list. |
//+------------------------------------------------------------------+
// Majority vote: returns the class label that occurs most often in Y
// (counts and labels are assumed aligned, as the original relies on).
double CDecisionTreeClassifier::calculate_leaf_value(vector &Y)
 {
   vector counts = CUtils::Unique_count(Y); // per-class occurrence counts
   vector labels = CUtils::Unique(Y);       // the distinct class labels
   return labels[counts.ArgMax()];
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Walks a single feature vector x down the (sub)tree rooted at `tree`
// and returns the leaf value reached. Returns 0 when the model is not
// fitted or when a required child pointer is invalid.
double CDecisionTreeClassifier::make_predictions(const vector &x, const Node &tree)
{
if (!check_is_fitted(__FUNCTION__))
return 0;
//if (CheckPointer(tree)=POINTER_INVALID)
// NOTE(review): NULL compares as 0 for doubles in MQL5, so a decision
// node is distinguished from a leaf only if real leaves never hold 0 —
// confirm the Node class's leaf sentinel.
if (tree.leaf_value != NULL) //This is a leaf_value
return tree.leaf_value;
#ifdef DEBUG_MODE
printf("Tree.threshold %f tree.feature_index %d leaf_value %f",tree.threshold,tree.feature_index,tree.leaf_value);
#endif
// defensive: feature index beyond x means the tree was built on wider data
if (tree.feature_index>=x.Size())
return tree.leaf_value;
double feature_value = x[tree.feature_index];
double pred = 0;
// descend left when the feature is at or below the node's threshold,
// right otherwise; skip descent (pred stays 0) if the child is invalid
if (feature_value <= tree.threshold)
{
if (CheckPointer(tree.left_child)!=POINTER_INVALID)
pred = this.make_predictions(x, tree.left_child);
}
else
{
if (CheckPointer(tree.right_child)!=POINTER_INVALID)
pred = this.make_predictions(x, tree.right_child);
}
return pred;
}
//+------------------------------------------------------------------+
//| Commonly used for making predictions in REAL-TIME |
//+------------------------------------------------------------------+
// Predicts the class for a single feature vector by routing it down the
// fitted tree; returns 0 when the model has not been fitted yet.
double CDecisionTreeClassifier::predict(const vector &x)
 {
   return !check_is_fitted(__FUNCTION__) ? 0 : this.make_predictions(x, this.root);
 }
//+------------------------------------------------------------------+
//| Commonly used for making predictions in TRAIN-TEST |
//+------------------------------------------------------------------+
// Batch prediction: returns one predicted class per row of x.
//
// NOTE(review): the text below appears TRUNCATED by extraction — the row
// loop at "for (ulong i=0; i0 && ..." has lost its condition and body,
// and the declarations of CDecisionTreeRegressor::variance_reduction and
// the opening of CDecisionTreeRegressor::get_best_split (whose body this
// text falls through into) are missing. Code is left byte-identical;
// restore from the upstream repository before compiling.
vector CDecisionTreeClassifier::predict(const matrix &x)
{
vector ret(x.Rows());
if (!check_is_fitted(__FUNCTION__))
return ret;
for (ulong i=0; i0 && split.dataset_right.Rows() > 0)
{
// (from here on the text belongs to CDecisionTreeRegressor::get_best_split:
// score the candidate split by variance reduction and keep the best)
y_v = data.Col(data.Cols()-1);
right_v = split.dataset_right.Col(split.dataset_right.Cols()-1);
left_v = split.dataset_left.Col(split.dataset_left.Cols()-1);
double curr_info_gain = this.variance_reduction(y_v, left_v, right_v);
if (curr_info_gain > max_info_gain)
{
#ifdef DEBUG_MODE
printf(__FUNCTION__," | ",__LINE__,"\nsplit left: [%dx%d] split right: [%dx%d] curr_info_gain: %f max_info_gain: %f",split.dataset_left.Rows(),split.dataset_left.Cols(),split.dataset_right.Rows(),split.dataset_right.Cols(),curr_info_gain,max_info_gain);
#endif
best_split.feature_index = i;
best_split.threshold = possible_thresholds[j];
best_split.dataset_left = split.dataset_left;
best_split.dataset_right = split.dataset_right;
best_split.info_gain = curr_info_gain;
max_info_gain = curr_info_gain;
}
}
}
}
return best_split;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Recursively grows the regression tree from `data` (features + target as
// the last column). Returns the subtree's root node, or NULL when the
// input cannot be split into X and Y.
// Fix: same slot-index bug as the classifier — nodes.Size()-1 evaluated
// after the recursive calls pointed at a descendant's slot because those
// calls resize `nodes`; the index is now captured before recursing.
Node *CDecisionTreeRegressor::build_tree(matrix &data, uint curr_depth=0)
 {
   matrix X;
   vector Y;
   if (!CUtils::XandYSplitMatrices(data,X,Y)) //Split the input matrix into feature matrix X and target vector Y.
     {
      #ifdef DEBUG_MODE
      printf("%s Line %d Failed to build a tree Data Empty",__FUNCTION__,__LINE__);
      #endif
      return NULL; //Return a NULL pointer
     }
   ulong samples = X.Rows(), features = X.Cols(); //Get the number of samples and features in the dataset.
   ArrayResize(nodes, nodes.Size()+1);            //Append a tracking slot for this call's node
   uint node_index = nodes.Size()-1;              //remember it: recursion below grows `nodes`
   Node *left_child, *right_child;
   if (samples >= m_min_samples_split && curr_depth<=m_max_depth)
     {
      split_info best_split = this.get_best_split(data, (uint)features);
      #ifdef DEBUG_MODE
      Print(__FUNCTION__," | ",__LINE__,"\nbest_split left: [",best_split.dataset_left.Rows(),"x",best_split.dataset_left.Cols(),"]\nbest_split right: [",best_split.dataset_right.Rows(),"x",best_split.dataset_right.Cols(),"]\nfeature_index: ",best_split.feature_index,"\nInfo gain: ",best_split.info_gain,"\nThreshold: ",best_split.threshold);
      #endif
      if (best_split.info_gain > 0) //a useful split exists: make a decision node
        {
         left_child = this.build_tree(best_split.dataset_left, curr_depth+1);
         right_child = this.build_tree(best_split.dataset_right, curr_depth+1);
         nodes[node_index] = new Node(best_split.feature_index,best_split.threshold,left_child,right_child,best_split.info_gain);
         return nodes[node_index];
        }
     }
   //--- stopping condition reached: create a leaf holding the mean target
   nodes[node_index] = new Node();
   nodes[node_index].leaf_value = this.calculate_leaf_value(Y);
   return nodes[node_index];
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Trains the regressor: stacks the target vector y as the last column of
// the feature matrix x, grows the tree, and marks the model as fitted.
void CDecisionTreeRegressor::fit(matrix &x, vector &y)
 {
   matrix train_data = CUtils::concatenate(x, y, 1); // axis=1: y becomes the last column
   this.root = this.build_tree(train_data);
   is_fitted = true; // model is now ready for predict()
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// A regression leaf predicts the mean of the target values that reached it.
double CDecisionTreeRegressor::calculate_leaf_value(vector &Y)
 {
   double mean_target = Y.Mean();
   return mean_target;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
================================================
FILE: Sklearn/metrics.mqh
================================================
//+------------------------------------------------------------------+
//| metrics.mqh |
//| Copyright 2022, Fxalgebra.com |
//| https://www.mql5.com/en/users/omegajoctan |
//+------------------------------------------------------------------+
#property copyright "Copyright 2022, Fxalgebra.com"
#property link "https://www.mql5.com/en/users/omegajoctan"
//+------------------------------------------------------------------+
//| defines |
//| |
//| |
//+------------------------------------------------------------------+
#include
#include
// Holds the points of a ROC curve as parallel vectors.
struct roc_curve_struct
{
vector TPR,       // true positive rate (sensitivity / recall) per class
FPR,              // false positive rate per class
Thresholds;       // decision thresholds the rates were computed at
};
// Confusion matrix plus the per-class counts derived from it.
struct confusion_matrix_struct
{
matrix MATRIX;    // classes x classes count matrix
vector CLASSES;   // the distinct class labels, in MATRIX row/column order
vector TP,        // true positives per class (the matrix diagonal)
TN,               // true negatives per class
FP,               // false positives per class
FN;               // false negatives per class
};
// Selector for Metrics::RegressionMetric dispatch.
enum regression_metrics
{
METRIC_R_SQUARED, // R-squared
METRIC_ADJUSTED_R, // Adjusted R-squared
METRIC_RSS, // Residual Sum of Squares
METRIC_MSE, // Mean Squared Error
METRIC_RMSE, // Root Mean Squared Error
METRIC_MAE // Mean Absolute Error
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Static collection of regression and classification evaluation metrics.
// All methods take a ground-truth vector (`True`) and a prediction vector
// and are callable without instantiating the class.
class Metrics
{
protected:
// counts samples where True==value_A and B==value_B (confusion cell)
static int SearchPatterns(const vector &True, int value_A, const vector &B, int value_B);
// builds the full confusion matrix and per-class TP/TN/FP/FN counts
static confusion_matrix_struct confusion_matrix(const vector &True, const vector &Preds);
public:
Metrics(void);
~Metrics(void);
//--- Regression metrics
static double r_squared(const vector &True, const vector &Pred);
static double adjusted_r(const vector &True, const vector &Pred, uint indep_vars = 1);
static double rss(const vector &True, const vector &Pred);
static double mse(const vector &True, const vector &Pred);
static double rmse(const vector &True, const vector &Pred);
static double mae(const vector &True, const vector &Pred);
// dispatches to one of the above according to METRIC_
static double RegressionMetric(const vector &True, const vector &Pred, regression_metrics METRIC_);
//--- Classification metrics (per-class vectors unless noted)
static double accuracy_score(const vector &True, const vector &Pred); // overall scalar accuracy
static vector accuracy(const vector &True, const vector &Preds);
static vector precision(const vector &True, const vector &Preds);
static vector recall(const vector &True, const vector &Preds);
static vector f1_score(const vector &True, const vector &Preds);
static vector specificity(const vector &True, const vector &Preds);
static roc_curve_struct roc_curve(const vector &True, const vector &Preds, bool show_roc_curve=false);
// prints confusion matrix, per-class table, averages, and optionally the ROC curve
static void classification_report(const vector &True, const vector &Pred, bool show_roc_curve=false);
};
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Default constructor: all members are static, nothing to initialize.
Metrics::Metrics(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Destructor: no resources to release.
Metrics::~Metrics(void)
{
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Coefficient of determination (R²), delegated to the built-in
// vector regression metric.
double Metrics::r_squared(const vector &True, const vector &Pred)
 {
   double r2 = Pred.RegressionMetric(True, REGRESSION_R2);
   return r2;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Adjusted R²: penalizes R² for the number of independent variables.
// Returns 0 (with a message) on size mismatch, or when N <= indep_vars + 1 —
// the original computed (N - indep_vars - 1) in unsigned arithmetic there,
// underflowing to a huge value or dividing by zero.
double Metrics::adjusted_r(const vector &True, const vector &Pred, uint indep_vars = 1)
 {
   if(True.Size() != Pred.Size())
     {
      Print(__FUNCTION__, " Vector True and P are not equal in size ");
      return(0);
     }
   ulong N = Pred.Size();
   if(N <= indep_vars + 1) //formula undefined: denominator would be <= 0
     {
      Print(__FUNCTION__, " Not enough samples for adjusted R-squared ");
      return(0);
     }
   double r2 = r_squared(True, Pred);
   return(1 - ((1 - r2) * double(N - 1)) / double(N - indep_vars - 1));
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Builds a classes x classes confusion matrix from ground truth and
// predictions, and derives per-class TP/FP/FN/TN counts from it.
confusion_matrix_struct Metrics::confusion_matrix(const vector &True, const vector &Preds)
{
confusion_matrix_struct confusion_matrix;
vector classes = CNumpy::unique(True).unique; // distinct labels observed in True
confusion_matrix.CLASSES = classes;
//--- Fill the confusion matrix: cell [i][j] counts samples whose true
//--- label is classes[i] and predicted label is classes[j]
matrix MATRIX(classes.Size(), classes.Size());
MATRIX.Fill(0.0);
for(ulong i = 0; i < classes.Size(); i++)
for(ulong j = 0; j < classes.Size(); j++)
MATRIX[i][j] = SearchPatterns(True, (int)classes[i], Preds, (int)classes[j]);
confusion_matrix.MATRIX = MATRIX;
//--- derive per-class counts; Sum(0)/Sum(1) are the axis-wise sums
//--- (presumably column/row totals — verify against the MQL5 matrix docs)
confusion_matrix.TP = MATRIX.Diag();
confusion_matrix.FP = MATRIX.Sum(0) - confusion_matrix.TP;
confusion_matrix.FN = MATRIX.Sum(1) - confusion_matrix.TP;
confusion_matrix.TN = MATRIX.Sum() - (confusion_matrix.TP + confusion_matrix.FP + confusion_matrix.FN);
return confusion_matrix;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Per-class accuracy: (TP + TN) / total samples, one entry per class.
// Fix: adds the DBL_EPSILON denominator guard used by every sibling metric
// (precision/recall/specificity), so empty input no longer divides by zero.
vector Metrics::accuracy(const vector &True,const vector &Preds)
 {
   confusion_matrix_struct conf_m = confusion_matrix(True, Preds);
   return (conf_m.TP + conf_m.TN) / (conf_m.MATRIX.Sum() + DBL_EPSILON);
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Per-class precision: TP / (TP + FP); DBL_EPSILON avoids division by zero
// for classes that were never predicted.
vector Metrics::precision(const vector &True,const vector &Preds)
 {
   confusion_matrix_struct cm = confusion_matrix(True, Preds);
   vector denom = cm.TP + cm.FP + DBL_EPSILON;
   return cm.TP / denom;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Per-class F1 score: harmonic mean of precision and recall.
// Locals renamed so they no longer shadow the precision()/recall() methods.
vector Metrics::f1_score(const vector &True,const vector &Preds)
 {
   vector prec = precision(True, Preds);
   vector rec = recall(True, Preds);
   return 2 * prec * rec / (prec + rec + DBL_EPSILON);
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Per-class recall (sensitivity): TP / (TP + FN); DBL_EPSILON avoids
// division by zero for classes absent from the ground truth.
vector Metrics::recall(const vector &True,const vector &Preds)
 {
   confusion_matrix_struct cm = confusion_matrix(True, Preds);
   vector denom = cm.TP + cm.FN + DBL_EPSILON;
   return cm.TP / denom;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Per-class specificity (true negative rate): TN / (TN + FP);
// DBL_EPSILON avoids division by zero.
vector Metrics::specificity(const vector &True,const vector &Preds)
 {
   confusion_matrix_struct cm = confusion_matrix(True, Preds);
   vector denom = cm.TN + cm.FP + DBL_EPSILON;
   return cm.TN / denom;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Computes per-class ROC points (TPR vs FPR) from the confusion matrix and
// optionally plots them, blocking until the user dismisses the dialog.
// Note: Thresholds is left unfilled here.
roc_curve_struct Metrics::roc_curve(const vector &True,const vector &Preds, bool show_roc_curve=false)
{
roc_curve_struct roc;
confusion_matrix_struct conf_m = confusion_matrix(True, Preds);
roc.TPR = recall(True, Preds);                              // TPR == recall
roc.FPR = conf_m.FP / (conf_m.FP + conf_m.TN + DBL_EPSILON); // epsilon guards /0
if (show_roc_curve)
{
CPlots plt;
plt.Plot("Roc Curve",roc.FPR,roc.TPR,"roc_curve","False Positive Rate(FPR)","True Positive Rate(TPR)");
// busy-wait until MessageBox returns a valid button id (keeps the chart up)
while (MessageBox("Close or Cancel ROC CURVE to proceed","Roc Curve",MB_OK)<0)
Sleep(1);
}
return roc;
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Overall accuracy: correctly classified samples (matrix diagonal)
// divided by all samples; DBL_EPSILON guards the empty-input case.
double Metrics::accuracy_score(const vector &True, const vector &Preds)
 {
   confusion_matrix_struct cm = confusion_matrix(True, Preds);
   double correct = cm.MATRIX.Diag().Sum();
   double total = cm.MATRIX.Sum() + DBL_EPSILON;
   return correct / total;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Prints a sklearn-style classification report: the confusion matrix, a
// per-class table (precision, recall, specificity, f1, support), overall
// accuracy, macro average, and support-weighted average; finally computes
// (and optionally shows) the ROC curve.
// Note: the local vectors deliberately shadow the same-named metric methods.
void Metrics::classification_report(const vector &True, const vector &Pred, bool show_roc_curve=false)
{
vector accuracy = accuracy(True, Pred);
vector precision = precision(True, Pred);
vector specificity = specificity(True, Pred);
vector recall = recall(True, Pred);
vector f1_score = f1_score(True, Pred);
double acc = accuracy_score(True, Pred);
confusion_matrix_struct conf_m = confusion_matrix(True, Pred);
//--- support: number of true samples per class (row sums of the matrix)
ulong size = conf_m.MATRIX.Rows();
vector support(size);
for(ulong i = 0; i < size; i++)
support[i] = NormalizeDouble(MathIsValidNumber(conf_m.MATRIX.Row(i).Sum()) ? conf_m.MATRIX.Row(i).Sum() : 0, 8);
int total_size = (int)conf_m.MATRIX.Sum();
//--- Avg and w avg: [precision, recall, specificity, f1, support]
vector avg, w_avg;
avg.Resize(5);
w_avg.Resize(5);
avg[0] = precision.Mean();
avg[1] = recall.Mean();
avg[2] = specificity.Mean();
avg[3] = f1_score.Mean();
avg[4] = total_size;
//--- w avg: each metric weighted by its class's share of the samples
vector support_prop = support / double(total_size + 1e-10);
vector c = precision * support_prop;
w_avg[0] = c.Sum();
c = recall * support_prop;
w_avg[1] = c.Sum();
c = specificity * support_prop;
w_avg[2] = c.Sum();
c = f1_score * support_prop;
w_avg[3] = c.Sum();
w_avg[4] = (int)total_size;
//--- Report: tab-padded columns aligned for the terminal output
string report = "\n[CLS] \t\t\t\t\t\t\tprecision \trecall \tspecificity \tf1 score \tsupport";
for(ulong i = 0; i < size; i++)
{
report += "\n\t\t[" + string(conf_m.CLASSES[i])+"]\t\t\t";
//for (ulong j=0; j<3; j++)
report += StringFormat("\t\t\t\t\t %.2f \t\t\t\t\t %.2f \t\t\t\t\t %.2f \t\t\t\t\t %.2f \t\t\t\t %d", precision[i], recall[i], specificity[i], f1_score[i], (int)support[i]);
}
report += "\n";
report += StringFormat("\naccuracy\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t\t %.2f \t\t\t\t %d",acc,(int)conf_m.MATRIX.Sum());
report += StringFormat("\naverage\t\t\t\t\t\t\t\t\t %.2f \t\t\t\t\t %.2f \t\t\t\t\t %.2f \t\t\t\t\t %.2f \t\t\t\t %d", avg[0], avg[1], avg[2], avg[3], (int)avg[4]);
report += StringFormat("\nWeighed avg\t\t\t \t %.2f \t\t\t\t\t %.2f \t\t\t\t\t %.2f \t\t\t\t\t %.2f \t\t\t\t %d", w_avg[0], w_avg[1], w_avg[2], w_avg[3], (int)w_avg[4]);
Print("Confusion Matrix\n", conf_m.MATRIX);
Print("\nClassification Report\n", report);
roc_curve(True, Pred, show_roc_curve);
}
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Residual sum of squares: sum((True - Pred)^2).
double Metrics::rss(const vector &True, const vector &Pred)
 {
   vector residuals = True - Pred;
   residuals = MathPow(residuals, 2);
   return (residuals.Sum());
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Mean squared error: mean((True - Pred)^2).
// Fix: returns 0 (with a message) for empty or size-mismatched inputs —
// the original divided by c.Size() unguarded, risking a division by zero,
// and silently produced garbage on mismatched sizes.
double Metrics::mse(const vector &True, const vector &Pred)
 {
   if(True.Size() == 0 || True.Size() != Pred.Size())
     {
      Print(__FUNCTION__, " Invalid input vectors ");
      return(0);
     }
   vector c = True - Pred;
   c = MathPow(c, 2);
   return(c.Sum() / c.Size());
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Counts the positions where `True` holds value_A while `B` holds value_B —
// i.e. one cell of the confusion matrix (assumes equal-length vectors).
int Metrics::SearchPatterns(const vector &True, int value_A, const vector &B, int value_B)
 {
   int matches = 0;
   for(ulong idx = 0; idx < True.Size(); idx++)
     {
      if(True[idx] == value_A && B[idx] == value_B)
         matches++;
     }
   return matches;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Root mean squared error, delegated to the built-in vector metric.
double Metrics::rmse(const vector &True, const vector &Pred)
 {
   double err = Pred.RegressionMetric(True, REGRESSION_RMSE);
   return err;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Mean absolute error, delegated to the built-in vector metric.
double Metrics::mae(const vector &True, const vector &Pred)
 {
   double err = Pred.RegressionMetric(True, REGRESSION_MAE);
   return err;
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
// Dispatches to the regression metric selected by METRIC_;
// returns 0 for an unrecognized selector (same as the original default).
double Metrics::RegressionMetric(const vector &True,const vector &Pred,regression_metrics METRIC_)
 {
   switch (METRIC_)
     {
      case METRIC_MSE:        return mse(True, Pred);
      case METRIC_RMSE:       return rmse(True, Pred);
      case METRIC_MAE:        return mae(True, Pred);
      case METRIC_RSS:        return rss(True, Pred);
      case METRIC_R_SQUARED:  return r_squared(True, Pred);
      case METRIC_ADJUSTED_R: return adjusted_r(True, Pred);
      default:                return 0;
     }
 }
//+------------------------------------------------------------------+
//| |
//+------------------------------------------------------------------+
================================================
FILE: Stats Models/ADF.mqh
================================================
//+------------------------------------------------------------------+
//| ADF.mqh |
//| Copyright 2023, MetaQuotes Ltd. |
//| https://www.mql5.com |
//+------------------------------------------------------------------+
#property copyright "Copyright 2023, MetaQuotes Ltd."
#property link "https://www.mql5.com"
#include