fix: error handling in opening of external files (neural_network.cpp). (#1044)

* Error handling of files

* exit -> std::exit

* Improved overall error handling and reporting

* Test commit: added spaces in an include to try to trigger GitHub Actions

* updating DIRECTORY.md

* clang-format and clang-tidy fixes for 51e943d0

Co-authored-by: Krishna Vedala <7001608+kvedala@users.noreply.github.com>
Co-authored-by: github-actions <${GITHUB_ACTOR}@users.noreply.github.com>
Deep Raval 2020-08-26 23:26:31 +05:30 committed by GitHub
parent c4f586b6ab
commit 44f4f4d6c3
2 changed files with 970 additions and 896 deletions

neural_network.cpp

@@ -2,36 +2,43 @@
 * @file
 * @author [Deep Raval](https://github.com/imdeep2905)
 *
 * @brief Implementation of [Multilayer Perceptron]
 * (https://en.wikipedia.org/wiki/Multilayer_perceptron).
 *
 * @details
 * A multilayer perceptron (MLP) is a class of feedforward artificial neural
 * network (ANN). The term MLP is used ambiguously, sometimes loosely to any
 * feedforward ANN, sometimes strictly to refer to networks composed of multiple
 * layers of perceptrons (with threshold activation). Multilayer perceptrons are
 * sometimes colloquially referred to as "vanilla" neural networks, especially
 * when they have a single hidden layer.
 *
 * An MLP consists of at least three layers of nodes: an input layer, a hidden
 * layer and an output layer. Except for the input nodes, each node is a neuron
 * that uses a nonlinear activation function. MLP utilizes a supervised learning
 * technique called backpropagation for training. Its multiple layers and
 * non-linear activation distinguish MLP from a linear perceptron. It can
 * distinguish data that is not linearly separable.
 *
 * See [Backpropagation](https://en.wikipedia.org/wiki/Backpropagation) for
 * training algorithm.
 *
 * \note This implementation uses mini-batch gradient descent as optimizer and
 * MSE as loss function. Bias is also not included.
 */

#include <algorithm>
#include <cassert>
#include <chrono>
#include <cmath>
#include <fstream>
#include <iostream>
#include <sstream>
#include <string>
#include <valarray>
#include <vector>

#include "vector_ops.hpp"  // Custom header file for vector operations

/** \namespace machine_learning
 * \brief Machine learning algorithms
@@ -50,54 +57,42 @@ namespace machine_learning {
 * @param X Value
 * @return Returns sigmoid(x)
 */
double sigmoid(const double &x) { return 1.0 / (1.0 + std::exp(-x)); }
/**
 * Derivative of sigmoid function
 * @param X Value
 * @return Returns derivative of sigmoid(x)
 */
double dsigmoid(const double &x) { return x * (1 - x); }
/**
 * Relu function
 * @param X Value
 * @returns relu(x)
 */
double relu(const double &x) { return std::max(0.0, x); }
/**
 * Derivative of relu function
 * @param X Value
 * @returns derivative of relu(x)
 */
double drelu(const double &x) { return x >= 0.0 ? 1.0 : 0.0; }
/**
 * Tanh function
 * @param X Value
 * @return Returns tanh(x)
 */
double tanh(const double &x) { return 2 / (1 + std::exp(-2 * x)) - 1; }
/**
 * Derivative of tanh function
 * @param X Value
 * @return Returns derivative of tanh(x)
 */
double dtanh(const double &x) { return 1 - x * x; }
}  // namespace activations
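Note that the derivative helpers above are written in terms of a layer's output rather than its raw input: fit() later applies dactivation_function to activations[j + 1], i.e. to values that have already passed through the activation. A small hedged illustration (values purely for illustration):

    double y = machine_learning::neural_network::activations::sigmoid(0.0);  // y = 0.5
    double s = machine_learning::neural_network::activations::dsigmoid(y);   // 0.5 * (1 - 0.5) = 0.25, the slope of sigmoid at 0
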
/** \namespace util_functions
 * \brief Various utility functions used in Neural network
@@ -108,17 +103,13 @@ namespace machine_learning {
 * @param X Value
 * @return Returns x * x
 */
double square(const double &x) { return x * x; }
/**
 * Identity function
 * @param X Value
 * @return Returns x
 */
double identity_function(const double &x) { return x; }
}  // namespace util_functions
/** \namespace layers
 * \brief This namespace contains layers used
@@ -126,9 +117,9 @@ namespace machine_learning {
 */
namespace layers {
/**
 * neural_network::layers::DenseLayer class is used to store all necessary
 * information about the layers (i.e. neurons, activation and kernal). This
 * class is used by NeuralNetwork class to store layers.
 *
 */
class DenseLayer {
@@ -147,32 +138,30 @@ namespace machine_learning {
     * @param kernal_shape shape of kernal
     * @param random_kernal flag for whether to initialize kernal randomly
     */
    DenseLayer(const int &neurons, const std::string &activation,
               const std::pair<size_t, size_t> &kernal_shape,
               const bool &random_kernal) {
        // Choosing activation (and its derivative)
        if (activation == "sigmoid") {
            activation_function = neural_network::activations::sigmoid;
            dactivation_function = neural_network::activations::sigmoid;
        } else if (activation == "relu") {
            activation_function = neural_network::activations::relu;
            dactivation_function = neural_network::activations::drelu;
        } else if (activation == "tanh") {
            activation_function = neural_network::activations::tanh;
            dactivation_function = neural_network::activations::dtanh;
        } else if (activation == "none") {
            // Set identity function in case none is supplied
            activation_function =
                neural_network::util_functions::identity_function;
            dactivation_function =
                neural_network::util_functions::identity_function;
        } else {
            // If supplied activation is invalid
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr << "Invalid argument. Expected {none, sigmoid, relu, "
                         "tanh} got ";
            std::cerr << activation << std::endl;
            std::exit(EXIT_FAILURE);
        }
@@ -181,8 +170,7 @@ namespace machine_learning {
        // Initialize kernal according to flag
        if (random_kernal) {
            uniform_random_initialization(kernal, kernal_shape, -1.0, 1.0);
        } else {
            unit_matrix_initialization(kernal, kernal_shape);
        }
    }
@@ -192,31 +180,29 @@ namespace machine_learning {
     * @param activation activation function for layer
     * @param kernal values of kernal (useful in loading model)
     */
    DenseLayer(const int &neurons, const std::string &activation,
               const std::vector<std::valarray<double>> &kernal) {
        // Choosing activation (and its derivative)
        if (activation == "sigmoid") {
            activation_function = neural_network::activations::sigmoid;
            dactivation_function = neural_network::activations::sigmoid;
        } else if (activation == "relu") {
            activation_function = neural_network::activations::relu;
            dactivation_function = neural_network::activations::drelu;
        } else if (activation == "tanh") {
            activation_function = neural_network::activations::tanh;
            dactivation_function = neural_network::activations::dtanh;
        } else if (activation == "none") {
            // Set identity function in case none is supplied
            activation_function =
                neural_network::util_functions::identity_function;
            dactivation_function =
                neural_network::util_functions::identity_function;
        } else {
            // If supplied activation is invalid
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr << "Invalid argument. Expected {none, sigmoid, relu, "
                         "tanh} got ";
            std::cerr << activation << std::endl;
            std::exit(EXIT_FAILURE);
        }
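For orientation, a hedged sketch of how a layer like this gets constructed; the numbers are only illustrative, and NeuralNetwork itself passes {previous_layer_neurons, neurons} as the kernal shape:

    // Hypothetical 6-neuron relu layer fed by a 4-neuron layer: 4x6 random kernal.
    machine_learning::neural_network::layers::DenseLayer hidden(6, "relu", {4, 6}, true);
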
@@ -267,25 +253,29 @@ namespace machine_learning {
     * @param config vector containing pair (neurons, activation)
     * @param kernals vector containing all pretrained kernals
     */
    NeuralNetwork(
        const std::vector<std::pair<int, std::string>> &config,
        const std::vector<std::vector<std::valarray<double>>> &kernals) {
        // First layer should not have activation
        if (config.begin()->second != "none") {
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr
                << "First layer can't have activation other than none got "
                << config.begin()->second;
            std::cerr << std::endl;
            std::exit(EXIT_FAILURE);
        }
        // Network should have at least two layers
        if (config.size() <= 1) {
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr << "Invalid size of network, ";
            std::cerr << "Atleast two layers are required";
            std::exit(EXIT_FAILURE);
        }
        // Reconstructing all pretrained layers
        for (size_t i = 0; i < config.size(); i++) {
            layers.emplace_back(neural_network::layers::DenseLayer(
                config[i].first, config[i].second, kernals[i]));
        }
        std::cout << "INFO: Network constructed successfully" << std::endl;
    }
@@ -307,6 +297,7 @@ namespace machine_learning {
        }
        return details;
    }

 public:
    /**
     * Default Constructor for class NeuralNetwork. This constructor
@@ -319,31 +310,34 @@ namespace machine_learning {
     * is used by user.
     * @param config vector containing pair (neurons, activation)
     */
    explicit NeuralNetwork(
        const std::vector<std::pair<int, std::string>> &config) {
        // First layer should not have activation
        if (config.begin()->second != "none") {
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr
                << "First layer can't have activation other than none got "
                << config.begin()->second;
            std::cerr << std::endl;
            std::exit(EXIT_FAILURE);
        }
        // Network should have at least two layers
        if (config.size() <= 1) {
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr << "Invalid size of network, ";
            std::cerr << "Atleast two layers are required";
            std::exit(EXIT_FAILURE);
        }
        // Separately creating first layer so it can have unit matrix
        // as kernal.
        layers.push_back(neural_network::layers::DenseLayer(
            config[0].first, config[0].second,
            {config[0].first, config[0].first}, false));
        // Creating remaining layers
        for (size_t i = 1; i < config.size(); i++) {
            layers.push_back(neural_network::layers::DenseLayer(
                config[i].first, config[i].second,
                {config[i - 1].first, config[i].first}, true));
        }
        std::cout << "INFO: Network constructed successfully" << std::endl;
    }
@@ -383,23 +377,29 @@ namespace machine_learning {
     * @param slip_lines number of lines to skip
     * @return returns pair of X and Y
     */
    std::pair<std::vector<std::vector<std::valarray<double>>>,
              std::vector<std::vector<std::valarray<double>>>>
    get_XY_from_csv(const std::string &file_name, const bool &last_label,
                    const bool &normalize, const int &slip_lines = 1) {
        std::ifstream in_file;                          // Ifstream to read file
        in_file.open(file_name.c_str(), std::ios::in);  // Open file
        // If there is any problem in opening file
        if (!in_file.is_open()) {
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr << "Unable to open file: " << file_name << std::endl;
            std::exit(EXIT_FAILURE);
        }
        std::vector<std::vector<std::valarray<double>>> X,
            Y;             // To store X and Y
        std::string line;  // To store each line
        // Skip lines
        for (int i = 0; i < slip_lines; i++) {
            std::getline(in_file, line, '\n');  // Ignore line
        }
        // While file has information
        while (!in_file.eof() && std::getline(in_file, line, '\n')) {
            std::valarray<double> x_data,
                y_data;                  // To store single sample and label
            std::stringstream ss(line);  // Constructing stringstream from line
            std::string token;  // To store each token in line (separated by ',')
            while (std::getline(ss, token, ',')) {  // For each token
@@ -418,8 +418,7 @@ namespace machine_learning {
                    y_data[0] = x_data[x_data.size() - 1];
                }
                x_data = pop_back(x_data);  // Remove label from x_data
            } else {
                y_data.resize(this->layers.back().neurons);
                // If task is classification
                if (y_data.size() > 1) {
@@ -435,12 +434,12 @@ namespace machine_learning {
            X.push_back({x_data});
            Y.push_back({y_data});
        }
        // Normalize training data if flag is set
        if (normalize) {
            // Scale data between 0 and 1 using min-max scaler
            X = minmax_scaler(X, 0.01, 1.0);
        }
        in_file.close();         // Closing file
        return make_pair(X, Y);  // Return pair of X and Y
    }
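For clarity, a hypothetical CSV accepted by this reader, matching the slip_lines = 2 and last_label = true arguments used in test() below; the first two lines are skipped and the trailing numeric column is treated as the label:

    # iris.csv, layout for illustration only
    sepal_length,sepal_width,petal_length,petal_width,class
    5.0,3.4,1.6,0.4,0
    6.4,2.9,4.3,1.3,1
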
@@ -449,8 +448,8 @@ namespace machine_learning {
     * @param X array of feature vectors
     * @return returns predictions as vector
     */
    std::vector<std::valarray<double>> single_predict(
        const std::vector<std::valarray<double>> &X) {
        // Get activations of all layers
        auto activations = this->__detailed_single_prediction(X);
        // Return activations of last layer (actual predicted values)
@@ -462,10 +461,11 @@ namespace machine_learning {
     * @param X array of feature vectors
     * @return returns predicted values as vector
     */
    std::vector<std::vector<std::valarray<double>>> batch_predict(
        const std::vector<std::vector<std::valarray<double>>> &X) {
        // Store predicted values
        std::vector<std::vector<std::valarray<double>>> predicted_batch(
            X.size());
        for (size_t i = 0; i < X.size(); i++) {  // For every sample
            // Push predicted values
            predicted_batch[i] = this->single_predict(X[i]);
@@ -484,14 +484,13 @@ namespace machine_learning {
     */
    void fit(const std::vector<std::vector<std::valarray<double>>> &X_,
             const std::vector<std::vector<std::valarray<double>>> &Y_,
             const int &epochs = 100, const double &learning_rate = 0.01,
             const size_t &batch_size = 32, const bool &shuffle = true) {
        std::vector<std::vector<std::valarray<double>>> X = X_, Y = Y_;
        // Both label and input data should have same size
        if (X.size() != Y.size()) {
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr << "X and Y in fit have different sizes" << std::endl;
            std::exit(EXIT_FAILURE);
        }
        std::cout << "INFO: Training Started" << std::endl;
@@ -500,12 +499,17 @@ namespace machine_learning {
            if (shuffle) {
                equal_shuffle(X, Y);
            }
            auto start =
                std::chrono::high_resolution_clock::now();  // Start clock
            double loss = 0,
                   acc = 0;  // Initialize performance metrics with zero
            // For each starting index of batch
            for (size_t batch_start = 0; batch_start < X.size();
                 batch_start += batch_size) {
                for (size_t i = batch_start;
                     i < std::min(X.size(), batch_start + batch_size); i++) {
                    std::vector<std::valarray<double>> grad, cur_error,
                        predicted;
                    auto activations = this->__detailed_single_prediction(X[i]);
                    // Gradients vector to store gradients for all layers
                    // They will be averaged and applied to kernal
@@ -513,12 +517,14 @@ namespace machine_learning {
                    gradients.resize(this->layers.size());
                    // First initialize gradients to zero
                    for (size_t i = 0; i < gradients.size(); i++) {
                        zeroes_initialization(
                            gradients[i], get_shape(this->layers[i].kernal));
                    }
                    predicted = activations.back();  // Predicted vector
                    cur_error = predicted - Y[i];    // Absolute error
                    // Calculating loss with MSE
                    loss += sum(apply_function(
                        cur_error, neural_network::util_functions::square));
                    // If prediction is correct
                    if (argmax(predicted) == argmax(Y[i])) {
                        acc += 1;
@@ -526,13 +532,16 @@ namespace machine_learning {
                    // For every layer (except first) starting from last one
                    for (size_t j = this->layers.size() - 1; j >= 1; j--) {
                        // Backpropagating errors
                        cur_error = hadamard_product(
                            cur_error,
                            apply_function(
                                activations[j + 1],
                                this->layers[j].dactivation_function));
                        // Calculating gradient for current layer
                        grad = multiply(transpose(activations[j]), cur_error);
                        // Change error according to current kernal values
                        cur_error = multiply(cur_error,
                                             transpose(this->layers[j].kernal));
                        // Adding gradient values to collection of gradients
                        gradients[j] = gradients[j] + grad / double(batch_size);
                    }
@@ -544,9 +553,12 @@ namespace machine_learning {
                    }
                }
            }
            auto stop =
                std::chrono::high_resolution_clock::now();  // Stopping the clock
            // Calculate time taken by epoch
            auto duration =
                std::chrono::duration_cast<std::chrono::microseconds>(stop -
                                                                      start);
            loss /= X.size();        // Averaging loss
            acc /= X.size();         // Averaging accuracy
            std::cout.precision(4);  // set output precision to 4
@@ -554,7 +566,8 @@ namespace machine_learning {
            std::cout << "Training: Epoch " << epoch << '/' << epochs;
            std::cout << ", Loss: " << loss;
            std::cout << ", Accuracy: " << acc;
            std::cout << ", Taken time: " << duration.count() / 1e6
                      << " seconds";
            std::cout << std::endl;
        }
        return;
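For completeness, a hedged usage sketch of fit() with in-memory data; shapes and values are illustrative, and each sample and label is a 1xN row as produced by get_XY_from_csv() above:

    // Hypothetical call on an already constructed network `net`:
    // 50 epochs, learning rate 0.1, batch size 16, shuffling enabled.
    std::vector<std::vector<std::valarray<double>>> X = {{{0.1, 0.2, 0.3, 0.4}}};
    std::vector<std::vector<std::valarray<double>>> Y = {{{1.0, 0.0, 0.0}}};
    net.fit(X, Y, 50, 0.1, 16, true);
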
@@ -571,18 +584,17 @@ namespace machine_learning {
     * @param batch_size batch size for gradient descent (default = 32)
     * @param shuffle flag for whether to shuffle data (default = true)
     */
    void fit_from_csv(const std::string &file_name, const bool &last_label,
                      const int &epochs, const double &learning_rate,
                      const bool &normalize, const int &slip_lines = 1,
                      const size_t &batch_size = 32,
                      const bool &shuffle = true) {
        // Getting training data from csv file
        auto data =
            this->get_XY_from_csv(file_name, last_label, normalize, slip_lines);
        // Fit the model on training data
        this->fit(data.first, data.second, epochs, learning_rate, batch_size,
                  shuffle);
        return;
    }
@@ -597,14 +609,16 @@ namespace machine_learning {
        double acc = 0, loss = 0;  // initialize performance metrics with zero
        for (size_t i = 0; i < X.size(); i++) {  // For every sample in input
            // Get predictions
            std::vector<std::valarray<double>> pred =
                this->single_predict(X[i]);
            // If predicted class is correct
            if (argmax(pred) == argmax(Y[i])) {
                acc += 1;  // Increment accuracy
            }
            // Calculating loss - Mean Squared Error
            loss += sum(apply_function((Y[i] - pred),
                                       neural_network::util_functions::square) *
                        0.5);
        }
        acc /= X.size();   // Averaging accuracy
        loss /= X.size();  // Averaging loss
@@ -621,12 +635,11 @@ namespace machine_learning {
     * @param normalize flag for whether to normalize data
     * @param slip_lines number of lines to skip
     */
    void evaluate_from_csv(const std::string &file_name, const bool &last_label,
                           const bool &normalize, const int &slip_lines = 1) {
        // Getting training data from csv file
        auto data =
            this->get_XY_from_csv(file_name, last_label, normalize, slip_lines);
        // Evaluating model
        this->evaluate(data.first, data.second);
        return;
@@ -644,20 +657,27 @@ namespace machine_learning {
        }
        std::ofstream out_file;  // Ofstream to write in file
        // Open file in out|trunc mode
        out_file.open(file_name.c_str(),
                      std::ofstream::out | std::ofstream::trunc);
        // If there is any problem in opening file
        if (!out_file.is_open()) {
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr << "Unable to open file: " << file_name << std::endl;
            std::exit(EXIT_FAILURE);
        }
        /**
            Format in which model is saved:
            total_layers
            neurons(1st neural_network::layers::DenseLayer) activation_name(1st
            neural_network::layers::DenseLayer) kernal_shape(1st
            neural_network::layers::DenseLayer) kernal_values
            .
            .
            .
            neurons(Nth neural_network::layers::DenseLayer) activation_name(Nth
            neural_network::layers::DenseLayer) kernal_shape(Nth
            neural_network::layers::DenseLayer) kernal_value
            For example, pretrained model with 3 layers:
            <pre>
@@ -700,6 +720,7 @@ namespace machine_learning {
        }
        std::cout << "INFO: Model saved successfully with name : ";
        std::cout << file_name << std::endl;
        out_file.close();  // Closing file
        return;
    }
@@ -711,8 +732,15 @@ namespace machine_learning {
    NeuralNetwork load_model(const std::string &file_name) {
        std::ifstream in_file;            // Ifstream to read file
        in_file.open(file_name.c_str());  // Opening file
        // If there is any problem in opening file
        if (!in_file.is_open()) {
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr << "Unable to open file: " << file_name << std::endl;
            std::exit(EXIT_FAILURE);
        }
        std::vector<std::pair<int, std::string>> config;  // To store config
        std::vector<std::vector<std::valarray<double>>>
            kernals;  // To store pretrained kernals
        // Loading model from saved file format
        size_t total_layers = 0;
        in_file >> total_layers;
@@ -729,11 +757,14 @@ namespace machine_learning {
                }
                kernal.push_back(row);
            }
            config.emplace_back(make_pair(neurons, activation));
            kernals.emplace_back(kernal);
        }
        std::cout << "INFO: Model loaded successfully" << std::endl;
        in_file.close();  // Closing file
        return NeuralNetwork(
            config, kernals);  // Return instance of NeuralNetwork class
    }
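A hedged round-trip sketch for save_model() and load_model() above, on some already trained instance myNN; the file name is only an example:

    // Hypothetical: persist a trained network and rebuild an equivalent one.
    myNN.save_model("model.txt");
    machine_learning::neural_network::NeuralNetwork restored =
        myNN.load_model("model.txt");
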
    /**
@@ -741,20 +772,28 @@ namespace machine_learning {
     */
    void summary() {
        // Printing Summary
        std::cout
            << "==============================================================="
            << std::endl;
        std::cout << "\t\t+ MODEL SUMMARY +\t\t\n";
        std::cout
            << "==============================================================="
            << std::endl;
        for (size_t i = 1; i <= layers.size(); i++) {  // For every layer
            std::cout << i << ")";
            std::cout << " Neurons : "
                      << layers[i - 1].neurons;  // number of neurons
            std::cout << ", Activation : "
                      << layers[i - 1].activation;  // activation
            std::cout << ", Kernal Shape : "
                      << get_shape(layers[i - 1].kernal);  // kernal shape
            std::cout << std::endl;
        }
        std::cout
            << "==============================================================="
            << std::endl;
        return;
    }
};
}  // namespace neural_network
}  // namespace machine_learning
@@ -768,17 +807,22 @@ static void test() {
    machine_learning::neural_network::NeuralNetwork myNN =
        machine_learning::neural_network::NeuralNetwork({
            {4, "none"},  // First layer with 4 neurons and "none" as activation
            {6,
             "relu"},  // Second layer with 6 neurons and "relu" as activation
            {3, "sigmoid"}  // Third layer with 3 neurons and "sigmoid" as
                            // activation
        });
    // Printing summary of model
    myNN.summary();
    // Training Model
    myNN.fit_from_csv("iris.csv", true, 100, 0.3, false, 2, 32, true);
    // Testing predictions of model
    assert(machine_learning::argmax(
               myNN.single_predict({{5, 3.4, 1.6, 0.4}})) == 0);
    assert(machine_learning::argmax(
               myNN.single_predict({{6.4, 2.9, 4.3, 1.3}})) == 1);
    assert(machine_learning::argmax(
               myNN.single_predict({{6.2, 3.4, 5.4, 2.3}})) == 2);
    return;
}

vector_ops.hpp

@@ -2,19 +2,20 @@
 * @file vector_ops.hpp
 * @author [Deep Raval](https://github.com/imdeep2905)
 *
 * @brief Various functions for vectors associated with [NeuralNetwork (aka
 * Multilayer Perceptron)]
 * (https://en.wikipedia.org/wiki/Multilayer_perceptron).
 *
 */
#ifndef VECTOR_OPS_FOR_NN
#define VECTOR_OPS_FOR_NN

#include <algorithm>
#include <chrono>
#include <iostream>
#include <random>
#include <valarray>
#include <vector>

/**
 * @namespace machine_learning
@@ -34,9 +35,9 @@ std::ostream &operator<<(std::ostream &out,
    out.precision(4);
    for (const auto &a : A) {      // For each row in A
        for (const auto &x : a) {  // For each element in row
            std::cout << x << ' ';  // print element
        }
        std::cout << std::endl;
    }
    return out;
}
@@ -52,7 +53,7 @@ std::ostream &operator<<(std::ostream &out, const std::pair<T, T> &A) {
    // Setting output precision to 4 in case of floating point numbers
    out.precision(4);
    // printing pair in the form (p, q)
    std::cout << "(" << A.first << ", " << A.second << ")";
    return out;
}
@@ -67,9 +68,9 @@ std::ostream &operator<<(std::ostream &out, const std::valarray<T> &A) {
    // Setting output precision to 4 in case of floating point numbers
    out.precision(4);
    for (const auto &a : A) {   // For every element in the vector.
        std::cout << a << ' ';  // Print element
    }
    std::cout << std::endl;
    return out;
}
@@ -101,7 +102,8 @@ template <typename T>
std::valarray<T> pop_front(const std::valarray<T> &A) {
    std::valarray<T> B;      // New 1D vector to store resultant vector
    B.resize(A.size() - 1);  // Resizing it accordingly
    for (size_t i = 1; i < A.size();
         i++) {  // For every (except first) element in A
        B[i - 1] = A[i];  // Copy element in B with left shifted position
    }
    return B;  // Return resultant vector
@@ -117,7 +119,8 @@ template <typename T>
std::valarray<T> pop_back(const std::valarray<T> &A) {
    std::valarray<T> B;      // New 1D vector to store resultant vector
    B.resize(A.size() - 1);  // Resizing it accordingly
    for (size_t i = 0; i < A.size() - 1;
         i++) {  // For every (except last) element in A
        B[i] = A[i];  // Copy element in B
    }
    return B;  // Return resultant vector
@@ -133,9 +136,10 @@ template <typename T>
void equal_shuffle(std::vector<std::vector<std::valarray<T>>> &A,
                   std::vector<std::vector<std::valarray<T>>> &B) {
    // If two vectors have different sizes
    if (A.size() != B.size()) {
        std::cerr << "ERROR (" << __func__ << ") : ";
        std::cerr
            << "Can not equally shuffle two vectors with different sizes: ";
        std::cerr << A.size() << " and " << B.size() << std::endl;
        std::exit(EXIT_FAILURE);
    }
@@ -161,14 +165,15 @@ void equal_shuffle(std::vector<std::vector<std::valarray<T>>> &A,
template <typename T>
void uniform_random_initialization(std::vector<std::valarray<T>> &A,
                                   const std::pair<size_t, size_t> &shape,
                                   const T &low, const T &high) {
    A.clear();  // Making A empty
    // Uniform distribution in range [low, high]
    std::default_random_engine generator(
        std::chrono::system_clock::now().time_since_epoch().count());
    std::uniform_real_distribution<T> distribution(low, high);
    for (size_t i = 0; i < shape.first; i++) {  // For every row
        std::valarray<T>
            row;  // Making empty row which will be inserted in vector
        row.resize(shape.second);
        for (auto &r : row) {             // For every element in row
            r = distribution(generator);  // copy random number
@@ -178,7 +183,6 @@ void uniform_random_initialization(std::vector<std::valarray<T>> &A,
    return;
}
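A hedged usage sketch for the initializer above (shape and range are illustrative):

    std::vector<std::valarray<double>> kernal;
    // Fill a 3x4 kernal with values drawn uniformly from [-1.0, 1.0].
    machine_learning::uniform_random_initialization(kernal, {3, 4}, -1.0, 1.0);
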
/**
 * Function to Initialize 2D vector as unit matrix
 * @tparam T typename of the vector
@@ -187,11 +191,11 @@ void uniform_random_initialization(std::vector<std::valarray<T>> &A,
 */
template <typename T>
void unit_matrix_initialization(std::vector<std::valarray<T>> &A,
                                const std::pair<size_t, size_t> &shape) {
    A.clear();  // Making A empty
    for (size_t i = 0; i < shape.first; i++) {
        std::valarray<T>
            row;  // Making empty row which will be inserted in vector
        row.resize(shape.second);
        row[i] = T(1);     // Insert 1 at ith position
        A.push_back(row);  // Insert new row in vector
@@ -207,11 +211,11 @@ void unit_matrix_initialization(std::vector<std::valarray<T>> &A,
 */
template <typename T>
void zeroes_initialization(std::vector<std::valarray<T>> &A,
                           const std::pair<size_t, size_t> &shape) {
    A.clear();  // Making A empty
    for (size_t i = 0; i < shape.first; i++) {
        std::valarray<T>
            row;  // Making empty row which will be inserted in vector
        row.resize(shape.second);  // By default all elements are zero
        A.push_back(row);          // Insert new row in vector
    }
@@ -245,7 +249,8 @@ std::pair<size_t, size_t> get_shape(const std::vector<std::valarray<T>> &A) {
    for (const auto &a : A) {
        // If supplied vector doesn't have same shape in all rows
        if (a.size() != sub_size) {
            std::cerr << "ERROR (" << __func__ << ") : ";
            std::cerr << "Supplied vector is not 2D Matrix" << std::endl;
            std::exit(EXIT_FAILURE);
        }
    }
@@ -261,13 +266,18 @@ std::pair<size_t, size_t> get_shape(const std::vector<std::valarray<T>> &A) {
 * @return new scaled 3D vector
 */
template <typename T>
std::vector<std::vector<std::valarray<T>>> minmax_scaler(
    const std::vector<std::vector<std::valarray<T>>> &A, const T &low,
    const T &high) {
    std::vector<std::vector<std::valarray<T>>> B =
        A;  // Copying into new vector B
    const auto shape = get_shape(B[0]);  // Storing shape of B's every element
    // As this function is used for scaling training data vector should be of
    // shape (1, X)
    if (shape.first != 1) {
        std::cerr << "ERROR (" << __func__ << ") : ";
        std::cerr
            << "Supplied vector is not supported for minmax scaling, shape: ";
        std::cerr << shape << std::endl;
        std::exit(EXIT_FAILURE);
    }
@@ -280,7 +290,8 @@ std::vector<std::vector<std::valarray<T>>> minmax_scaler(
        }
        for (size_t j = 0; j < B.size(); j++) {
            // Applying min-max scaler formula
            B[j][0][i] =
                ((B[j][0][i] - min) / (max - min)) * (high - low) + low;
        }
    }
    return B;  // Return new resultant 3D vector
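A short worked instance of the formula above: for a column with min = 1 and max = 5 scaled into [0.01, 1.0],

    // ((2 - 1) / (5 - 1)) * (1.0 - 0.01) + 0.01 = 0.2575
    // ((5 - 1) / (5 - 1)) * (1.0 - 0.01) + 0.01 = 1.0   (the column maximum maps to high)
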
@@ -295,13 +306,16 @@ std::vector<std::vector<std::valarray<T>>> minmax_scaler(
template <typename T>
size_t argmax(const std::vector<std::valarray<T>> &A) {
    const auto shape = get_shape(A);
    // As this function is used on predicted (or target) vector, shape should
    // be (1, X)
    if (shape.first != 1) {
        std::cerr << "ERROR (" << __func__ << ") : ";
        std::cerr << "Supplied vector is ineligible for argmax" << std::endl;
        std::exit(EXIT_FAILURE);
    }
    // Return distance of max element from first element (i.e. index)
    return std::distance(std::begin(A[0]),
                         std::max_element(std::begin(A[0]), std::end(A[0])));
}
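For instance, on a (1, X)-shaped row the call below returns the index of the largest entry:

    std::vector<std::valarray<double>> pred = {{0.1, 0.7, 0.2}};
    size_t cls = machine_learning::argmax(pred);  // cls == 1
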
/**
@@ -312,9 +326,10 @@ size_t argmax(const std::vector<std::valarray<T>> &A) {
 * @return new resultant vector
 */
template <typename T>
std::vector<std::valarray<T>> apply_function(
    const std::vector<std::valarray<T>> &A, T (*func)(const T &)) {
    std::vector<std::valarray<double>> B =
        A;  // New vector to store resultant vector
    for (auto &b : B) {     // For every row in vector
        b = b.apply(func);  // Apply function to that row
    }
@@ -329,8 +344,10 @@ std::vector<std::valarray<T>> apply_function(
 * @return new resultant vector
 */
template <typename T>
std::vector<std::valarray<T>> operator*(const std::vector<std::valarray<T>> &A,
                                        const T &val) {
    std::vector<std::valarray<double>> B =
        A;  // New vector to store resultant vector
    for (auto &b : B) {  // For every row in vector
        b = b * val;     // Multiply row with scalar
    }
@@ -345,8 +362,10 @@ std::vector<std::valarray<T>> operator*(const std::vector<std::valarray<T>> &A,
 * @return new resultant vector
 */
template <typename T>
std::vector<std::valarray<T>> operator/(const std::vector<std::valarray<T>> &A,
                                        const T &val) {
    std::vector<std::valarray<double>> B =
        A;  // New vector to store resultant vector
    for (auto &b : B) {  // For every row in vector
        b = b / val;     // Divide row with scalar
    }
@@ -360,7 +379,8 @@ std::vector<std::valarray<T>> operator/(const std::vector<std::valarray<T>> &A,
 * @return new resultant vector
 */
template <typename T>
std::vector<std::valarray<T>> transpose(
    const std::vector<std::valarray<T>> &A) {
    const auto shape = get_shape(A);  // Current shape of vector
    std::vector<std::valarray<T>> B;  // New vector to store result
    // Storing transpose values of A in B
@@ -383,12 +403,15 @@ std::vector<std::valarray<T>> transpose(
 * @return new resultant vector
 */
template <typename T>
std::vector<std::valarray<T>> operator+(
    const std::vector<std::valarray<T>> &A,
    const std::vector<std::valarray<T>> &B) {
    const auto shape_a = get_shape(A);
    const auto shape_b = get_shape(B);
    // If vectors don't have equal shape
    if (shape_a.first != shape_b.first || shape_a.second != shape_b.second) {
        std::cerr << "ERROR (" << __func__ << ") : ";
        std::cerr << "Supplied vectors have different shapes ";
        std::cerr << shape_a << " and " << shape_b << std::endl;
        std::exit(EXIT_FAILURE);
    }
@@ -407,12 +430,15 @@ std::vector<std::valarray<T>> operator+(
 * @return new resultant vector
 */
template <typename T>
std::vector<std::valarray<T>> operator-(
    const std::vector<std::valarray<T>> &A,
    const std::vector<std::valarray<T>> &B) {
    const auto shape_a = get_shape(A);
    const auto shape_b = get_shape(B);
    // If vectors don't have equal shape
    if (shape_a.first != shape_b.first || shape_a.second != shape_b.second) {
        std::cerr << "ERROR (" << __func__ << ") : ";
        std::cerr << "Supplied vectors have different shapes ";
        std::cerr << shape_a << " and " << shape_b << std::endl;
        std::exit(EXIT_FAILURE);
    }
@@ -431,12 +457,14 @@ std::vector<std::valarray<T>> operator-(
 * @return new resultant vector
 */
template <typename T>
std::vector<std::valarray<T>> multiply(const std::vector<std::valarray<T>> &A,
                                       const std::vector<std::valarray<T>> &B) {
    const auto shape_a = get_shape(A);
    const auto shape_b = get_shape(B);
    // If vectors are not eligible for multiplication
    if (shape_a.second != shape_b.first) {
        std::cerr << "ERROR (" << __func__ << ") : ";
        std::cerr << "Vectors are not eligible for multiplication ";
        std::cerr << shape_a << " and " << shape_b << std::endl;
        std::exit(EXIT_FAILURE);
    }
@@ -463,12 +491,15 @@ std::vector<std::valarray<T>> multiply(const std::vector<std::valarray<T>> &A,
 * @return new resultant vector
 */
template <typename T>
std::vector<std::valarray<T>> hadamard_product(
    const std::vector<std::valarray<T>> &A,
    const std::vector<std::valarray<T>> &B) {
    const auto shape_a = get_shape(A);
    const auto shape_b = get_shape(B);
    // If vectors are not eligible for hadamard product
    if (shape_a.first != shape_b.first || shape_a.second != shape_b.second) {
        std::cerr << "ERROR (" << __func__ << ") : ";
        std::cerr << "Vectors have different shapes ";
        std::cerr << shape_a << " and " << shape_b << std::endl;
        std::exit(EXIT_FAILURE);
    }
@@ -480,5 +511,4 @@ std::vector<std::valarray<T>> hadamard_product(
}
}  // namespace machine_learning
#endif
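
To close, a hedged sketch distinguishing the two products defined above (values illustrative):

    std::vector<std::valarray<double>> A = {{1.0, 2.0}, {3.0, 4.0}};
    std::vector<std::valarray<double>> B = {{5.0, 6.0}, {7.0, 8.0}};
    auto mat = machine_learning::multiply(A, B);          // matrix product: {{19, 22}, {43, 50}}
    auto had = machine_learning::hadamard_product(A, B);  // element-wise: {{5, 12}, {21, 32}}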