add namespace - machine_learning

Krishna Vedala 2020-05-31 23:00:38 -04:00
parent e9f795e9c3
commit 579620271f


@@ -31,155 +31,164 @@
#define MAX_ITER 500  // INT_MAX ///< Maximum number of iterations to learn

/** \namespace machine_learning
 * \brief Machine learning algorithms
 */
namespace machine_learning {
class adaline {
 public:
    /**
     * Default constructor
     * \param[in] num_features number of features present
     * \param[in] eta learning rate (optional, default=0.01)
     * \param[in] accuracy convergence accuracy (optional,
     * default=\f$1\times10^{-5}\f$)
     */
    adaline(int num_features, const double eta = 0.01f,
            const double accuracy = 1e-5)
        : eta(eta), accuracy(accuracy) {
        if (eta <= 0) {
            std::cerr << "learning rate should be positive and nonzero"
                      << std::endl;
            std::exit(EXIT_FAILURE);
        }

        weights = std::vector<double>(
            num_features +
            1);  // additional weight is for the constant bias term

        // initialize with random weights in the range [-50, 49]
        for (int i = 0; i < weights.size(); i++) weights[i] = 1.f;
        // weights[i] = (static_cast<double>(std::rand() % 100) - 50);
    }

    /**
     * Operator to print the weights of the model
     */
    friend std::ostream &operator<<(std::ostream &out, const adaline &ada) {
        out << "<";
        for (int i = 0; i < ada.weights.size(); i++) {
            out << ada.weights[i];
            if (i < ada.weights.size() - 1)
                out << ", ";
        }
        out << ">";
        return out;
    }

    /**
     * predict the output of the model for a given set of features
     * \param[in] x input vector
     * \param[out] out optional argument to return the neuron output before
     * applying the activation function (optional, `nullptr` to ignore)
     * \returns model prediction output
     */
    int predict(const std::vector<double> &x, double *out = nullptr) {
        if (!check_size_match(x))
            return 0;

        double y = weights.back();  // assign bias value

        // for (int i = 0; i < x.size(); i++) y += x[i] * weights[i];
        y = std::inner_product(x.begin(), x.end(), weights.begin(), y);

        if (out != nullptr)  // if out variable is provided
            *out = y;

        return activation(y);  // quantizer: apply ADALINE threshold function
    }

    /**
     * Update the weights of the model using supervised learning for one
     * feature vector
     * \param[in] x feature vector
     * \param[in] y known output value
     * \returns correction factor
     */
    double fit(const std::vector<double> &x, const int &y) {
        if (!check_size_match(x))
            return 0;

        /* output of the model with current weights */
        int p = predict(x);
        int prediction_error = y - p;  // error in estimation
        double correction_factor = eta * prediction_error;

        /* update each weight; the last weight is the bias term */
        for (int i = 0; i < x.size(); i++) {
            weights[i] += correction_factor * x[i];
        }
        weights[x.size()] += correction_factor;  // update bias

        return correction_factor;
    }

    /**
     * Update the weights of the model using supervised learning for an
     * array of feature vectors.
     * \param[in] X array of feature vectors
     * \param[in] y known output value for each feature vector
     */
    template <int N>
    void fit(std::vector<double> const (&X)[N], const int *y) {
        double avg_pred_error = 1.f;

        int iter;
        for (iter = 0; (iter < MAX_ITER) && (avg_pred_error > accuracy);
             iter++) {
            avg_pred_error = 0.f;

            // perform fit for each sample
            for (int i = 0; i < N; i++) {
                double err = fit(X[i], y[i]);
                avg_pred_error += std::abs(err);
            }
            avg_pred_error /= N;

            // Print updates every 100th iteration
            // if (iter % 100 == 0)
            std::cout << "\tIter " << iter
                      << ": Training weights: " << *this
                      << "\tAvg error: " << avg_pred_error << std::endl;
        }

        if (iter < MAX_ITER)
            std::cout << "Converged after " << iter << " iterations."
                      << std::endl;
        else
            std::cout << "Did not converge after " << iter << " iterations."
                      << std::endl;
    }

    int activation(double x) { return x > 0 ? 1 : -1; }

 private:
    /**
     * convenience function to check if the input feature vector size matches
     * the model weights size
     * \param[in] x feature vector to check
     * \returns `true` if the size matches
     * \returns `false` if the size does not match
     */
    bool check_size_match(const std::vector<double> &x) {
        if (x.size() != (weights.size() - 1)) {
            std::cerr << __func__ << ": "
                      << "Number of features in x does not match the feature "
                         "dimension in model!"
                      << std::endl;
            return false;
        }
        return true;
    }

    const double eta;             ///< learning rate of the algorithm
    const double accuracy;        ///< model fit convergence accuracy
    std::vector<double> weights;  ///< weights of the neural network
};
}  // namespace machine_learning

using machine_learning::adaline;
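For reference, the single-sample `fit` above implements the ADALINE delta rule using the quantized prediction \f$\hat{y} = \mathrm{activation}(w \cdot x + b)\f$:

\f[
w_i \leftarrow w_i + \eta\,(y - \hat{y})\,x_i, \qquad
b \leftarrow b + \eta\,(y - \hat{y})
\f]

where \f$\eta\f$ is the learning rate `eta` and \f$b\f$ is the trailing bias weight in `weights`. The array overload simply repeats this pass over all \f$N\f$ samples until the mean absolute correction drops below `accuracy` or `MAX_ITER` is reached.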
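A minimal usage sketch of the namespaced class follows; the sample points, labels, and variable names are illustrative and not part of this commit, and it assumes the file's existing includes (`<iostream>`, `<vector>`, `<numeric>`) are in scope.

    // Illustrative only: classify 2D points as +1 above the x-axis, -1 below
    int main() {
        std::vector<double> X[4] = {
            {0.0, 1.0}, {1.0, 2.0}, {0.0, -1.0}, {1.0, -2.0}};
        int y[4] = {1, 1, -1, -1};

        machine_learning::adaline model(2);  // 2 features -> 3 weights (incl. bias)
        model.fit(X, y);  // batch training; N = 4 is deduced from the array

        double net = 0;
        int label = model.predict({2.0, 5.0}, &net);
        std::cout << "prediction: " << label << " (net output " << net << ")\n";
        return 0;
    }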
/**
 * test function to predict points in a 2D coordinate system above the line