BayesNet/bayesnet/ensembles/BoostAODE.cc

// ***************************************************************
// SPDX-FileCopyrightText: Copyright 2024 Ricardo Montañana Gómez
// SPDX-FileType: SOURCE
// SPDX-License-Identifier: MIT
// ***************************************************************

#include <limits.h>
#include <algorithm>
#include <functional>
#include <random>
#include <set>
#include <tuple>
#include "BoostAODE.h"

namespace bayesnet {

    // Constructor: hands predict_voting over to the Boost base-class constructor.
    // No additional state is initialised here.
    BoostAODE::BoostAODE(bool predict_voting)
        : Boost(predict_voting)
    {}
    std::vector<int> BoostAODE::initializeModels(const Smoothing_t smoothing)
    {
        torch::Tensor weights_ = torch::full({ m }, 1.0 / m, torch::kFloat64);
        std::vector<int> featuresSelected = featureSelection(weights_);
        for (const int& feature : featuresSelected) {
            std::unique_ptr<Classifier> model = std::make_unique<SPODE>(feature);
            model->fit(dataset, features, className, states, weights_, smoothing);
            models.push_back(std::move(model));
            significanceModels.push_back(1.0); // They will be updated later in trainModel
            n_models++;
        }
        notes.push_back("Used features in initialization: " + std::to_string(featuresSelected.size()) + " of " + std::to_string(features.size()) + " with " + select_features_algorithm);
        return featuresSelected;
    }
    // Builds the ensemble by adding SPODE models pack by pack.
    //
    // Algorithm based on the AdaBoost algorithm for classification as explained
    // in Ensemble Methods (Zhi-Hua Zhou, 2012).
    //
    // Outline:
    //  - when selectFeatures is set, the ensemble is first seeded through
    //    initializeModels() and all seeded models receive the same significance;
    //  - every round ranks the features with metrics.SelectKBestWeighted() using
    //    the current sample weights (shuffled when order_algorithm is
    //    Orders.RAND), discards the features already used and fits up to k new
    //    SPODE models (k = 2^tolerance with bisection, otherwise 1);
    //  - sample weights are updated after each model (update_weights) or once
    //    per pack (update_weights_block) when block_update is set;
    //  - when convergence is enabled, the accuracy on X_test / y_test drives the
    //    tolerance counter.
    //
    // The loop stops when a weight update reports completion, when tolerance
    // exceeds maxTolerance, or when every feature has been used. The outcome is
    // reported through notes and status.
    //
    // weights:   not read by this implementation; training always starts from
    //            uniform sample weights.
    // smoothing: smoothing setting forwarded to every SPODE fit.
    void BoostAODE::trainModel(const torch::Tensor& weights, const Smoothing_t smoothing)
    {
        //
        // Logging setup
        //
        // loguru::set_thread_name("BoostAODE");
        // loguru::g_stderr_verbosity = loguru::Verbosity_OFF;
        // loguru::add_file("boostAODE.log", loguru::Truncate, loguru::Verbosity_MAX);

        fitted = true;
        double alpha_t = 0;
        torch::Tensor weights_ = torch::full({ m }, 1.0 / m, torch::kFloat64);
        bool finished = false;
        std::vector<int> featuresUsed;
        if (selectFeatures) {
            featuresUsed = initializeModels(smoothing);
            auto ypred = predict(X_train);
            std::tie(weights_, alpha_t, finished) = update_weights(y_train, ypred, weights_);
            // All the models created during initialization share the same significance
            for (int i = 0; i < n_models; ++i) {
                significanceModels[i] = alpha_t;
            }
            if (finished) {
                return;
            }
        }
        int numItemsPack = 0; // Models inserted since the last accuracy improvement
        // Variables to control the accuracy finish condition
        double priorAccuracy = 0.0;
        double improvement = 1.0;
        const double convergence_threshold = 1e-4;
        int tolerance = 0; // number of consecutive rounds with improvement below convergence_threshold
        // Step 0: Set the finish condition
        // epsilon sub t > 0.5 => inverse the weights policy
        // validation error is not decreasing
        // run out of features
        bool ascending = order_algorithm == Orders.ASC;
        std::mt19937 g{ 173 }; // fixed seed keeps the random ordering reproducible
        while (!finished) {
            // Step 1: Build ranking with mutual information (all the features, sorted)
            auto candidates = metrics.SelectKBestWeighted(weights_, ascending, n);
            if (order_algorithm == Orders.RAND) {
                std::shuffle(candidates.begin(), candidates.end(), g);
            }
            // Remove used features
            candidates.erase(
                std::remove_if(candidates.begin(), candidates.end(), [&featuresUsed](auto x) {
                    return std::find(featuresUsed.begin(), featuresUsed.end(), x) != featuresUsed.end();
                }),
                candidates.end()
            );
            // Pack size: integer power of two instead of floating point pow().
            // The exponent is clamped so the shift always stays inside int range;
            // the pack is bounded by the number of candidates anyway.
            int k = bisection ? (1 << std::min(tolerance, 30)) : 1;
            const int available = static_cast<int>(candidates.size());
            // VLOG_SCOPE_F(1, "k=%d candidates.size: %zu", k, candidates.size());
            // Walk the candidates in ranking order; no need to erase from the front
            // because the list is rebuilt on every round.
            for (int counter = 0; counter < k && counter < available; ++counter) {
                const auto feature = candidates[counter];
                std::unique_ptr<Classifier> model = std::make_unique<SPODE>(feature);
                model->fit(dataset, features, className, states, weights_, smoothing);
                alpha_t = 0.0;
                if (!block_update) {
                    auto ypred = model->predict(X_train);
                    // Step 3.1: Compute the classifier amount of say
                    std::tie(weights_, alpha_t, finished) = update_weights(y_train, ypred, weights_);
                }
                // Step 3.4: Store classifier and its accuracy to weigh its future vote
                numItemsPack++;
                featuresUsed.push_back(feature);
                models.push_back(std::move(model));
                significanceModels.push_back(alpha_t);
                n_models++;
                // VLOG_SCOPE_F(2, "numItemsPack: %d n_models: %d featuresUsed: %zu", numItemsPack, n_models, featuresUsed.size());
            }
            if (block_update) {
                // NOTE(review): k is passed even when fewer than k models were fitted
                // in this round (not enough candidates left) - confirm that
                // update_weights_block copes with that case.
                std::tie(weights_, alpha_t, finished) = update_weights_block(k, y_train, weights_);
            }
            if (convergence && !finished) {
                auto y_val_predict = predict(X_test);
                double accuracy = (y_val_predict == y_test).sum().item<double>() / static_cast<double>(y_test.size(0));
                // priorAccuracy == 0 is used as the "no previous measurement" marker.
                // NOTE(review): a measured accuracy of exactly 0 is also treated as
                // "no previous measurement" on the next round - confirm this is intended.
                if (priorAccuracy == 0) {
                    priorAccuracy = accuracy;
                } else {
                    improvement = accuracy - priorAccuracy;
                }
                if (improvement < convergence_threshold) {
                    // VLOG_SCOPE_F(3, "  (improvement<threshold) tolerance: %d numItemsPack: %d improvement: %f prior: %f current: %f", tolerance, numItemsPack, improvement, priorAccuracy, accuracy);
                    tolerance++;
                } else {
                    // VLOG_SCOPE_F(3, "* (improvement>=threshold) Reset. tolerance: %d numItemsPack: %d improvement: %f prior: %f current: %f", tolerance, numItemsPack, improvement, priorAccuracy, accuracy);
                    tolerance = 0; // Reset the counter if the model performs better
                    numItemsPack = 0;
                }
                if (convergence_best) {
                    // Keep the best accuracy until now as the prior accuracy
                    priorAccuracy = std::max(accuracy, priorAccuracy);
                } else {
                    // Keep the last accuracy obtained as the prior accuracy
                    priorAccuracy = accuracy;
                }
            }
            // VLOG_SCOPE_F(1, "tolerance: %d featuresUsed.size: %zu features.size: %zu", tolerance, featuresUsed.size(), features.size());
            finished = finished || tolerance > maxTolerance || featuresUsed.size() == features.size();
        }
        if (tolerance > maxTolerance) {
            if (numItemsPack < n_models) {
                notes.push_back("Convergence threshold reached & " + std::to_string(numItemsPack) + " models eliminated");
                // VLOG_SCOPE_F(4, "Convergence threshold reached & %d models eliminated of %d", numItemsPack, n_models);
                // Drop the models added since the last accuracy improvement
                for (int i = 0; i < numItemsPack; ++i) {
                    significanceModels.pop_back();
                    models.pop_back();
                    n_models--;
                }
            } else {
                notes.push_back("Convergence threshold reached & 0 models eliminated");
                // VLOG_SCOPE_F(4, "Convergence threshold reached & 0 models eliminated n_models=%d numItemsPack=%d", n_models, numItemsPack);
            }
        }
        if (featuresUsed.size() != features.size()) {
            notes.push_back("Used features in train: " + std::to_string(featuresUsed.size()) + " of " + std::to_string(features.size()));
            status = WARNING;
        }
        notes.push_back("Number of models: " + std::to_string(n_models));
    }
    // Produces the graph description of the ensemble by delegating to
    // Ensemble::graph with the same title; nothing is added at this level.
    std::vector<std::string> BoostAODE::graph(const std::string& title) const
    {
        std::vector<std::string> output = Ensemble::graph(title);
        return output;
    }
}
Add copyright header to source files 2024-04-11 16:02:49 +00:00			`// ***************************************************************`
			`// SPDX-FileCopyrightText: Copyright 2024 Ricardo Montañana Gómez`
			`// SPDX-FileType: SOURCE`
			`// SPDX-License-Identifier: MIT`
			`// ***************************************************************`

Extract buildModel method to parent class in Boost 2024-05-15 18:00:44 +00:00			`#include <random>`
Add hyperparameters and processing order to Boost 2023-08-20 18:31:23 +00:00			`#include <set>`
try openssl sha256 2023-10-10 16:16:43 +00:00			`#include <functional>`
			`#include <limits.h>`
Update select features models significance 2024-03-05 11:10:58 +00:00			`#include <tuple>`
try openssl sha256 2023-10-10 16:16:43 +00:00			`#include "BoostAODE.h"`
Add BoostAODE model based on AODE 2023-08-15 14:16:04 +00:00
			`namespace bayesnet {`
Update BoostAODE class structure 2024-04-02 07:52:40 +00:00
Create Boost class as Boost<x> classifiers parent 2024-05-15 17:49:15 +00:00			`BoostAODE::BoostAODE(bool predict_voting) : Boost(predict_voting)`
Refactor Hyperparameters management 2023-11-19 21:36:27 +00:00			`{`
			`}`
Set smoothing as fit parameter 2024-06-11 09:40:45 +00:00			`std::vector<int> BoostAODE::initializeModels(const Smoothing_t smoothing)`
Begin adding cfs to BoostAODE 2023-10-10 09:52:39 +00:00			`{`
Remove using namespace from Library 2023-11-08 17:45:35 +00:00			`torch::Tensor weights_ = torch::full({ m }, 1.0 / m, torch::kFloat64);`
Create Boost class as Boost<x> classifiers parent 2024-05-15 17:49:15 +00:00			`std::vector<int> featuresSelected = featureSelection(weights_);`
			`for (const int& feature : featuresSelected) {`
Remove using namespace from Library 2023-11-08 17:45:35 +00:00			`std::unique_ptr<Classifier> model = std::make_unique<SPODE>(feature);`
Set smoothing as fit parameter 2024-06-11 09:40:45 +00:00			`model->fit(dataset, features, className, states, weights_, smoothing);`
Prepare BoostAODE first try 2023-10-13 11:46:22 +00:00			`models.push_back(std::move(model));`
block_update and install in local folder 2024-04-09 22:55:36 +00:00			`significanceModels.push_back(1.0); // They will be updated later in trainModel`
Prepare BoostAODE first try 2023-10-13 11:46:22 +00:00			`n_models++;`
Begin adding cfs to BoostAODE 2023-10-10 09:52:39 +00:00			`}`
Create Boost class as Boost<x> classifiers parent 2024-05-15 17:49:15 +00:00			`notes.push_back("Used features in initialization: " + std::to_string(featuresSelected.size()) + " of " + std::to_string(features.size()) + " with " + select_features_algorithm);`
			`return featuresSelected;`
Begin adding cfs to BoostAODE 2023-10-10 09:52:39 +00:00			`}`
Set smoothing as fit parameter 2024-06-11 09:40:45 +00:00			`void BoostAODE::trainModel(const torch::Tensor& weights, const Smoothing_t smoothing)`
Remove FeatureSel, add SelectKBest to BayesMetrics 2023-08-16 17:05:18 +00:00			`{`
Add hyperparameter convergence_best move test libraries to test folder 2024-04-29 22:52:09 +00:00			`//`
			`// Logging setup`
			`//`
Add selectKParis method 2024-05-16 09:17:21 +00:00			`// loguru::set_thread_name("BoostAODE");`
			`// loguru::g_stderr_verbosity = loguru::Verbosity_OFF;`
			`// loguru::add_file("boostAODE.log", loguru::Truncate, loguru::Verbosity_MAX);`
Add hyperparameter convergence_best move test libraries to test folder 2024-04-29 22:52:09 +00:00
Update version number and Changelog 2024-03-06 16:04:16 +00:00			`// Algorithm based on the adaboost algorithm for classification`
			`// as explained in Ensemble methods (Zhi-Hua Zhou, 2012)`
Fix epsilont early stopping in BoostAODE 2024-02-20 09:11:22 +00:00			`fitted = true;`
Update select features models significance 2024-03-05 11:10:58 +00:00			`double alpha_t = 0;`
			`torch::Tensor weights_ = torch::full({ m }, 1.0 / m, torch::kFloat64);`
First approach to bisection 2024-03-19 13:13:40 +00:00			`bool finished = false;`
Fix metrics error in BoostAODE Convergence Update algorithm 2024-03-20 22:33:02 +00:00			`std::vector<int> featuresUsed;`
Implement IWSS and FCBF too for BoostAODE 2023-10-14 11:12:04 +00:00			`if (selectFeatures) {`
Set smoothing as fit parameter 2024-06-11 09:40:45 +00:00			`featuresUsed = initializeModels(smoothing);`
Update select features models significance 2024-03-05 11:10:58 +00:00			`auto ypred = predict(X_train);`
First approach to bisection 2024-03-19 13:13:40 +00:00			`std::tie(weights_, alpha_t, finished) = update_weights(y_train, ypred, weights_);`
Update select features models significance 2024-03-05 11:10:58 +00:00			`// Update significance of the models`
			`for (int i = 0; i < n_models; ++i) {`
			`significanceModels[i] = alpha_t;`
			`}`
First approach to bisection 2024-03-19 13:13:40 +00:00			`if (finished) {`
Update select features models significance 2024-03-05 11:10:58 +00:00			`return;`
			`}`
Complete first working cfs 2023-10-11 09:33:29 +00:00			`}`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`int numItemsPack = 0; // The counter of the models inserted in the current pack`
Add Convergence hyperparameter 2023-09-07 09:27:35 +00:00			`// Variables to control the accuracy finish condition`
			`double priorAccuracy = 0.0;`
Fix metrics error in BoostAODE Convergence Update algorithm 2024-03-20 22:33:02 +00:00			`double improvement = 1.0;`
Add comments to BoostAODE algorithm 2024-02-19 21:58:15 +00:00			`double convergence_threshold = 1e-4;`
First approach to bisection 2024-03-19 13:13:40 +00:00			`int tolerance = 0; // number of times the accuracy is lower than the convergence_threshold`
Complete first BoostAODE 2023-08-18 09:50:34 +00:00			`// Step 0: Set the finish condition`
Activate best score in odte 2023-10-25 08:23:42 +00:00			`// epsilon sub t > 0.5 => inverse the weights policy`
Add Convergence hyperparameter 2023-09-07 09:27:35 +00:00			`// validation error is not decreasing`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`// run out of features`
Replace constant strings in BoostAODE 2024-03-05 10:05:11 +00:00			`bool ascending = order_algorithm == Orders.ASC;`
change boostaode ascending hyperparameter to order {asc,desc,rand} 2024-02-26 16:07:57 +00:00			`std::mt19937 g{ 173 };`
First approach to bisection 2024-03-19 13:13:40 +00:00			`while (!finished) {`
Complete first BoostAODE 2023-08-18 09:50:34 +00:00			`// Step 1: Build ranking with mutual information`
Add hyperparameters and processing order to Boost 2023-08-20 18:31:23 +00:00			`auto featureSelection = metrics.SelectKBestWeighted(weights_, ascending, n); // Get all the features sorted`
Replace constant strings in BoostAODE 2024-03-05 10:05:11 +00:00			`if (order_algorithm == Orders.RAND) {`
change boostaode ascending hyperparameter to order {asc,desc,rand} 2024-02-26 16:07:57 +00:00			`std::shuffle(featureSelection.begin(), featureSelection.end(), g);`
			`}`
Remove repeatSparent hyperparameter 2024-03-19 08:42:03 +00:00			`// Remove used features`
			`featureSelection.erase(remove_if(begin(featureSelection), end(featureSelection), [&](auto x)`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`{ return std::find(begin(featuresUsed), end(featuresUsed), x) != end(featuresUsed);}),`
Remove repeatSparent hyperparameter 2024-03-19 08:42:03 +00:00			`end(featureSelection)`
			`);`
Add hyperparameter convergence_best move test libraries to test folder 2024-04-29 22:52:09 +00:00			`int k = bisection ? pow(2, tolerance) : 1;`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`int counter = 0; // The model counter of the current pack`
Add selectKParis method 2024-05-16 09:17:21 +00:00			`// VLOG_SCOPE_F(1, "counter=%d k=%d featureSelection.size: %zu", counter, k, featureSelection.size());`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`while (counter++ < k && featureSelection.size() > 0) {`
First approach to bisection 2024-03-19 13:13:40 +00:00			`auto feature = featureSelection[0];`
			`featureSelection.erase(featureSelection.begin());`
			`std::unique_ptr<Classifier> model;`
			`model = std::make_unique<SPODE>(feature);`
Set smoothing as fit parameter 2024-06-11 09:40:45 +00:00			`model->fit(dataset, features, className, states, weights_, smoothing);`
block_update and install in local folder 2024-04-09 22:55:36 +00:00			`alpha_t = 0.0;`
			`if (!block_update) {`
			`auto ypred = model->predict(X_train);`
			`// Step 3.1: Compute the classifier amout of say`
			`std::tie(weights_, alpha_t, finished) = update_weights(y_train, ypred, weights_);`
First approach to bisection 2024-03-19 13:13:40 +00:00			`}`
			`// Step 3.4: Store classifier and its accuracy to weigh its future vote`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`numItemsPack++;`
Fix metrics error in BoostAODE Convergence Update algorithm 2024-03-20 22:33:02 +00:00			`featuresUsed.push_back(feature);`
First approach to bisection 2024-03-19 13:13:40 +00:00			`models.push_back(std::move(model));`
			`significanceModels.push_back(alpha_t);`
			`n_models++;`
Add selectKParis method 2024-05-16 09:17:21 +00:00			`// VLOG_SCOPE_F(2, "numItemsPack: %d n_models: %d featuresUsed: %zu", numItemsPack, n_models, featuresUsed.size());`
Fix epsilont early stopping in BoostAODE 2024-02-20 09:11:22 +00:00			`}`
block_update and install in local folder 2024-04-09 22:55:36 +00:00			`if (block_update) {`
			`std::tie(weights_, alpha_t, finished) = update_weights_block(k, y_train, weights_);`
			`}`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`if (convergence && !finished) {`
If ! convergence don't predict test 2023-09-10 17:50:36 +00:00			`auto y_val_predict = predict(X_test);`
			`double accuracy = (y_val_predict == y_test).sum().item<double>() / (double)y_test.size(0);`
			`if (priorAccuracy == 0) {`
			`priorAccuracy = accuracy;`
			`} else {`
Fix metrics error in BoostAODE Convergence Update algorithm 2024-03-20 22:33:02 +00:00			`improvement = accuracy - priorAccuracy;`
If ! convergence don't predict test 2023-09-10 17:50:36 +00:00			`}`
Fix metrics error in BoostAODE Convergence Update algorithm 2024-03-20 22:33:02 +00:00			`if (improvement < convergence_threshold) {`
Add selectKParis method 2024-05-16 09:17:21 +00:00			`// VLOG_SCOPE_F(3, " (improvement<threshold) tolerance: %d numItemsPack: %d improvement: %f prior: %f current: %f", tolerance, numItemsPack, improvement, priorAccuracy, accuracy);`
First approach to bisection 2024-03-19 13:13:40 +00:00			`tolerance++;`
Initialize worse_model_count if model accuracy is better in BoostAODE 2024-03-11 20:30:01 +00:00			`} else {`
Add selectKParis method 2024-05-16 09:17:21 +00:00			`// VLOG_SCOPE_F(3, "* (improvement>=threshold) Reset. tolerance: %d numItemsPack: %d improvement: %f prior: %f current: %f", tolerance, numItemsPack, improvement, priorAccuracy, accuracy);`
First approach to bisection 2024-03-19 13:13:40 +00:00			`tolerance = 0; // Reset the counter if the model performs better`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`numItemsPack = 0;`
If ! convergence don't predict test 2023-09-10 17:50:36 +00:00			`}`
Add hyperparameter convergence_best move test libraries to test folder 2024-04-29 22:52:09 +00:00			`if (convergence_best) {`
			`// Keep the best accuracy until now as the prior accuracy`
			`priorAccuracy = std::max(accuracy, priorAccuracy);`
			`} else {`
			`// Keep the last accuray obtained as the prior accuracy`
			`priorAccuracy = accuracy;`
			`}`
Add Convergence hyperparameter 2023-09-07 09:27:35 +00:00			`}`
Add selectKParis method 2024-05-16 09:17:21 +00:00			`// VLOG_SCOPE_F(1, "tolerance: %d featuresUsed.size: %zu features.size: %zu", tolerance, featuresUsed.size(), features.size());`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`finished = finished \|\| tolerance > maxTolerance \|\| featuresUsed.size() == features.size();`
Add hyperparameters and processing order to Boost 2023-08-20 18:31:23 +00:00			`}`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`if (tolerance > maxTolerance) {`
			`if (numItemsPack < n_models) {`
			`notes.push_back("Convergence threshold reached & " + std::to_string(numItemsPack) + " models eliminated");`
Add selectKParis method 2024-05-16 09:17:21 +00:00			`// VLOG_SCOPE_F(4, "Convergence threshold reached & %d models eliminated of %d", numItemsPack, n_models);`
Implement algorithm and add logging 2024-03-20 10:30:02 +00:00			`for (int i = 0; i < numItemsPack; ++i) {`
			`significanceModels.pop_back();`
			`models.pop_back();`
			`n_models--;`
			`}`
			`} else {`
			`notes.push_back("Convergence threshold reached & 0 models eliminated");`
Add selectKParis method 2024-05-16 09:17:21 +00:00			`// VLOG_SCOPE_F(4, "Convergence threshold reached & 0 models eliminated n_models=%d numItemsPack=%d", n_models, numItemsPack);`
First approach to bisection 2024-03-19 13:13:40 +00:00			`}`
Fix Initialize worse_model_count if model accuracy is better in BoostAODE 2024-03-11 21:33:50 +00:00			`}`
Add hyperparameters and processing order to Boost 2023-08-20 18:31:23 +00:00			`if (featuresUsed.size() != features.size()) {`
Add notes to Classifier & use them in BoostAODE 2024-02-08 17:01:09 +00:00			`notes.push_back("Used features in train: " + std::to_string(featuresUsed.size()) + " of " + std::to_string(features.size()));`
Add status to classifier and Experiment 2023-09-05 11:39:43 +00:00			`status = WARNING;`
Remove FeatureSel, add SelectKBest to BayesMetrics 2023-08-16 17:05:18 +00:00			`}`
Add notes to Classifier & Changelog 2024-02-12 09:58:20 +00:00			`notes.push_back("Number of models: " + std::to_string(n_models));`
Remove FeatureSel, add SelectKBest to BayesMetrics 2023-08-16 17:05:18 +00:00			`}`
Remove using namespace from Library 2023-11-08 17:45:35 +00:00			`std::vector<std::string> BoostAODE::graph(const std::string& title) const`
Add BoostAODE model based on AODE 2023-08-15 14:16:04 +00:00			`{`
			`return Ensemble::graph(title);`
			`}`
			`}`