Refactor library

Complete CPP model integration
2025-08-19 09:35:54 +00:00 · 2023-07-19 16:16:15 +02:00 · 2023-07-18 23:39:50 +02:00
30 changed files with 5816 additions and 9249 deletions
--- a/MANIFEST.in
+++ b/MANIFEST.in
@@ -1,5 +1,13 @@
 include README.md LICENSE
-include bayesclass/FeatureSelect.h
+include bayesclass/cpp/FeatureSelect.h
-include bayesclass/Node.h
+include bayesclass/cpp/Node.h
-include bayesclass/Network.h
+include bayesclass/cpp/Mst.h
-include bayesclass/Metrics.hpp
+include bayesclass/cpp/Network.h
 include bayesclass/cpp/Metrics.hpp
 include bayesclass/cpp/BaseClassifier.h
 include bayesclass/cpp/Ensemble.h
 include bayesclass/cpp/TAN.h
 include bayesclass/cpp/KDB.h
 include bayesclass/cpp/SPODE.h
 include bayesclass/cpp/AODE.h
 include bayesclass/cpp/utils.h
--- a/bayesclass/BayesNetwork.cpp
+++ b/bayesclass/BayesNetwork.cpp
--- a/bayesclass/BayesNetwork.pyx
+++ b/bayesclass/BayesNetwork.pyx
@@ -2,9 +2,10 @@
 # cython: language_level = 3
 from libcpp.vector cimport vector
 from libcpp.string cimport string
 from libcpp.map cimport map
 import numpy as np
-cdef extern from "Network.h" namespace "bayesnet":
+cdef extern from "cpp/Network.h" namespace "bayesnet":
    cdef cppclass Network:
        Network(float, float) except + 
        void fit(vector[vector[int]]&, vector[int]&, vector[string]&, string)
@@ -58,7 +59,7 @@ cdef class BayesNetwork:
    def __reduce__(self):
        return (BayesNetwork, ())
-cdef extern from "Metrics.hpp" namespace "bayesnet":
+cdef extern from "cpp/Metrics.hpp" namespace "bayesnet":
    cdef cppclass Metrics:
        Metrics(vector[vector[int]], vector[int], vector[string]&, string&, int) except +
        vector[float] conditionalEdgeWeights()
@@ -76,3 +77,101 @@ cdef class CMetrics:
    def __reduce__(self):
        return (CMetrics, ())
 cdef extern from "cpp/TAN.h" namespace "bayesnet":
    cdef cppclass CTAN:
        CTAN() except + 
        void fit(vector[vector[int]]&, vector[int]&, vector[string]&, string, map[string, vector[int]]&)
        vector[int] predict(vector[vector[int]]&)
        vector[vector[double]] predict_proba(vector[vector[int]]&)
        float score(const vector[vector[int]]&, const vector[int]&)
        vector[string] graph()
 cdef extern from "cpp/KDB.h" namespace "bayesnet":
    cdef cppclass CKDB:
        CKDB(int) except + 
        void fit(vector[vector[int]]&, vector[int]&, vector[string]&, string, map[string, vector[int]]&)
        vector[int] predict(vector[vector[int]]&)
        vector[vector[double]] predict_proba(vector[vector[int]]&)
        float score(const vector[vector[int]]&, const vector[int]&)
        vector[string] graph()
 cdef extern from "cpp/AODE.h" namespace "bayesnet":
    cdef cppclass CAODE:
        CAODE() except + 
        void fit(vector[vector[int]]&, vector[int]&, vector[string]&, string, map[string, vector[int]]&)
        vector[int] predict(vector[vector[int]]&)
        vector[vector[double]] predict_proba(vector[vector[int]]&)
        float score(const vector[vector[int]]&, const vector[int]&)
        vector[string] graph()
 cdef class TAN:
    cdef CTAN *thisptr
    def __cinit__(self):
        self.thisptr = new CTAN() 
    def __dealloc__(self):
        del self.thisptr
    def fit(self, X, y, features, className, states):
        X_ = [X[:, i] for i in range(X.shape[1])]
        features_bytes = [x.encode() for x in features]
        states_dict = {key.encode(): value for key, value in states.items()}
        states_dict[className.encode()] = np.unique(y).tolist()
        self.thisptr.fit(X_, y, features_bytes, className.encode(), states_dict)
        return self
    def predict(self, X):
        X_ = [X[:, i] for i in range(X.shape[1])]
        return self.thisptr.predict(X_)
    def score(self, X, y):
        X_ = [X[:, i] for i in range(X.shape[1])]
        return self.thisptr.score(X_, y)
    def graph(self):
        return self.thisptr.graph()
    def __reduce__(self):
        return (TAN, ())
 cdef class CKDB:
    cdef KDB *thisptr
    def __cinit__(self, k):
        self.thisptr = new KDB(k) 
    def __dealloc__(self):
        del self.thisptr
    def fit(self, X, y, features, className, states):
        X_ = [X[:, i] for i in range(X.shape[1])]
        features_bytes = [x.encode() for x in features]
        states_dict = {key.encode(): value for key, value in states.items()}
        states_dict[className.encode()] = np.unique(y).tolist()
        self.thisptr.fit(X_, y, features_bytes, className.encode(), states_dict)
        return self
    def predict(self, X):
        X_ = [X[:, i] for i in range(X.shape[1])]
        return self.thisptr.predict(X_)
    def score(self, X, y):
        X_ = [X[:, i] for i in range(X.shape[1])]
        return self.thisptr.score(X_, y)
    def graph(self):
        return self.thisptr.graph()
    def __reduce__(self):
        return (CKDB, ())
 cdef class CAODE:
    cdef AODE *thisptr
    def __cinit__(self):
        self.thisptr = new AODE() 
    def __dealloc__(self):
        del self.thisptr
    def fit(self, X, y, features, className, states):
        X_ = [X[:, i] for i in range(X.shape[1])]
        features_bytes = [x.encode() for x in features]
        states_dict = {key.encode(): value for key, value in states.items()}
        states_dict[className.encode()] = np.unique(y).tolist()
        self.thisptr.fit(X_, y, features_bytes, className.encode(), states_dict)
        return self
    def predict(self, X):
        X_ = [X[:, i] for i in range(X.shape[1])]
        return self.thisptr.predict(X_)
    def score(self, X, y):
        X_ = [X[:, i] for i in range(X.shape[1])]
        return self.thisptr.score(X_, y)
    def graph(self):
        return self.thisptr.graph()
    def __reduce__(self):
        return (CAODE, ())
--- a/bayesclass/cSelectFeatures.cpp
+++ b/bayesclass/cSelectFeatures.cpp
--- a/bayesclass/cSelectFeatures.pyx
+++ b/bayesclass/cSelectFeatures.pyx
@@ -5,7 +5,7 @@ from libcpp.string cimport string
 from libcpp cimport bool
-cdef extern from "FeatureSelect.h" namespace "features":
+cdef extern from "cpp/FeatureSelect.h" namespace "features":
    ctypedef float precision_t
    cdef cppclass SelectKBestWeighted:
        SelectKBestWeighted(vector[vector[int]]&, vector[int]&, vector[precision_t]&, int, bool) except + 
--- a/bayesclass/cpp/AODE.cc
+++ b/bayesclass/cpp/AODE.cc
@@ -0,0 +1,16 @@
 #include "AODE.h"
 namespace bayesnet {
    AODE::AODE() : Ensemble() {}
    void AODE::train()
    {
        models.clear();
        for (int i = 0; i < features.size(); ++i) {
            models.push_back(std::make_unique<SPODE>(i));
        }
    }
    vector<string> AODE::graph(string title)
    {
        return Ensemble::graph(title);
    }
 }
--- a/bayesclass/cpp/AODE.h
+++ b/bayesclass/cpp/AODE.h
@@ -0,0 +1,14 @@
 #ifndef AODE_H
 #define AODE_H
 #include "Ensemble.h"
 #include "SPODE.h"
 namespace bayesnet {
    class AODE : public Ensemble {
    protected:
        void train() override;
    public:
        AODE();
        vector<string> graph(string title = "AODE");
    };
 }
 #endif
--- a/bayesclass/cpp/BaseClassifier.cc
+++ b/bayesclass/cpp/BaseClassifier.cc
@@ -1,34 +1,34 @@
 #include "BaseClassifier.h"
 #include "utils.h"
 namespace bayesnet {
    using namespace std;
    using namespace torch;
-    BaseClassifier::BaseClassifier(Network model) : model(model), m(0), n(0) {}
+    BaseClassifier::BaseClassifier(Network model) : model(model), m(0), n(0), metrics(Metrics()), fitted(false) {}
    BaseClassifier& BaseClassifier::build(vector<string>& features, string className, map<string, vector<int>>& states)
    {
        dataset = torch::cat({ X, y.view({y.size(0), 1}) }, 1);
        this->features = features;
        this->className = className;
        this->states = states;
        checkFitParameters();
        auto n_classes = states[className].size();
        metrics = Metrics(dataset, features, className, n_classes);
        train();
        model.fit(Xv, yv, features, className);
        fitted = true;
        return *this;
    }
    BaseClassifier& BaseClassifier::fit(Tensor& X, Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states)
    {
        this->X = X;
        this->y = y;
        return build(features, className, states);
    }
    BaseClassifier& BaseClassifier::fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states)
    {
        this->X = torch::zeros({ static_cast<int64_t>(X[0].size()), static_cast<int64_t>(X.size()) }, kInt64);
        Xv = X;
        for (int i = 0; i < X.size(); ++i) {
            this->X.index_put_({ "...", i }, torch::tensor(X[i], kInt64));
        }
        this->y = torch::tensor(y, kInt64);
        yv = y;
        return build(features, className, states);
    }
    void BaseClassifier::checkFitParameters()
@@ -51,25 +51,12 @@ namespace bayesnet {
            }
        }
    }
    vector<vector<int>> tensorToVector(const torch::Tensor& tensor)
    {
        // convert mxn tensor to nxm vector
        vector<vector<int>> result;
        auto tensor_accessor = tensor.accessor<int, 2>();
        // Iterate over columns and rows of the tensor
        for (int j = 0; j < tensor.size(1); ++j) {
            vector<int> column;
            for (int i = 0; i < tensor.size(0); ++i) {
                column.push_back(tensor_accessor[i][j]);
            }
            result.push_back(column);
        }
        return result;
    }
    Tensor BaseClassifier::predict(Tensor& X)
    {
        if (!fitted) {
            throw logic_error("Classifier has not been fitted");
        }
        auto m_ = X.size(0);
        auto n_ = X.size(1);
        vector<vector<int>> Xd(n_, vector<int>(m_, 0));
@@ -81,13 +68,60 @@ namespace bayesnet {
        auto ypred = torch::tensor(yp, torch::kInt64);
        return ypred;
    }
    vector<int> BaseClassifier::predict(vector<vector<int>>& X)
    {
        if (!fitted) {
            throw logic_error("Classifier has not been fitted");
        }
        auto m_ = X[0].size();
        auto n_ = X.size();
        vector<vector<int>> Xd(n_, vector<int>(m_, 0));
        for (auto i = 0; i < n_; i++) {
            Xd[i] = vector<int>(X[i].begin(), X[i].end());
        }
        auto yp = model.predict(Xd);
        return yp;
    }
    float BaseClassifier::score(Tensor& X, Tensor& y)
    {
        if (!fitted) {
            throw logic_error("Classifier has not been fitted");
        }
        Tensor y_pred = predict(X);
        return (y_pred == y).sum().item<float>() / y.size(0);
    }
    float BaseClassifier::score(vector<vector<int>>& X, vector<int>& y)
    {
        if (!fitted) {
            throw logic_error("Classifier has not been fitted");
        }
        auto m_ = X[0].size();
        auto n_ = X.size();
        vector<vector<int>> Xd(n_, vector<int>(m_, 0));
        for (auto i = 0; i < n_; i++) {
            Xd[i] = vector<int>(X[i].begin(), X[i].end());
        }
        return model.score(Xd, y);
    }
    vector<string> BaseClassifier::show()
    {
        return model.show();
    }
    void BaseClassifier::addNodes()
    {
        // Add all nodes to the network
        for (auto feature : features) {
            model.addNode(feature, states[feature].size());
        }
        model.addNode(className, states[className].size());
    }
    int BaseClassifier::getNumberOfNodes()
    {
        // Features does not include class
        return fitted ? model.getFeatures().size() + 1 : 0;
    }
    int BaseClassifier::getNumberOfEdges()
    {
        return fitted ? model.getEdges().size() : 0;
    }
 }
--- a/bayesclass/cpp/BaseClassifier.h
+++ b/bayesclass/cpp/BaseClassifier.h
@@ -1,19 +1,25 @@
 #ifndef CLASSIFIERS_H
 #define CLASSIFIERS_H
 #include <torch/torch.h>
 #include "Network.h"
 #include "Metrics.hpp"
 using namespace std;
 using namespace torch;
 namespace bayesnet {
    class BaseClassifier {
    private:
        bool fitted;
        BaseClassifier& build(vector<string>& features, string className, map<string, vector<int>>& states);
    protected:
        Network model;
        int m, n; // m: number of samples, n: number of features
        Tensor X;
        vector<vector<int>> Xv;
        Tensor y;
        vector<int> yv;
        Tensor dataset;
        Metrics metrics;
        vector<string> features;
        string className;
        map<string, vector<int>> states;
@@ -21,14 +27,17 @@ namespace bayesnet {
        virtual void train() = 0;
    public:
        BaseClassifier(Network model);
-        Tensor& getX();
+        virtual ~BaseClassifier() = default;
        vector<string>& getFeatures();
        string& getClassName();
        BaseClassifier& fit(Tensor& X, Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states);
        BaseClassifier& fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states);
        void addNodes();
        int getNumberOfNodes();
        int getNumberOfEdges();
        Tensor predict(Tensor& X);
        vector<int> predict(vector<vector<int>>& X);
        float score(Tensor& X, Tensor& y);
        float score(vector<vector<int>>& X, vector<int>& y);
        vector<string> show();
        virtual vector<string> graph(string title) = 0;
    };
 }
 #endif
--- a/bayesclass/cpp/Ensemble.cc
+++ b/bayesclass/cpp/Ensemble.cc
@@ -0,0 +1,112 @@
 #include "Ensemble.h"
 namespace bayesnet {
    using namespace std;
    using namespace torch;
    Ensemble::Ensemble() : m(0), n(0), n_models(0), metrics(Metrics()), fitted(false) {}
    Ensemble& Ensemble::build(vector<string>& features, string className, map<string, vector<int>>& states)
    {
        dataset = cat({ X, y.view({y.size(0), 1}) }, 1);
        this->features = features;
        this->className = className;
        this->states = states;
        auto n_classes = states[className].size();
        metrics = Metrics(dataset, features, className, n_classes);
        // Build models
        train();
        // Train models
        n_models = models.size();
        for (auto i = 0; i < n_models; ++i) {
            models[i]->fit(Xv, yv, features, className, states);
        }
        fitted = true;
        return *this;
    }
    Ensemble& Ensemble::fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states)
    {
        this->X = torch::zeros({ static_cast<int64_t>(X[0].size()), static_cast<int64_t>(X.size()) }, kInt64);
        Xv = X;
        for (int i = 0; i < X.size(); ++i) {
            this->X.index_put_({ "...", i }, torch::tensor(X[i], kInt64));
        }
        this->y = torch::tensor(y, kInt64);
        yv = y;
        return build(features, className, states);
    }
    Tensor Ensemble::predict(Tensor& X)
    {
        if (!fitted) {
            throw logic_error("Ensemble has not been fitted");
        }
        Tensor y_pred = torch::zeros({ X.size(0), n_models }, kInt64);
        for (auto i = 0; i < n_models; ++i) {
            y_pred.index_put_({ "...", i }, models[i]->predict(X));
        }
        return torch::tensor(voting(y_pred));
    }
    vector<int> Ensemble::voting(Tensor& y_pred)
    {
        auto y_pred_ = y_pred.accessor<int64_t, 2>();
        vector<int> y_pred_final;
        for (int i = 0; i < y_pred.size(0); ++i) {
            vector<float> votes(states[className].size(), 0);
            for (int j = 0; j < y_pred.size(1); ++j) {
                votes[y_pred_[i][j]] += 1;
            }
            auto indices = argsort(votes);
            y_pred_final.push_back(indices[0]);
        }
        return y_pred_final;
    }
    vector<int> Ensemble::predict(vector<vector<int>>& X)
    {
        if (!fitted) {
            throw logic_error("Ensemble has not been fitted");
        }
        long m_ = X[0].size();
        long n_ = X.size();
        vector<vector<int>> Xd(n_, vector<int>(m_, 0));
        for (auto i = 0; i < n_; i++) {
            Xd[i] = vector<int>(X[i].begin(), X[i].end());
        }
        Tensor y_pred = torch::zeros({ m_, n_models }, kInt64);
        for (auto i = 0; i < n_models; ++i) {
            y_pred.index_put_({ "...", i }, torch::tensor(models[i]->predict(Xd), kInt64));
        }
        return voting(y_pred);
    }
    float Ensemble::score(vector<vector<int>>& X, vector<int>& y)
    {
        if (!fitted) {
            throw logic_error("Ensemble has not been fitted");
        }
        auto y_pred = predict(X);
        int correct = 0;
        for (int i = 0; i < y_pred.size(); ++i) {
            if (y_pred[i] == y[i]) {
                correct++;
            }
        }
        return (double)correct / y_pred.size();
    }
    vector<string> Ensemble::show()
    {
        auto result = vector<string>();
        for (auto i = 0; i < n_models; ++i) {
            auto res = models[i]->show();
            result.insert(result.end(), res.begin(), res.end());
        }
        return result;
    }
    vector<string> Ensemble::graph(string title)
    {
        auto result = vector<string>();
        for (auto i = 0; i < n_models; ++i) {
            auto res = models[i]->graph(title + "_" + to_string(i));
            result.insert(result.end(), res.begin(), res.end());
        }
        return result;
    }
 }
--- a/bayesclass/cpp/Ensemble.h
+++ b/bayesclass/cpp/Ensemble.h
@@ -0,0 +1,42 @@
 #ifndef ENSEMBLE_H
 #define ENSEMBLE_H
 #include <torch/torch.h>
 #include "BaseClassifier.h"
 #include "Metrics.hpp"
 #include "utils.h"
 using namespace std;
 using namespace torch;
 namespace bayesnet {
    class Ensemble {
    private:
        bool fitted;
        long n_models;
        Ensemble& build(vector<string>& features, string className, map<string, vector<int>>& states);
    protected:
        vector<unique_ptr<BaseClassifier>> models;
        int m, n; // m: number of samples, n: number of features
        Tensor X;
        vector<vector<int>> Xv;
        Tensor y;
        vector<int> yv;
        Tensor dataset;
        Metrics metrics;
        vector<string> features;
        string className;
        map<string, vector<int>> states;
        void virtual train() = 0;
        vector<int> voting(Tensor& y_pred);
    public:
        Ensemble();
        virtual ~Ensemble() = default;
        Ensemble& fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states);
        Tensor predict(Tensor& X);
        vector<int> predict(vector<vector<int>>& X);
        float score(Tensor& X, Tensor& y);
        float score(vector<vector<int>>& X, vector<int>& y);
        vector<string> show();
        vector<string> graph(string title);
    };
 }
 #endif
--- a/bayesclass/cpp/FeatureSelect.cpp
+++ b/bayesclass/cpp/FeatureSelect.cpp
--- a/bayesclass/cpp/FeatureSelect.h
+++ b/bayesclass/cpp/FeatureSelect.h
--- a/bayesclass/cpp/KDB.cc
+++ b/bayesclass/cpp/KDB.cc
@@ -1,17 +1,9 @@
 #include "KDB.h"
 #include "Metrics.hpp"
 namespace bayesnet {
    using namespace std;
    using namespace torch;
-    vector<int> argsort(vector<float>& nums)
+
    {
        int n = nums.size();
        vector<int> indices(n);
        iota(indices.begin(), indices.end(), 0);
        sort(indices.begin(), indices.end(), [&nums](int i, int j) {return nums[i] > nums[j];});
        return indices;
    }
    KDB::KDB(int k, float theta) : BaseClassifier(Network()), k(k), theta(theta) {}
    void KDB::train()
    {
@@ -36,31 +28,23 @@ namespace bayesnet {
        */
        // 1. For each feature Xi, compute mutual information, I(X;C),
        // where C is the class.
        cout << "Computing mutual information between features and class" << endl;
        auto n_classes = states[className].size();
        auto metrics = Metrics(dataset, features, className, n_classes);
        vector <float> mi;
        for (auto i = 0; i < features.size(); i++) {
            Tensor firstFeature = X.index({ "...", i });
            mi.push_back(metrics.mutualInformation(firstFeature, y));
            cout << "Mutual information between " << features[i] << " and " << className << " is " << mi[i] << endl;
        }
        // 2. Compute class conditional mutual information I(Xi;XjIC), f or each
        auto conditionalEdgeWeights = metrics.conditionalEdge();
        cout << "Conditional edge weights" << endl;
        cout << conditionalEdgeWeights << endl;
        // 3. Let the used variable list, S, be empty.
        vector<int> S;
        // 4. Let the DAG network being constructed, BN, begin with a single
        // class node, C.
        model.addNode(className, states[className].size());
        cout << "Adding node " << className << " to the network" << endl;
        // 5. Repeat until S includes all domain features
        // 5.1. Select feature Xmax which is not in S and has the largest value
        // I(Xmax;C).
        auto order = argsort(mi);
        for (auto idx : order) {
            cout << idx << " " << mi[idx] << endl;
            // 5.2. Add a node to BN representing Xmax.
            model.addNode(features[idx], states[features[idx]].size());
            // 5.3. Add an arc from C to Xmax in BN.
@@ -76,8 +60,6 @@ namespace bayesnet {
    {
        auto n_edges = min(k, static_cast<int>(S.size()));
        auto cond_w = clone(weights);
        cout << "Conditional edge weights cloned for idx " << idx << endl;
        cout << cond_w << endl;
        bool exit_cond = k == 0;
        int num = 0;
        while (!exit_cond) {
@@ -93,18 +75,16 @@ namespace bayesnet {
                }
            }
            cond_w.index_put_({ idx, max_minfo }, -1);
            cout << "Conditional edge weights cloned for idx " << idx << " After -1" << endl;
            cout << cond_w << endl;
            cout << "cond_w.index({ idx, '...'})" << endl;
            cout << cond_w.index({ idx, "..." }) << endl;
            auto candidates_mask = cond_w.index({ idx, "..." }).gt(theta);
            auto candidates = candidates_mask.nonzero();
            cout << "Candidates mask" << endl;
            cout << candidates_mask << endl;
            cout << "Candidates: " << endl;
            cout << candidates << endl;
            cout << "Candidates size: " << candidates.size(0) << endl;
            exit_cond = num == n_edges || candidates.size(0) == 0;
        }
    }
    vector<string> KDB::graph(string title)
    {
        if (title == "KDB") {
            title += " (k=" + to_string(k) + ", theta=" + to_string(theta) + ")";
        }
        return model.graph(title);
    }
 }
--- a/bayesclass/cpp/KDB.h
+++ b/bayesclass/cpp/KDB.h
@@ -1,6 +1,7 @@
 #ifndef KDB_H
 #define KDB_H
 #include "BaseClassifier.h"
 #include "utils.h"
 namespace bayesnet {
    using namespace std;
    using namespace torch;
@@ -13,6 +14,7 @@ namespace bayesnet {
        void train() override;
    public:
        KDB(int k, float theta = 0.03);
        vector<string> graph(string name = "KDB") override;
    };
 }
 #endif
--- a/bayesclass/cpp/Metrics.cc
+++ b/bayesclass/cpp/Metrics.cc
@@ -1,4 +1,5 @@
 #include "Metrics.hpp"
 #include "Mst.h"
 using namespace std;
 namespace bayesnet {
    Metrics::Metrics(torch::Tensor& samples, vector<string>& features, string& className, int classNumStates)
@@ -116,4 +117,15 @@ namespace bayesnet {
    {
        return entropy(firstFeature) - conditionalEntropy(firstFeature, secondFeature);
    }
    /*
    Compute the maximum spanning tree considering the weights as distances
    and the indices of the weights as nodes of this square matrix using
    Kruskal algorithm
    */
    vector<pair<int, int>> Metrics::maximumSpanningTree(vector<string> features, Tensor& weights, int root)
    {
        auto result = vector<pair<int, int>>();
        auto mst = MST(features, weights, root);
        return mst.maximumSpanningTree();
    }
 }
--- a/bayesclass/cpp/Metrics.hpp
+++ b/bayesclass/cpp/Metrics.hpp
@@ -3,23 +3,26 @@
 #include <torch/torch.h>
 #include <vector>
 #include <string>
 using namespace std;
 namespace bayesnet {
    using namespace std;
    using namespace torch;
    class Metrics {
    private:
-        torch::Tensor samples;
+        Tensor samples;
        vector<string> features;
        string className;
        int classNumStates;
        vector<pair<string, string>> doCombinations(const vector<string>&);
        double entropy(torch::Tensor&);
        double conditionalEntropy(torch::Tensor&, torch::Tensor&);
    public:
-        double mutualInformation(torch::Tensor&, torch::Tensor&);
+        Metrics() = default;
-        Metrics(torch::Tensor&, vector<string>&, string&, int);
+        Metrics(Tensor&, vector<string>&, string&, int);
        Metrics(const vector<vector<int>>&, const vector<int>&, const vector<string>&, const string&, const int);
        double entropy(Tensor&);
        double conditionalEntropy(Tensor&, Tensor&);
        double mutualInformation(Tensor&, Tensor&);
        vector<float> conditionalEdgeWeights();
-        torch::Tensor conditionalEdge();
+        Tensor conditionalEdge();
        vector<pair<string, string>> doCombinations(const vector<string>&);
        vector<pair<int, int>> maximumSpanningTree(vector<string> features, Tensor& weights, int root);
    };
 }
 #endif
--- a/bayesclass/cpp/Mst.cc
+++ b/bayesclass/cpp/Mst.cc
@@ -0,0 +1,115 @@
 #include "Mst.h"
 #include <vector>
 /*
    Based on the code from https://www.softwaretestinghelp.com/minimum-spanning-tree-tutorial/
 */
 namespace bayesnet {
    using namespace std;
    Graph::Graph(int V)
    {
        parent = vector<int>(V);
        for (int i = 0; i < V; i++)
            parent[i] = i;
        G.clear();
        T.clear();
    }
    void Graph::addEdge(int u, int v, float wt)
    {
        G.push_back({ wt, { u, v } });
    }
    int Graph::find_set(int i)
    {
        // If i is the parent of itself
        if (i == parent[i])
            return i;
        else
            //else recursively find the parent of i
            return find_set(parent[i]);
    }
    void Graph::union_set(int u, int v)
    {
        parent[u] = parent[v];
    }
    void Graph::kruskal_algorithm()
    {
        int i, uSt, vEd;
        // sort the edges ordered on decreasing weight
        sort(G.begin(), G.end(), [](auto& left, auto& right) {return left.first > right.first;});
        for (i = 0; i < G.size(); i++) {
            uSt = find_set(G[i].second.first);
            vEd = find_set(G[i].second.second);
            if (uSt != vEd) {
                T.push_back(G[i]); // add to mst vector
                union_set(uSt, vEd);
            }
        }
    }
    void Graph::display_mst()
    {
        cout << "Edge :" << " Weight" << endl;
        for (int i = 0; i < T.size(); i++) {
            cout << T[i].second.first << " - " << T[i].second.second << " : "
                << T[i].first;
            cout << endl;
        }
    }
    vector<pair<int, int>> reorder(vector<pair<float, pair<int, int>>> T, int root_original)
    {
        auto result = vector<pair<int, int>>();
        auto visited = vector<int>();
        auto nextVariables = unordered_set<int>();
        nextVariables.emplace(root_original);
        while (nextVariables.size() > 0) {
            int root = *nextVariables.begin();
            nextVariables.erase(nextVariables.begin());
            for (int i = 0; i < T.size(); ++i) {
                auto [weight, edge] = T[i];
                auto [from, to] = edge;
                if (from == root || to == root) {
                    visited.insert(visited.begin(), i);
                    if (from == root) {
                        result.push_back({ from, to });
                        nextVariables.emplace(to);
                    } else {
                        result.push_back({ to, from });
                        nextVariables.emplace(from);
                    }
                }
            }
            // Remove visited
            for (int i = 0; i < visited.size(); ++i) {
                T.erase(T.begin() + visited[i]);
            }
            visited.clear();
        }
        if (T.size() > 0) {
            for (int i = 0; i < T.size(); ++i) {
                auto [weight, edge] = T[i];
                auto [from, to] = edge;
                result.push_back({ from, to });
            }
        }
        return result;
    }
    MST::MST(vector<string>& features, Tensor& weights, int root) : features(features), weights(weights), root(root) {}
    vector<pair<int, int>> MST::maximumSpanningTree()
    {
        auto num_features = features.size();
        Graph g(num_features);
        // Make a complete graph
        for (int i = 0; i < num_features - 1; ++i) {
            for (int j = i; j < num_features; ++j) {
                g.addEdge(i, j, weights[i][j].item<float>());
            }
        }
        g.kruskal_algorithm();
        auto mst = g.get_mst();
        return reorder(mst, root);
    }
 }
--- a/bayesclass/cpp/Mst.h
+++ b/bayesclass/cpp/Mst.h
@@ -0,0 +1,35 @@
 #ifndef MST_H
 #define MST_H
 #include <torch/torch.h>
 #include <vector>
 #include <string>
 namespace bayesnet {
    using namespace std;
    using namespace torch;
    class MST {
    private:
        Tensor weights;
        vector<string> features;
        int root;
    public:
        MST() = default;
        MST(vector<string>& features, Tensor& weights, int root);
        vector<pair<int, int>> maximumSpanningTree();
    };
    class Graph {
    private:
        int V;      // number of nodes in graph
        vector <pair<float, pair<int, int>>> G; // vector for graph
        vector <pair<float, pair<int, int>>> T; // vector for mst
        vector<int> parent;
    public:
        Graph(int V);
        void addEdge(int u, int v, float wt);
        int find_set(int i);
        void union_set(int u, int v);
        void kruskal_algorithm();
        void display_mst();
        vector <pair<float, pair<int, int>>> get_mst() { return T; }
    };
 }
 #endif
--- a/bayesclass/cpp/Network.cc
+++ b/bayesclass/cpp/Network.cc
@@ -2,19 +2,13 @@
 #include <mutex>
 #include "Network.h"
 namespace bayesnet {
-    Network::Network() : laplaceSmoothing(1), features(vector<string>()), className(""), classNumStates(0), maxThreads(0.8) {}
+    Network::Network() : laplaceSmoothing(1), features(vector<string>()), className(""), classNumStates(0), maxThreads(0.8), fitted(false) {}
-    Network::Network(float maxT) : laplaceSmoothing(1), features(vector<string>()), className(""), classNumStates(0), maxThreads(maxT) {}
+    Network::Network(float maxT) : laplaceSmoothing(1), features(vector<string>()), className(""), classNumStates(0), maxThreads(maxT), fitted(false) {}
-    Network::Network(float maxT, int smoothing) : laplaceSmoothing(smoothing), features(vector<string>()), className(""), classNumStates(0), maxThreads(maxT) {}
+    Network::Network(float maxT, int smoothing) : laplaceSmoothing(smoothing), features(vector<string>()), className(""), classNumStates(0), maxThreads(maxT), fitted(false) {}
-    Network::Network(Network& other) : laplaceSmoothing(other.laplaceSmoothing), features(other.features), className(other.className), classNumStates(other.getClassNumStates()), maxThreads(other.getmaxThreads())
+    Network::Network(Network& other) : laplaceSmoothing(other.laplaceSmoothing), features(other.features), className(other.className), classNumStates(other.getClassNumStates()), maxThreads(other.getmaxThreads()), fitted(other.fitted)
    {
        for (auto& pair : other.nodes) {
-            nodes[pair.first] = new Node(*pair.second);
+            nodes[pair.first] = make_unique<Node>(*pair.second);
        }
    }
    Network::~Network()
    {
        for (auto& pair : nodes) {
            delete pair.second;
        }
    }
    float Network::getmaxThreads()
@@ -27,12 +21,15 @@ namespace bayesnet {
    }
    void Network::addNode(string name, int numStates)
    {
        if (find(features.begin(), features.end(), name) == features.end()) {
            features.push_back(name);
        }
        if (nodes.find(name) != nodes.end()) {
            // if node exists update its number of states
            nodes[name]->setNumStates(numStates);
            return;
        }
-        nodes[name] = new Node(name, numStates);
+        nodes[name] = make_unique<Node>(name, numStates);
    }
    vector<string> Network::getFeatures()
    {
@@ -45,7 +42,7 @@ namespace bayesnet {
    int Network::getStates()
    {
        int result = 0;
-        for (auto node : nodes) {
+        for (auto& node : nodes) {
            result += node.second->getNumStates();
        }
        return result;
@@ -79,20 +76,20 @@ namespace bayesnet {
            throw invalid_argument("Child node " + child + " does not exist");
        }
        // Temporarily add edge to check for cycles
-        nodes[parent]->addChild(nodes[child]);
+        nodes[parent]->addChild(nodes[child].get());
-        nodes[child]->addParent(nodes[parent]);
+        nodes[child]->addParent(nodes[parent].get());
        unordered_set<string> visited;
        unordered_set<string> recStack;
        if (isCyclic(nodes[child]->getName(), visited, recStack)) // if adding this edge forms a cycle
        {
            // remove problematic edge
-            nodes[parent]->removeChild(nodes[child]);
+            nodes[parent]->removeChild(nodes[child].get());
-            nodes[child]->removeParent(nodes[parent]);
+            nodes[child]->removeParent(nodes[parent].get());
            throw invalid_argument("Adding this edge forms a cycle in the graph.");
        }
    }
-    map<string, Node*>& Network::getNodes()
+    map<string, std::unique_ptr<Node>>& Network::getNodes()
    {
        return nodes;
    }
@@ -140,9 +137,8 @@ namespace bayesnet {
                    lock.unlock();
                    pair.second->computeCPT(dataset, laplaceSmoothing);
                    lock.lock();
-                    nodes[pair.first] = pair.second;
+                    nodes[pair.first] = std::move(pair.second);
                    lock.unlock();
                }
                lock_guard<mutex> lock(mtx);
@@ -155,10 +151,14 @@ namespace bayesnet {
        for (auto& thread : threads) {
            thread.join();
        }
        fitted = true;
    }
    vector<int> Network::predict(const vector<vector<int>>& tsamples)
    {
        if (!fitted) {
            throw logic_error("You must call fit() before calling predict()");
        }
        vector<int> predictions;
        vector<int> sample;
        for (int row = 0; row < tsamples[0].size(); ++row) {
@@ -176,6 +176,9 @@ namespace bayesnet {
    }
    vector<vector<double>> Network::predict_proba(const vector<vector<int>>& tsamples)
    {
        if (!fitted) {
            throw logic_error("You must call fit() before calling predict_proba()");
        }
        vector<vector<double>> predictions;
        vector<int> sample;
        for (int row = 0; row < tsamples[0].size(); ++row) {
@@ -215,7 +218,7 @@ namespace bayesnet {
    double Network::computeFactor(map<string, int>& completeEvidence)
    {
        double result = 1.0;
-        for (auto node : getNodes()) {
+        for (auto& node : getNodes()) {
            result *= node.second->getFactorValue(completeEvidence);
        }
        return result;
@@ -249,7 +252,7 @@ namespace bayesnet {
    {
        vector<string> result;
        // Draw the network
-        for (auto node : nodes) {
+        for (auto& node : nodes) {
            string line = node.first + " -> ";
            for (auto child : node.second->getChildren()) {
                line += child->getName() + ", ";
@@ -258,5 +261,31 @@ namespace bayesnet {
        }
        return result;
    }
    vector<string> Network::graph(string title)
    {
        auto output = vector<string>();
        auto prefix = "digraph BayesNet {\nlabel=<BayesNet ";
        auto suffix = ">\nfontsize=30\nfontcolor=blue\nlabelloc=t\nlayout=circo\n";
        string header = prefix + title + suffix;
        output.push_back(header);
        for (auto& node : nodes) {
            auto result = node.second->graph(className);
            output.insert(output.end(), result.begin(), result.end());
        }
        output.push_back("}\n");
        return output;
    }
    vector<pair<string, string>> Network::getEdges()
    {
        auto edges = vector<pair<string, string>>();
        for (const auto& node : nodes) {
            auto head = node.first;
            for (const auto& child : node.second->getChildren()) {
                auto tail = child->getName();
                edges.push_back({ head, tail });
            }
        }
        return edges;
    }
 }
--- a/bayesclass/cpp/Network.h
+++ b/bayesclass/cpp/Network.h
@@ -7,8 +7,9 @@
 namespace bayesnet {
    class Network {
    private:
-        map<string, Node*> nodes;
+        map<string, std::unique_ptr<Node>> nodes;
        map<string, vector<int>> dataset;
        bool fitted;
        float maxThreads;
        int classNumStates;
        vector<string> features;
@@ -28,14 +29,14 @@ namespace bayesnet {
        Network(float, int);
        Network(float);
        Network(Network&);
        ~Network();
        torch::Tensor& getSamples();
        float getmaxThreads();
        void addNode(string, int);
        void addEdge(const string, const string);
-        map<string, Node*>& getNodes();
+        map<string, std::unique_ptr<Node>>& getNodes();
        vector<string> getFeatures();
        int getStates();
        vector<pair<string, string>> getEdges();
        int getClassNumStates();
        string getClassName();
        void fit(const vector<vector<int>>&, const vector<int>&, const vector<string>&, const string&);
@@ -45,6 +46,7 @@ namespace bayesnet {
        vector<vector<double>> predict_proba(const vector<vector<int>>&);
        double score(const vector<vector<int>>&, const vector<int>&);
        vector<string> show();
        vector<string> graph(string title); // Returns a vector of strings representing the graph in graphviz format
        inline string version() { return "0.1.0"; }
    };
 }
--- a/bayesclass/cpp/Node.cc
+++ b/bayesclass/cpp/Node.cc
@@ -6,12 +6,10 @@ namespace bayesnet {
        : name(name), numStates(numStates), cpTable(torch::Tensor()), parents(vector<Node*>()), children(vector<Node*>())
    {
    }
    string Node::getName() const
    {
        return name;
    }
    void Node::addParent(Node* parent)
    {
        parents.push_back(parent);
@@ -111,4 +109,14 @@ namespace bayesnet {
        }
        return cpTable.index({ coordinates }).item<float>();
    }
    vector<string> Node::graph(string className)
    {
        auto output = vector<string>();
        auto suffix = name == className ? ", fontcolor=red, fillcolor=lightblue, style=filled " : "";
        output.push_back(name + " [shape=circle" + suffix + "] \n");
        for (auto& child : children) {
            output.push_back(name + " -> " + child->getName());
        }
        return output;
    }
 }
--- a/bayesclass/cpp/Node.h
+++ b/bayesclass/cpp/Node.h
@@ -29,6 +29,7 @@ namespace bayesnet {
        int getNumStates() const;
        void setNumStates(int);
        unsigned minFill();
        vector<string> graph(string clasName); // Returns a vector of strings representing the graph in graphviz format
        float getFactorValue(map<string, int>&);
    };
 }
--- a/bayesclass/cpp/SPODE.cc
+++ b/bayesclass/cpp/SPODE.cc
@@ -0,0 +1,25 @@
 #include "SPODE.h"
 namespace bayesnet {
    SPODE::SPODE(int root) : BaseClassifier(Network()), root(root) {}
    void SPODE::train()
    {
        // 0. Add all nodes to the model
        addNodes();
        // 1. Add edges from the class node to all other nodes
        // 2. Add edges from the root node to all other nodes
        for (int i = 0; i < static_cast<int>(features.size()); ++i) {
            model.addEdge(className, features[i]);
            if (i != root) {
                model.addEdge(features[root], features[i]);
            }
        }
    }
    vector<string> SPODE::graph(string name )
    {
        return model.graph(name);
    }
 }
--- a/bayesclass/cpp/SPODE.h
+++ b/bayesclass/cpp/SPODE.h
@@ -0,0 +1,15 @@
 #ifndef SPODE_H
 #define SPODE_H
 #include "BaseClassifier.h"
 namespace bayesnet {
    class SPODE : public BaseClassifier {
    private:
        int root;
    protected:
        void train() override;
    public:
        SPODE(int root);
        vector<string> graph(string name = "SPODE") override;
    };
 }
 #endif
--- a/bayesclass/cpp/TAN.cc
+++ b/bayesclass/cpp/TAN.cc
@@ -0,0 +1,42 @@
 #include "TAN.h"
 namespace bayesnet {
    using namespace std;
    using namespace torch;
    TAN::TAN() : BaseClassifier(Network()) {}
    void TAN::train()
    {
        // 0. Add all nodes to the model
        addNodes();
        // 1. Compute mutual information between each feature and the class and set the root node
        // as the highest mutual information with the class
        auto mi = vector <pair<int, float >>();
        Tensor class_dataset = dataset.index({ "...", -1 });
        for (int i = 0; i < static_cast<int>(features.size()); ++i) {
            Tensor feature_dataset = dataset.index({ "...", i });
            auto mi_value = metrics.mutualInformation(class_dataset, feature_dataset);
            mi.push_back({ i, mi_value });
        }
        sort(mi.begin(), mi.end(), [](auto& left, auto& right) {return left.second < right.second;});
        auto root = mi[mi.size() - 1].first;
        // 2. Compute mutual information between each feature and the class
        auto weights = metrics.conditionalEdge();
        // 3. Compute the maximum spanning tree
        auto mst = metrics.maximumSpanningTree(features, weights, root);
        // 4. Add edges from the maximum spanning tree to the model
        for (auto i = 0; i < mst.size(); ++i) {
            auto [from, to] = mst[i];
            model.addEdge(features[from], features[to]);
        }
        // 5. Add edges from the class to all features
        for (auto feature : features) {
            model.addEdge(className, feature);
        }
    }
    vector<string> TAN::graph(string title)
    {
        return model.graph(title);
    }
 }
--- a/bayesclass/cpp/TAN.h
+++ b/bayesclass/cpp/TAN.h
@@ -0,0 +1,16 @@
 #ifndef TAN_H
 #define TAN_H
 #include "BaseClassifier.h"
 namespace bayesnet {
    using namespace std;
    using namespace torch;
    class TAN : public BaseClassifier {
    private:
    protected:
        void train() override;
    public:
        TAN();
        vector<string> graph(string name = "TAN") override;
    };
 }
 #endif
--- a/bayesclass/cpp/utils.cc
+++ b/bayesclass/cpp/utils.cc
@@ -0,0 +1,31 @@
 #include <torch/torch.h>
 #include <vector>
 namespace bayesnet {
    using namespace std;
    using namespace torch;
    vector<int> argsort(vector<float>& nums)
    {
        int n = nums.size();
        vector<int> indices(n);
        iota(indices.begin(), indices.end(), 0);
        sort(indices.begin(), indices.end(), [&nums](int i, int j) {return nums[i] > nums[j];});
        return indices;
    }
    vector<vector<int>> tensorToVector(const Tensor& tensor)
    {
        // convert mxn tensor to nxm vector
        vector<vector<int>> result;
        auto tensor_accessor = tensor.accessor<int, 2>();
        // Iterate over columns and rows of the tensor
        for (int j = 0; j < tensor.size(1); ++j) {
            vector<int> column;
            for (int i = 0; i < tensor.size(0); ++i) {
                column.push_back(tensor_accessor[i][j]);
            }
            result.push_back(column);
        }
        return result;
    }
 }
--- a/bayesclass/cpp/utils.h
+++ b/bayesclass/cpp/utils.h
@@ -0,0 +1,8 @@
 namespace bayesnet {
    using namespace std;
    using namespace torch;
    vector<int> argsort(vector<float>& nums);
    vector<vector<int>> tensorToVector(const Tensor& tensor);
 }
--- a/setup.py
+++ b/setup.py
@@ -18,7 +18,7 @@ setup(
            name="bayesclass.cppSelectFeatures",
            sources=[
                "bayesclass/cSelectFeatures.pyx",
-                "bayesclass/FeatureSelect.cpp",
+                "bayesclass/cpp/FeatureSelect.cpp",
            ],
            language="c++",
            include_dirs=["bayesclass"],
@@ -30,9 +30,17 @@ setup(
            name="bayesclass.BayesNet",
            sources=[
                "bayesclass/BayesNetwork.pyx",
-                "bayesclass/Network.cc",
+                "bayesclass/cpp/Network.cc",
-                "bayesclass/Node.cc",
+                "bayesclass/cpp/Node.cc",
-                "bayesclass/Metrics.cc",
+                "bayesclass/cpp/Metrics.cc",
                "bayesclass/cpp/utils.cc",
                "bayesclass/cpp/Mst.cc",
                "bayesclass/cpp/BaseClassifier.cc",
                "bayesclass/cpp/Ensemble.cc",
                "bayesclass/cpp/TAN.cc",
                "bayesclass/cpp/KDB.cc",
                "bayesclass/cpp/SPODE.cc",
                "bayesclass/cpp/AODE.cc",
            ],
            include_dirs=include_paths(),
        ),
Author	SHA1	Message	Date
Ricardo Montañana	7f5ea1ab1e	Refactor library	2023-07-19 16:16:15 +02:00
Ricardo Montañana	168cc368ee	Complete CPP model integration	2023-07-18 23:39:50 +02:00