Merge branch 'main' into TANNew

Complete AODELd
Rename suffix of proposal classifier to Ld
2023-08-06 11:40:10 +02:00 · 2023-08-06 11:31:44 +02:00 · 2023-08-05 23:23:31 +02:00 · 2023-08-05 23:11:36 +02:00 · 2023-08-05 20:29:05 +02:00 · 2023-08-05 18:39:48 +02:00
78 changed files with 2553 additions and 1158 deletions
--- a/.clang-tidy
+++ b/.clang-tidy
@@ -0,0 +1,17 @@
+---
+Checks: '-*,
+         clang-*,
+         bugprone-*,
+         cppcoreguidelines-*,
+         modernize-*,
+         performance-*,
+         -cppcoreguidelines-pro-type-vararg,
+         -modernize-use-trailing-return-type,
+         -bugprone-exception-escape'
+
+HeaderFilterRegex: 'src/*'
+AnalyzeTemporaryDtors: false
+WarningsAsErrors: ''
+FormatStyle: file
+FormatStyleOptions: ''
+...
--- a/.gitmodules
+++ b/.gitmodules
@@ -0,0 +1,12 @@
+[submodule "lib/mdlp"]
+	path = lib/mdlp
+	url = https://github.com/rmontanana/mdlp
+[submodule "lib/catch2"]
+	path = lib/catch2
+	url = https://github.com/catchorg/Catch2.git
+[submodule "lib/argparse"]
+	path = lib/argparse
+	url = https://github.com/p-ranav/argparse
+[submodule "lib/json"]
+	path = lib/json
+	url = https://github.com/nlohmann/json.git
--- a/.vscode/launch.json
+++ b/.vscode/launch.json
@@ -4,22 +4,35 @@
        {
            "type": "lldb",
            "request": "launch",
-            "name": "bayesnet",
-            "program": "${workspaceFolder}/build/sample/main",
+            "name": "sample",
+            "program": "${workspaceFolder}/build/sample/BayesNetSample",
            "args": [
-                "-f",
-                "iris"
+                "-d",
+                "iris",
+                "-m",
+                "KDB",
+                "-s",
+                "271",
+                "-p",
+                "/Users/rmontanana/Code/discretizbench/datasets/",
            ],
-            "cwd": "${workspaceFolder}",
-            "preLaunchTask": "CMake: build"
+            //"cwd": "${workspaceFolder}/build/sample/",
        },
        {
            "type": "lldb",
            "request": "launch",
-            "name": "aout",
-            "program": "${workspaceFolder}/a.out",
-            "args": [],
-            "cwd": "${workspaceFolder}"
+            "name": "experiment",
+            "program": "${workspaceFolder}/build/src/Platform/main",
+            "args": [
+                "-m",
+                "AODELd",
+                "-p",
+                "/Users/rmontanana/Code/discretizbench/datasets",
+                "--stratified",
+                "-d",
+                "iris"
+            ],
+            "cwd": "/Users/rmontanana/Code/discretizbench",
        },
        {
            "name": "Build & debug active file",
--- a/.vscode/settings.json
+++ b/.vscode/settings.json
@@ -97,7 +97,12 @@
        "future": "cpp",
        "queue": "cpp",
        "typeindex": "cpp",
-        "shared_mutex": "cpp"
+        "shared_mutex": "cpp",
+        "*.ipp": "cpp",
+        "cassert": "cpp",
+        "charconv": "cpp",
+        "source_location": "cpp",
+        "ranges": "cpp"
    },
    "cmake.configureOnOpen": false,
    "C_Cpp.default.configurationProvider": "ms-vscode.cmake-tools"
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -7,10 +7,14 @@ project(BayesNet
  LANGUAGES CXX
 )

+if (CODE_COVERAGE AND NOT ENABLE_TESTING)
+  MESSAGE(FATAL_ERROR "Code coverage requires testing enabled")
+endif (CODE_COVERAGE AND NOT ENABLE_TESTING)
+
 find_package(Torch REQUIRED)

 if (POLICY CMP0135)
-    cmake_policy(SET CMP0135 NEW)
+  cmake_policy(SET CMP0135 NEW)
 endif ()

 # Global CMake variables
@@ -24,21 +28,40 @@ set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${TORCH_CXX_FLAGS}")
 # Options
 # -------
 option(ENABLE_CLANG_TIDY "Enable to add clang tidy."              OFF)
-option(ENABLE_TESTING "Unit testing build"                        ON)
-option(CODE_COVERAGE "Collect coverage from test library"         ON)
-
-set(CMAKE_BUILD_TYPE "Debug")
+option(ENABLE_TESTING "Unit testing build"                        OFF)
+option(CODE_COVERAGE "Collect coverage from test library"         OFF)

 # CMakes modules
 # --------------
 set(CMAKE_MODULE_PATH ${CMAKE_CURRENT_SOURCE_DIR}/cmake/modules ${CMAKE_MODULE_PATH})

+include(AddGitSubmodule)
+if (CODE_COVERAGE)
+    enable_testing()
+    include(CodeCoverage)
+    MESSAGE("Code coverage enabled")
+    set(CMAKE_C_FLAGS " ${CMAKE_C_FLAGS} -fprofile-arcs -ftest-coverage")
+    set(CMAKE_CXX_FLAGS " ${CMAKE_CXX_FLAGS} -fprofile-arcs -ftest-coverage")
+    SET(GCC_COVERAGE_LINK_FLAGS " ${GCC_COVERAGE_LINK_FLAGS} -lgcov --coverage")
+endif (CODE_COVERAGE)
+
+if (ENABLE_CLANG_TIDY)
+  include(StaticAnalyzers) # clang-tidy
+endif (ENABLE_CLANG_TIDY)
+
+# External libraries - dependencies of BayesNet
+# ---------------------------------------------
+# include(FetchContent)
+add_git_submodule("lib/mdlp")
+add_git_submodule("lib/argparse")
+add_git_submodule("lib/json")

 # Subdirectories
 # --------------
 add_subdirectory(config)
-add_subdirectory(${BayesNet_SOURCE_DIR}/src/BayesNet)
-add_subdirectory(${BayesNet_SOURCE_DIR}/src/Platform)
+add_subdirectory(lib/Files)
+add_subdirectory(src/BayesNet)
+add_subdirectory(src/Platform)
 add_subdirectory(sample)

 file(GLOB BayesNet_HEADERS CONFIGURE_DEPENDS ${BayesNet_SOURCE_DIR}/src/BayesNet/*.h ${BayesNet_SOURCE_DIR}/BayesNet/*.hpp)
@@ -47,18 +70,11 @@ file(GLOB Platform_SOURCES CONFIGURE_DEPENDS ${BayesNet_SOURCE_DIR}/src/Platform

 # Testing
 # -------
+
 if (ENABLE_TESTING)
  MESSAGE("Testing enabled")
-  enable_testing()
-  if (CODE_COVERAGE)
-    include(CodeCoverage)
-    MESSAGE("Code coverage enabled")
-    set(CMAKE_C_FLAGS " ${CMAKE_C_FLAGS} -fprofile-arcs -ftest-coverage")
-    set(CMAKE_CXX_FLAGS " ${CMAKE_CXX_FLAGS} -fprofile-arcs -ftest-coverage")
-    SET(GCC_COVERAGE_LINK_FLAGS " ${GCC_COVERAGE_LINK_FLAGS} -lgcov --coverage")
-  endif (CODE_COVERAGE)
-  find_package(Catch2 3 REQUIRED)
+  add_git_submodule("lib/catch2")
+  
  include(CTest)
-  include(Catch)
  add_subdirectory(tests)
-endif (ENABLE_TESTING)
+endif (ENABLE_TESTING)
--- a/26
+++ b/26
@@ -14,16 +14,30 @@ setup: ## Install dependencies for tests and coverage
 dependency: ## Create a dependency graph diagram of the project (build/dependency.png)
 	cd build && cmake .. --graphviz=dependency.dot && dot -Tpng dependency.dot -o dependency.png

-build: ## Build the project
-	@echo ">>> Building BayesNet ...";
+build: ## Build the main and BayesNetSample
+	cmake --build build -t main -t BayesNetSample -j 32
+
+clean: ## Clean the debug info
+	@echo ">>> Cleaning Debug BayesNet ...";
+	find . -name "*.gcda" -print0 | xargs -0 rm
+	@echo ">>> Done";
+
+debug: ## Build a debug version of the project
+	@echo ">>> Building Debug BayesNet ...";
 	@if [ -d ./build ]; then rm -rf ./build; fi
 	@mkdir build; 
-	cmake -S . -B build; \
-	cd build; \
-	make; \
-	
+	cmake -S . -B build -D CMAKE_BUILD_TYPE=Debug -D ENABLE_TESTING=ON -D CODE_COVERAGE=ON; \
+	cmake --build build -j 32;
 	@echo ">>> Done";

+release: ## Build a Release version of the project
+	@echo ">>> Building Release BayesNet ...";
+	@if [ -d ./build ]; then rm -rf ./build; fi
+	@mkdir build; 
+	cmake -S . -B build -D CMAKE_BUILD_TYPE=Release; \
+	cmake --build build -t main -t BayesNetSample -j 32;
+	@echo ">>> Done";	
+
 test: ## Run tests
 	@echo "* Running tests...";
 	find . -name "*.gcda" -print0 | xargs -0 rm
--- a/TAN_iris.dot
+++ b/TAN_iris.dot
@@ -0,0 +1,12 @@
+digraph BayesNet {
+label=<BayesNet >
+fontsize=30
+fontcolor=blue
+labelloc=t
+layout=circo
+ class [shape=circle, fontcolor=red, fillcolor=lightblue, style=filled ] 
+ class -> sepallength class -> sepalwidth class -> petallength class -> petalwidth petallength [shape=circle] 
+ petallength -> sepallength petalwidth [shape=circle] 
+ sepallength [shape=circle] 
+ sepallength -> sepalwidth sepalwidth [shape=circle] 
+ sepalwidth -> petalwidth }
--- a/cmake/modules/AddGitSubmodule.cmake
+++ b/cmake/modules/AddGitSubmodule.cmake
@@ -0,0 +1,12 @@
+
+function(add_git_submodule dir)
+  find_package(Git REQUIRED) 
+
+  if(NOT EXISTS ${dir}/CMakeLists.txt)
+    message(STATUS "🚨 Adding git submodule => ${dir}")
+    execute_process(COMMAND ${GIT_EXECUTABLE}
+      submodule update --init --recursive -- ${dir}
+      WORKING_DIRECTORY ${PROJECT_SOURCE_DIR}) 
+  endif()
+  add_subdirectory(${dir})
+endfunction(add_git_submodule)
--- a/cmake/modules/StaticAnalyzers.cmake
+++ b/cmake/modules/StaticAnalyzers.cmake
@@ -0,0 +1,22 @@
+if(ENABLE_CLANG_TIDY)
+    find_program(CLANG_TIDY_COMMAND NAMES clang-tidy)
+
+    if(NOT CLANG_TIDY_COMMAND)
+        message(WARNING "🔴 CMake_RUN_CLANG_TIDY is ON but clang-tidy is not found!")
+        set(CMAKE_CXX_CLANG_TIDY "" CACHE STRING "" FORCE)
+    else()
+    
+        message(STATUS "🟢 CMake_RUN_CLANG_TIDY is ON")
+        set(CLANGTIDY_EXTRA_ARGS
+            "-extra-arg=-Wno-unknown-warning-option"
+        )
+        set(CMAKE_CXX_CLANG_TIDY "${CLANG_TIDY_COMMAND};-p=${CMAKE_BINARY_DIR};${CLANGTIDY_EXTRA_ARGS}" CACHE STRING "" FORCE)
+
+        add_custom_target(clang-tidy
+            COMMAND ${CMAKE_COMMAND} --build ${CMAKE_BINARY_DIR} --target ${CMAKE_PROJECT_NAME}
+            COMMAND ${CMAKE_COMMAND} --build ${CMAKE_BINARY_DIR} --target clang-tidy
+            COMMENT "Running clang-tidy..."
+        )
+       set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
+    endif()
+endif(ENABLE_CLANG_TIDY)
--- a/data/_TAN_cpp_accuracy__.json
+++ b/data/_TAN_cpp_accuracy__.json
@@ -0,0 +1 @@
+null
--- a/gcovr.cfg
+++ b/gcovr.cfg
@@ -1,5 +1,4 @@
 filter = src/
-exclude = external/
-exclude = tests/
+exclude-directories = build/lib/
 print-summary = yes
 sort-percentage = yes
--- a/src/Platform/ArffFiles.cc
+++ b/src/Platform/ArffFiles.cc
@@ -2,6 +2,7 @@
 #include <fstream>
 #include <sstream>
 #include <map>
+#include <iostream>

 using namespace std;

@@ -42,7 +43,7 @@ vector<int>& ArffFiles::getY()
    return y;
 }

-void ArffFiles::load(const string& fileName, bool classLast)
+void ArffFiles::loadCommon(string fileName)
 {
    ifstream file(fileName);
    if (!file.is_open()) {
@@ -74,24 +75,51 @@ void ArffFiles::load(const string& fileName, bool classLast)
    file.close();
    if (attributes.empty())
        throw invalid_argument("No attributes found");
+}
+
+void ArffFiles::load(const string& fileName, bool classLast)
+{
+    int labelIndex;
+    loadCommon(fileName);
    if (classLast) {
        className = get<0>(attributes.back());
        classType = get<1>(attributes.back());
        attributes.pop_back();
+        labelIndex = static_cast<int>(attributes.size());
    } else {
        className = get<0>(attributes.front());
        classType = get<1>(attributes.front());
        attributes.erase(attributes.begin());
+        labelIndex = 0;
    }
-    generateDataset(classLast);
-
+    generateDataset(labelIndex);
+}
+void ArffFiles::load(const string& fileName, const string& name)
+{
+    int labelIndex;
+    loadCommon(fileName);
+    bool found = false;
+    for (int i = 0; i < attributes.size(); ++i) {
+        if (attributes[i].first == name) {
+            className = get<0>(attributes[i]);
+            classType = get<1>(attributes[i]);
+            attributes.erase(attributes.begin() + i);
+            labelIndex = i;
+            found = true;
+            break;
+        }
+    }
+    if (!found) {
+        throw invalid_argument("Class name not found");
+    }
+    generateDataset(labelIndex);
 }

-void ArffFiles::generateDataset(bool classLast)
+void ArffFiles::generateDataset(int labelIndex)
 {
    X = vector<vector<float>>(attributes.size(), vector<float>(lines.size()));
    auto yy = vector<string>(lines.size(), "");
-    int labelIndex = classLast ? static_cast<int>(attributes.size()) : 0;
+    auto removeLines = vector<int>(); // Lines with missing values
    for (size_t i = 0; i < lines.size(); i++) {
        stringstream ss(lines[i]);
        string value;
@@ -101,10 +129,20 @@ void ArffFiles::generateDataset(bool classLast)
            if (pos++ == labelIndex) {
                yy[i] = value;
            } else {
-                X[xIndex++][i] = stof(value);
+                if (value == "?") {
+                    X[xIndex++][i] = -1;
+                    removeLines.push_back(i);
+                } else
+                    X[xIndex++][i] = stof(value);
            }
        }
    }
+    for (auto i : removeLines) {
+        yy.erase(yy.begin() + i);
+        for (auto& x : X) {
+            x.erase(x.begin() + i);
+        }
+    }
    y = factorize(yy);
 }

--- a/src/Platform/ArffFiles.h
+++ b/src/Platform/ArffFiles.h
@@ -14,12 +14,12 @@ private:
    string classType;
    vector<vector<float>> X;
    vector<int> y;
-
-    void generateDataset(bool);
-
+    void generateDataset(int);
+    void loadCommon(string);
 public:
    ArffFiles();
    void load(const string&, bool = true);
+    void load(const string&, const string&);
    vector<string> getLines() const;
    unsigned long int getSize() const;
    string getClassName() const;
--- a/lib/Files/CMakeLists.txt
+++ b/lib/Files/CMakeLists.txt
@@ -0,0 +1,2 @@
+add_library(ArffFiles ArffFiles.cc)
+#target_link_libraries(BayesNet "${TORCH_LIBRARIES}")
--- a/lib/argparse
+++ b/lib/argparse
--- a/lib/catch2
+++ b/lib/catch2
--- a/lib/json
+++ b/lib/json
--- a/lib/mdlp
+++ b/lib/mdlp
--- a/sample/CMakeLists.txt
+++ b/sample/CMakeLists.txt
@@ -1,4 +1,7 @@
 include_directories(${BayesNet_SOURCE_DIR}/src/Platform)
 include_directories(${BayesNet_SOURCE_DIR}/src/BayesNet)
-add_executable(sample sample.cc ${BayesNet_SOURCE_DIR}/src/Platform/ArffFiles.cc ${BayesNet_SOURCE_DIR}/src/Platform/CPPFImdlp.cpp ${BayesNet_SOURCE_DIR}/src/Platform/Metrics.cpp ${BayesNet_SOURCE_DIR}/src/Platform/typesFImdlp.h ${BayesNet_HEADERS})
-target_link_libraries(sample BayesNet "${TORCH_LIBRARIES}")
+include_directories(${BayesNet_SOURCE_DIR}/lib/Files)
+include_directories(${BayesNet_SOURCE_DIR}/lib/mdlp)
+include_directories(${BayesNet_SOURCE_DIR}/lib/argparse/include)
+add_executable(BayesNetSample sample.cc ${BayesNet_SOURCE_DIR}/src/Platform/Folding.cc ${BayesNet_SOURCE_DIR}/src/Platform/Models.cc) 
+target_link_libraries(BayesNetSample BayesNet ArffFiles mdlp "${TORCH_LIBRARIES}")
--- a/sample/sample.cc
+++ b/sample/sample.cc
@@ -1,96 +1,19 @@
 #include <iostream>
-#include <string>
 #include <torch/torch.h>
-#include <thread>
-#include <getopt.h>
+#include <string>
+#include <map>
+#include <argparse/argparse.hpp>
 #include "ArffFiles.h"
-#include "Network.h"
-#include "Metrics.hpp"
+#include "BayesMetrics.h"
 #include "CPPFImdlp.h"
-#include "KDB.h"
-#include "SPODE.h"
-#include "AODE.h"
-#include "TAN.h"
+#include "Folding.h"
+#include "Models.h"
+#include "modelRegister.h"


 using namespace std;

-const string PATH = "data/";
-
-/* print a description of all supported options */
-void usage(const char* path)
-{
-    /* take only the last portion of the path */
-    const char* basename = strrchr(path, '/');
-    basename = basename ? basename + 1 : path;
-
-    cout << "usage: " << basename << "[OPTION]" << endl;
-    cout << "  -h, --help\t\t Print this help and exit." << endl;
-    cout
-        << "  -f, --file[=FILENAME]\t {diabetes, glass, iris, kdd_JapaneseVowels, letter, liver-disorders, mfeat-factors}."
-        << endl;
-    cout << "  -p, --path[=FILENAME]\t folder where the data files are located, default " << PATH << endl;
-    cout << "  -m, --model={AODE, KDB, SPODE, TAN}\t " << endl;
-}
-
-tuple<string, string, string> parse_arguments(int argc, char** argv)
-{
-    string file_name;
-    string model_name;
-    string path = PATH;
-    const vector<struct option> long_options = {
-            {"help",          no_argument,       nullptr, 'h'},
-            {"file",          required_argument, nullptr, 'f'},
-            {"path",          required_argument, nullptr, 'p'},
-            {"model",         required_argument, nullptr, 'm'},
-            {nullptr,         no_argument,       nullptr, 0}
-    };
-    while (true) {
-        const auto c = getopt_long(argc, argv, "hf:p:m:", long_options.data(), nullptr);
-        if (c == -1)
-            break;
-        switch (c) {
-            case 'h':
-                usage(argv[0]);
-                exit(0);
-            case 'f':
-                file_name = string(optarg);
-                break;
-            case 'm':
-                model_name = string(optarg);
-                break;
-            case 'p':
-                path = optarg;
-                if (path.back() != '/')
-                    path += '/';
-                break;
-            case '?':
-                usage(argv[0]);
-                exit(1);
-            default:
-                abort();
-        }
-    }
-    if (file_name.empty()) {
-        usage(argv[0]);
-        exit(1);
-    }
-    return make_tuple(file_name, path, model_name);
-}
-
-inline constexpr auto hash_conv(const std::string_view sv)
-{
-    unsigned long hash{ 5381 };
-    for (unsigned char c : sv) {
-        hash = ((hash << 5) + hash) ^ c;
-    }
-    return hash;
-}
-
-inline constexpr auto operator"" _sh(const char* str, size_t len)
-{
-    return hash_conv(std::string_view{ str, len });
-}
+const string PATH = "../../data/";

 pair<vector<mdlp::labels_t>, map<string, int>> discretize(vector<mdlp::samples_t>& X, mdlp::labels_t& y, vector<string> features)
 {
@@ -116,8 +39,23 @@ bool file_exists(const std::string& name)
        return false;
    }
 }
+pair<vector<vector<int>>, vector<int>> extract_indices(vector<int> indices, vector<vector<int>> X, vector<int> y)
+{
+    vector<vector<int>> Xr; // nxm
+    vector<int> yr;
+    for (int col = 0; col < X.size(); ++col) {
+        Xr.push_back(vector<int>());
+    }
+    for (auto index : indices) {
+        for (int col = 0; col < X.size(); ++col) {
+            Xr[col].push_back(X[col][index]);
+        }
+        yr.push_back(y[index]);
+    }
+    return { Xr, yr };
+}

-tuple<string, string, string> get_options(int argc, char** argv)
+int main(int argc, char** argv)
 {
    map<string, bool> datasets = {
            {"diabetes",           true},
@@ -129,97 +67,170 @@ tuple<string, string, string> get_options(int argc, char** argv)
            {"liver-disorders",    true},
            {"mfeat-factors",      true},
    };
-    vector <string> models = { "AODE", "KDB", "SPODE", "TAN" };
-    string file_name;
-    string path;
-    string model_name;
-    tie(file_name, path, model_name) = parse_arguments(argc, argv);
-    if (datasets.find(file_name) == datasets.end()) {
-        cout << "Invalid file name: " << file_name << endl;
-        usage(argv[0]);
+    auto valid_datasets = vector<string>();
+    transform(datasets.begin(), datasets.end(), back_inserter(valid_datasets),
+        [](const pair<string, bool>& pair) { return pair.first; });
+    argparse::ArgumentParser program("BayesNetSample");
+    program.add_argument("-d", "--dataset")
+        .help("Dataset file name")
+        .action([valid_datasets](const std::string& value) {
+        if (find(valid_datasets.begin(), valid_datasets.end(), value) != valid_datasets.end()) {
+            return value;
+        }
+        throw runtime_error("file must be one of {diabetes, ecoli, glass, iris, kdd_JapaneseVowels, letter, liver-disorders, mfeat-factors}");
+            }
+    );
+    program.add_argument("-p", "--path")
+        .help(" folder where the data files are located, default")
+        .default_value(string{ PATH }
+    );
+    program.add_argument("-m", "--model")
+        .help("Model to use " + platform::Models::instance()->toString())
+        .action([](const std::string& value) {
+        static const vector<string> choices = platform::Models::instance()->getNames();
+        if (find(choices.begin(), choices.end(), value) != choices.end()) {
+            return value;
+        }
+        throw runtime_error("Model must be one of " + platform::Models::instance()->toString());
+            }
+    );
+    program.add_argument("--discretize").help("Discretize input dataset").default_value(false).implicit_value(true);
+    program.add_argument("--dumpcpt").help("Dump CPT Tables").default_value(false).implicit_value(true);
+    program.add_argument("--stratified").help("If Stratified KFold is to be done").default_value(false).implicit_value(true);
+    program.add_argument("--tensors").help("Use tensors to store samples").default_value(false).implicit_value(true);
+    program.add_argument("-f", "--folds").help("Number of folds").default_value(5).scan<'i', int>().action([](const string& value) {
+        try {
+            auto k = stoi(value);
+            if (k < 2) {
+                throw runtime_error("Number of folds must be greater than 1");
+            }
+            return k;
+        }
+        catch (const runtime_error& err) {
+            throw runtime_error(err.what());
+        }
+        catch (...) {
+            throw runtime_error("Number of folds must be an integer");
+        }});
+    program.add_argument("-s", "--seed").help("Random seed").default_value(-1).scan<'i', int>();
+    bool class_last, stratified, tensors, dump_cpt;
+    string model_name, file_name, path, complete_file_name;
+    int nFolds, seed;
+    try {
+        program.parse_args(argc, argv);
+        file_name = program.get<string>("dataset");
+        path = program.get<string>("path");
+        model_name = program.get<string>("model");
+        complete_file_name = path + file_name + ".arff";
+        stratified = program.get<bool>("stratified");
+        tensors = program.get<bool>("tensors");
+        nFolds = program.get<int>("folds");
+        seed = program.get<int>("seed");
+        dump_cpt = program.get<bool>("dumpcpt");
+        class_last = datasets[file_name];
+        if (!file_exists(complete_file_name)) {
+            throw runtime_error("Data File " + path + file_name + ".arff" + " does not exist");
+        }
+    }
+    catch (const exception& err) {
+        cerr << err.what() << endl;
+        cerr << program;
        exit(1);
    }
-    if (!file_exists(path + file_name + ".arff")) {
-        cout << "Data File " << path + file_name + ".arff" << " does not exist" << endl;
-        usage(argv[0]);
-        exit(1);
-    }
-    if (find(models.begin(), models.end(), model_name) == models.end()) {
-        cout << "Invalid model name: " << model_name << endl;
-        usage(argv[0]);
-        exit(1);
-    }
-    return { file_name, path, model_name };
-}

-int main(int argc, char** argv)
-{
-    string file_name, path, model_name;
-    tie(file_name, path, model_name) = get_options(argc, argv);
+    /*
+    * Begin Processing
+    */
    auto handler = ArffFiles();
-    handler.load(path + file_name + ".arff");
+    handler.load(complete_file_name, class_last);
    // Get Dataset X, y
    vector<mdlp::samples_t>& X = handler.getX();
    mdlp::labels_t& y = handler.getY();
    // Get className & Features
    auto className = handler.getClassName();
    vector<string> features;
-    for (auto feature : handler.getAttributes()) {
-        features.push_back(feature.first);
-    }
+    auto attributes = handler.getAttributes();
+    transform(attributes.begin(), attributes.end(), back_inserter(features),
+        [](const pair<string, string>& item) { return item.first; });
    // Discretize Dataset
-    vector<mdlp::labels_t> Xd;
-    map<string, int> maxes;
-    tie(Xd, maxes) = discretize(X, y, features);
+    auto [Xd, maxes] = discretize(X, y, features);
    maxes[className] = *max_element(y.begin(), y.end()) + 1;
    map<string, vector<int>> states;
    for (auto feature : features) {
        states[feature] = vector<int>(maxes[feature]);
    }
-    states[className] = vector<int>(
-        maxes[className]);
-    double score;
-    vector<string> lines;
-    vector<string> graph;
-    auto kdb = bayesnet::KDB(2);
-    auto aode = bayesnet::AODE();
-    auto spode = bayesnet::SPODE(2);
-    auto tan = bayesnet::TAN();
-    switch (hash_conv(model_name)) {
-        case "AODE"_sh:
-            aode.fit(Xd, y, features, className, states);
-            lines = aode.show();
-            score = aode.score(Xd, y);
-            graph = aode.graph();
-            break;
-        case "KDB"_sh:
-            kdb.fit(Xd, y, features, className, states);
-            lines = kdb.show();
-            score = kdb.score(Xd, y);
-            graph = kdb.graph();
-            break;
-        case "SPODE"_sh:
-            spode.fit(Xd, y, features, className, states);
-            lines = spode.show();
-            score = spode.score(Xd, y);
-            graph = spode.graph();
-            break;
-        case "TAN"_sh:
-            tan.fit(Xd, y, features, className, states);
-            lines = tan.show();
-            score = tan.score(Xd, y);
-            graph = tan.graph();
-            break;
+    states[className] = vector<int>(maxes[className]);
+    auto clf = platform::Models::instance()->create(model_name);
+    clf->fit(Xd, y, features, className, states);
+    if (dump_cpt) {
+        cout << "--- CPT Tables ---" << endl;
+        clf->dump_cpt();
    }
+    auto lines = clf->show();
    for (auto line : lines) {
        cout << line << endl;
    }
+    cout << "--- Topological Order ---" << endl;
+    auto order = clf->topological_order();
+    for (auto name : order) {
+        cout << name << ", ";
+    }
+    cout << "end." << endl;
+    auto score = clf->score(Xd, y);
    cout << "Score: " << score << endl;
-    auto dot_file = model_name + "_" + file_name;
-    ofstream file(dot_file + ".dot");
-    file << graph;
-    file.close();
-    cout << "Graph saved in " << model_name << "_" << file_name << ".dot" << endl;
-    cout << "dot -Tpng -o " + dot_file + ".png " + dot_file + ".dot " << endl;
-    return 0;
+    // auto graph = clf->graph();
+    // auto dot_file = model_name + "_" + file_name;
+    // ofstream file(dot_file + ".dot");
+    // file << graph;
+    // file.close();
+    // cout << "Graph saved in " << model_name << "_" << file_name << ".dot" << endl;
+    // cout << "dot -Tpng -o " + dot_file + ".png " + dot_file + ".dot " << endl;
+    // string stratified_string = stratified ? " Stratified" : "";
+    // cout << nFolds << " Folds" << stratified_string << " Cross validation" << endl;
+    // cout << "==========================================" << endl;
+    // torch::Tensor Xt = torch::zeros({ static_cast<int>(Xd.size()), static_cast<int>(Xd[0].size()) }, torch::kInt32);
+    // torch::Tensor yt = torch::tensor(y, torch::kInt32);
+    // for (int i = 0; i < features.size(); ++i) {
+    //     Xt.index_put_({ i, "..." }, torch::tensor(Xd[i], torch::kInt32));
+    // }
+    // float total_score = 0, total_score_train = 0, score_train, score_test;
+    // Fold* fold;
+    // if (stratified)
+    //     fold = new StratifiedKFold(nFolds, y, seed);
+    // else
+    //     fold = new KFold(nFolds, y.size(), seed);
+    // for (auto i = 0; i < nFolds; ++i) {
+    //     auto [train, test] = fold->getFold(i);
+    //     cout << "Fold: " << i + 1 << endl;
+    //     if (tensors) {
+    //         auto ttrain = torch::tensor(train, torch::kInt64);
+    //         auto ttest = torch::tensor(test, torch::kInt64);
+    //         torch::Tensor Xtraint = torch::index_select(Xt, 1, ttrain);
+    //         torch::Tensor ytraint = yt.index({ ttrain });
+    //         torch::Tensor Xtestt = torch::index_select(Xt, 1, ttest);
+    //         torch::Tensor ytestt = yt.index({ ttest });
+    //         clf->fit(Xtraint, ytraint, features, className, states);
+    //         auto temp = clf->predict(Xtraint);
+    //         score_train = clf->score(Xtraint, ytraint);
+    //         score_test = clf->score(Xtestt, ytestt);
+    //     } else {
+    //         auto [Xtrain, ytrain] = extract_indices(train, Xd, y);
+    //         auto [Xtest, ytest] = extract_indices(test, Xd, y);
+    //         clf->fit(Xtrain, ytrain, features, className, states);
+    //         score_train = clf->score(Xtrain, ytrain);
+    //         score_test = clf->score(Xtest, ytest);
+    //     }
+    //     if (dump_cpt) {
+    //         cout << "--- CPT Tables ---" << endl;
+    //         clf->dump_cpt();
+    //     }
+    //     total_score_train += score_train;
+    //     total_score += score_test;
+    //     cout << "Score Train: " << score_train << endl;
+    //     cout << "Score Test : " << score_test << endl;
+    //     cout << "-------------------------------------------------------------------------------" << endl;
+    // }
+    // cout << "**********************************************************************************" << endl;
+    // cout << "Average Score Train: " << total_score_train / nFolds << endl;
+    // cout << "Average Score Test : " << total_score / nFolds << endl;return 0;
 }
--- a/src/BayesNet/AODE.cc
+++ b/src/BayesNet/AODE.cc
@@ -9,7 +9,7 @@ namespace bayesnet {
            models.push_back(std::make_unique<SPODE>(i));
        }
    }
-    vector<string> AODE::graph(string title)
+    vector<string> AODE::graph(const string& title)
    {
        return Ensemble::graph(title);
    }
--- a/src/BayesNet/AODE.h
+++ b/src/BayesNet/AODE.h
@@ -8,7 +8,8 @@ namespace bayesnet {
        void train() override;
    public:
        AODE();
-        vector<string> graph(string title = "AODE");
+        virtual ~AODE() {};
+        vector<string> graph(const string& title = "AODE") override;
    };
 }
 #endif
--- a/src/BayesNet/AODELd.cc
+++ b/src/BayesNet/AODELd.cc
@@ -0,0 +1,34 @@
+#include "AODELd.h"
+
+namespace bayesnet {
+    using namespace std;
+    AODELd::AODELd() : Ensemble(), Proposal(Ensemble::Xv, Ensemble::yv, features, className) {}
+    AODELd& AODELd::fit(torch::Tensor& X_, torch::Tensor& y_, vector<string>& features_, string className_, map<string, vector<int>>& states_)
+    {
+        features = features_;
+        className = className_;
+        states = states_;
+        train();
+        for (const auto& model : models) {
+            model->fit(X_, y_, features_, className_, states_);
+        }
+        n_models = models.size();
+        fitted = true;
+        return *this;
+    }
+    void AODELd::train()
+    {
+        models.clear();
+        for (int i = 0; i < features.size(); ++i) {
+            models.push_back(std::make_unique<SPODELd>(i));
+        }
+    }
+    Tensor AODELd::predict(Tensor& X)
+    {
+        return Ensemble::predict(X);
+    }
+    vector<string> AODELd::graph(const string& name)
+    {
+        return Ensemble::graph(name);
+    }
+}
--- a/src/BayesNet/AODELd.h
+++ b/src/BayesNet/AODELd.h
@@ -0,0 +1,20 @@
+#ifndef AODELD_H
+#define AODELD_H
+#include "Ensemble.h"
+#include "Proposal.h"
+#include "SPODELd.h"
+
+namespace bayesnet {
+    using namespace std;
+    class AODELd : public Ensemble, public Proposal {
+    public:
+        AODELd();
+        virtual ~AODELd() = default;
+        AODELd& fit(torch::Tensor& X, torch::Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states) override;
+        vector<string> graph(const string& name = "AODE") override;
+        Tensor predict(Tensor& X) override;
+        void train() override;
+        static inline string version() { return "0.0.1"; };
+    };
+}
+#endif // !AODELD_H
--- a/src/BayesNet/BaseClassifier.cc
+++ b/src/BayesNet/BaseClassifier.cc
@@ -1,127 +0,0 @@
-#include "BaseClassifier.h"
-#include "bayesnetUtils.h"
-
-namespace bayesnet {
-    using namespace std;
-    using namespace torch;
-
-    BaseClassifier::BaseClassifier(Network model) : model(model), m(0), n(0), metrics(Metrics()), fitted(false) {}
-    BaseClassifier& BaseClassifier::build(vector<string>& features, string className, map<string, vector<int>>& states)
-    {
-        dataset = torch::cat({ X, y.view({y.size(0), 1}) }, 1);
-        this->features = features;
-        this->className = className;
-        this->states = states;
-        checkFitParameters();
-        auto n_classes = states[className].size();
-        metrics = Metrics(dataset, features, className, n_classes);
-        train();
-        model.fit(Xv, yv, features, className);
-        fitted = true;
-        return *this;
-    }
-    BaseClassifier& BaseClassifier::fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states)
-    {
-        this->X = torch::zeros({ static_cast<int64_t>(X[0].size()), static_cast<int64_t>(X.size()) }, kInt64);
-        Xv = X;
-        for (int i = 0; i < X.size(); ++i) {
-            this->X.index_put_({ "...", i }, torch::tensor(X[i], kInt64));
-        }
-        this->y = torch::tensor(y, kInt64);
-        yv = y;
-        return build(features, className, states);
-    }
-    void BaseClassifier::checkFitParameters()
-    {
-        auto sizes = X.sizes();
-        m = sizes[0];
-        n = sizes[1];
-        if (m != y.size(0)) {
-            throw invalid_argument("X and y must have the same number of samples");
-        }
-        if (n != features.size()) {
-            throw invalid_argument("X and features must have the same number of features");
-        }
-        if (states.find(className) == states.end()) {
-            throw invalid_argument("className not found in states");
-        }
-        for (auto feature : features) {
-            if (states.find(feature) == states.end()) {
-                throw invalid_argument("feature [" + feature + "] not found in states");
-            }
-        }
-    }
-
-    Tensor BaseClassifier::predict(Tensor& X)
-    {
-        if (!fitted) {
-            throw logic_error("Classifier has not been fitted");
-        }
-        auto m_ = X.size(0);
-        auto n_ = X.size(1);
-        vector<vector<int>> Xd(n_, vector<int>(m_, 0));
-        for (auto i = 0; i < n_; i++) {
-            auto temp = X.index({ "...", i });
-            Xd[i] = vector<int>(temp.data_ptr<int>(), temp.data_ptr<int>() + m_);
-        }
-        auto yp = model.predict(Xd);
-        auto ypred = torch::tensor(yp, torch::kInt64);
-        return ypred;
-    }
-    vector<int> BaseClassifier::predict(vector<vector<int>>& X)
-    {
-        if (!fitted) {
-            throw logic_error("Classifier has not been fitted");
-        }
-        auto m_ = X[0].size();
-        auto n_ = X.size();
-        vector<vector<int>> Xd(n_, vector<int>(m_, 0));
-        for (auto i = 0; i < n_; i++) {
-            Xd[i] = vector<int>(X[i].begin(), X[i].end());
-        }
-        auto yp = model.predict(Xd);
-        return yp;
-    }
-    float BaseClassifier::score(Tensor& X, Tensor& y)
-    {
-        if (!fitted) {
-            throw logic_error("Classifier has not been fitted");
-        }
-        Tensor y_pred = predict(X);
-        return (y_pred == y).sum().item<float>() / y.size(0);
-    }
-    float BaseClassifier::score(vector<vector<int>>& X, vector<int>& y)
-    {
-        if (!fitted) {
-            throw logic_error("Classifier has not been fitted");
-        }
-        auto m_ = X[0].size();
-        auto n_ = X.size();
-        vector<vector<int>> Xd(n_, vector<int>(m_, 0));
-        for (auto i = 0; i < n_; i++) {
-            Xd[i] = vector<int>(X[i].begin(), X[i].end());
-        }
-        return model.score(Xd, y);
-    }
-    vector<string> BaseClassifier::show()
-    {
-        return model.show();
-    }
-    void BaseClassifier::addNodes()
-    {
-        // Add all nodes to the network
-        for (auto feature : features) {
-            model.addNode(feature, states[feature].size());
-        }
-        model.addNode(className, states[className].size());
-    }
-    int BaseClassifier::getNumberOfNodes()
-    {
-        // Features does not include class
-        return fitted ? model.getFeatures().size() + 1 : 0;
-    }
-    int BaseClassifier::getNumberOfEdges()
-    {
-        return fitted ? model.getEdges().size() : 0;
-    }
-}
--- a/src/BayesNet/BaseClassifier.h
+++ b/src/BayesNet/BaseClassifier.h
@@ -1,48 +1,28 @@
-#ifndef CLASSIFIERS_H
-#define CLASSIFIERS_H
+#ifndef BASE_H
+#define BASE_H
 #include <torch/torch.h>
-#include "Network.h"
-#include "Metrics.hpp"
-using namespace std;
-using namespace torch;
-
+#include <vector>
 namespace bayesnet {
+    using namespace std;
    class BaseClassifier {
-    private:
-        bool fitted;
-        BaseClassifier& build(vector<string>& features, string className, map<string, vector<int>>& states);
-    protected:
-        Network model;
-        int m, n; // m: number of samples, n: number of features
-        Tensor X;
-        vector<vector<int>> Xv;
-        Tensor y;
-        vector<int> yv;
-        Tensor dataset;
-        Metrics metrics;
-        vector<string> features;
-        string className;
-        map<string, vector<int>> states;
-        void checkFitParameters();
-        virtual void train() = 0;
    public:
-        BaseClassifier(Network model);
+        // X is nxm vector, y is nx1 vector
+        virtual BaseClassifier& fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states) = 0;
+        // X is nxm tensor, y is nx1 tensor
+        virtual BaseClassifier& fit(torch::Tensor& X, torch::Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states) = 0;
        virtual ~BaseClassifier() = default;
-        BaseClassifier& fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states);
-        void addNodes();
-        int getNumberOfNodes();
-        int getNumberOfEdges();
-        Tensor predict(Tensor& X);
-        vector<int> predict(vector<vector<int>>& X);
-        float score(Tensor& X, Tensor& y);
-        float score(vector<vector<int>>& X, vector<int>& y);
-        vector<string> show();
-        virtual vector<string> graph(string title) = 0;
+        torch::Tensor virtual predict(torch::Tensor& X) = 0;
+        vector<int> virtual predict(vector<vector<int>>& X) = 0;
+        float virtual score(vector<vector<int>>& X, vector<int>& y) = 0;
+        float virtual score(torch::Tensor& X, torch::Tensor& y) = 0;
+        int virtual getNumberOfNodes() = 0;
+        int virtual getNumberOfEdges() = 0;
+        int virtual getNumberOfStates() = 0;
+        vector<string> virtual show() = 0;
+        vector<string> virtual graph(const string& title = "") = 0;
+        const string inline getVersion() const { return "0.1.0"; };
+        vector<string> virtual topological_order() = 0;
+        void virtual dump_cpt() = 0;
    };
 }
-#endif
-
-
-
-
-
+#endif
--- a/src/BayesNet/BayesMetrics.cc
+++ b/src/BayesNet/BayesMetrics.cc
@@ -1,7 +1,7 @@
-#include "Metrics.hpp"
+#include "BayesMetrics.h"
 #include "Mst.h"
-using namespace std;
 namespace bayesnet {
+    //samples is nxm tensor used to fit the model
    Metrics::Metrics(torch::Tensor& samples, vector<string>& features, string& className, int classNumStates)
        : samples(samples)
        , features(features)
@@ -9,16 +9,17 @@ namespace bayesnet {
        , classNumStates(classNumStates)
    {
    }
+    //samples is nxm vector used to fit the model
    Metrics::Metrics(const vector<vector<int>>& vsamples, const vector<int>& labels, const vector<string>& features, const string& className, const int classNumStates)
        : features(features)
        , className(className)
        , classNumStates(classNumStates)
+        , samples(torch::zeros({ static_cast<int>(vsamples[0].size()), static_cast<int>(vsamples.size() + 1) }, torch::kInt32))
    {
-        samples = torch::zeros({ static_cast<int64_t>(vsamples[0].size()), static_cast<int64_t>(vsamples.size() + 1) }, torch::kInt64);
        for (int i = 0; i < vsamples.size(); ++i) {
-            samples.index_put_({ "...", i }, torch::tensor(vsamples[i], torch::kInt64));
+            samples.index_put_({ i,  "..." }, torch::tensor(vsamples[i], torch::kInt32));
        }
-        samples.index_put_({ "...", -1 }, torch::tensor(labels, torch::kInt64));
+        samples.index_put_({ -1, "..." }, torch::tensor(labels, torch::kInt32));
    }
    vector<pair<string, string>> Metrics::doCombinations(const vector<string>& source)
    {
@@ -40,17 +41,17 @@ namespace bayesnet {
        // Compute class prior
        auto margin = torch::zeros({ classNumStates });
        for (int value = 0; value < classNumStates; ++value) {
-            auto mask = samples.index({ "...", -1 }) == value;
-            margin[value] = mask.sum().item<float>() / samples.sizes()[0];
+            auto mask = samples.index({ -1,  "..." }) == value;
+            margin[value] = mask.sum().item<float>() / samples.size(1);
        }
        for (auto [first, second] : combinations) {
-            int64_t index_first = find(features.begin(), features.end(), first) - features.begin();
-            int64_t index_second = find(features.begin(), features.end(), second) - features.begin();
+            int index_first = find(features.begin(), features.end(), first) - features.begin();
+            int index_second = find(features.begin(), features.end(), second) - features.begin();
            double accumulated = 0;
            for (int value = 0; value < classNumStates; ++value) {
-                auto mask = samples.index({ "...", -1 }) == value;
-                auto first_dataset = samples.index({ mask, index_first });
-                auto second_dataset = samples.index({ mask, index_second });
+                auto mask = samples.index({ -1, "..." }) == value;
+                auto first_dataset = samples.index({ index_first, mask });
+                auto second_dataset = samples.index({ index_second, mask });
                auto mi = mutualInformation(first_dataset, second_dataset);
                auto pb = margin[value].item<float>();
                accumulated += pb * mi;
@@ -68,6 +69,7 @@ namespace bayesnet {
        }
        return matrix;
    }
+    // To use in Python
    vector<float> Metrics::conditionalEdgeWeights()
    {
        auto matrix = conditionalEdge();
@@ -95,7 +97,7 @@ namespace bayesnet {
            totalWeight += 1;
        }
        if (totalWeight == 0)
-            throw invalid_argument("Total weight should not be zero");
+            return 0;
        double entropyValue = 0;
        for (int value = 0; value < featureCounts.sizes()[0]; ++value) {
            double p_f = featureCounts[value].item<double>() / totalWeight;
@@ -124,7 +126,6 @@ namespace bayesnet {
    */
    vector<pair<int, int>> Metrics::maximumSpanningTree(vector<string> features, Tensor& weights, int root)
    {
-        auto result = vector<pair<int, int>>();
        auto mst = MST(features, weights, root);
        return mst.maximumSpanningTree();
    }
--- a/src/BayesNet/BayesMetrics.h
+++ b/src/BayesNet/BayesMetrics.h
@@ -8,10 +8,10 @@ namespace bayesnet {
    using namespace torch;
    class Metrics {
    private:
-        Tensor samples;
+        Tensor samples; // nxm tensor used to fit the model
        vector<string> features;
        string className;
-        int classNumStates;
+        int classNumStates = 0;
    public:
        Metrics() = default;
        Metrics(Tensor&, vector<string>&, string&, int);
@@ -19,7 +19,7 @@ namespace bayesnet {
        double entropy(Tensor&);
        double conditionalEntropy(Tensor&, Tensor&);
        double mutualInformation(Tensor&, Tensor&);
-        vector<float> conditionalEdgeWeights();
+        vector<float> conditionalEdgeWeights(); // To use in Python
        Tensor conditionalEdge();
        vector<pair<string, string>> doCombinations(const vector<string>&);
        vector<pair<int, int>> maximumSpanningTree(vector<string> features, Tensor& weights, int root);
--- a/src/BayesNet/CMakeLists.txt
+++ b/src/BayesNet/CMakeLists.txt
@@ -1,2 +1,5 @@
-add_library(BayesNet bayesnetUtils.cc Network.cc Node.cc Metrics.cc BaseClassifier.cc KDB.cc TAN.cc SPODE.cc Ensemble.cc AODE.cc Mst.cc)
-target_link_libraries(BayesNet "${TORCH_LIBRARIES}")
+include_directories(${BayesNet_SOURCE_DIR}/lib/mdlp)
+include_directories(${BayesNet_SOURCE_DIR}/lib/Files)
+add_library(BayesNet bayesnetUtils.cc Network.cc Node.cc BayesMetrics.cc Classifier.cc 
+    KDB.cc TAN.cc SPODE.cc Ensemble.cc AODE.cc TANLd.cc KDBLd.cc SPODELd.cc AODELd.cc Mst.cc Proposal.cc)
+target_link_libraries(BayesNet mdlp ArffFiles "${TORCH_LIBRARIES}")
--- a/src/BayesNet/Classifier.cc
+++ b/src/BayesNet/Classifier.cc
@@ -0,0 +1,145 @@
+#include "Classifier.h"
+#include "bayesnetUtils.h"
+
+namespace bayesnet {
+    using namespace torch;
+
+    Classifier::Classifier(Network model) : model(model), m(0), n(0), metrics(Metrics()), fitted(false) {}
+    Classifier& Classifier::build(vector<string>& features, string className, map<string, vector<int>>& states)
+    {
+        Tensor ytmp = torch::transpose(y.view({ y.size(0), 1 }), 0, 1);
+        samples = torch::cat({ X, ytmp }, 0);
+        this->features = features;
+        this->className = className;
+        this->states = states;
+        checkFitParameters();
+        auto n_classes = states[className].size();
+        metrics = Metrics(samples, features, className, n_classes);
+        model.initialize();
+        train();
+        if (Xv.empty()) {
+            // fit with tensors
+            model.fit(X, y, features, className);
+        } else {
+            // fit with vectors
+            model.fit(Xv, yv, features, className);
+        }
+        fitted = true;
+        return *this;
+    }
+    // X is nxm where n is the number of features and m the number of samples
+    Classifier& Classifier::fit(torch::Tensor& X, torch::Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states)
+    {
+        this->X = X;
+        this->y = y;
+        Xv = vector<vector<int>>();
+        yv = vector<int>(y.data_ptr<int>(), y.data_ptr<int>() + y.size(0));
+        return build(features, className, states);
+    }
+    void Classifier::generateTensorXFromVector()
+    {
+        X = torch::zeros({ static_cast<int>(Xv.size()), static_cast<int>(Xv[0].size()) }, kInt32);
+        for (int i = 0; i < Xv.size(); ++i) {
+            X.index_put_({ i, "..." }, torch::tensor(Xv[i], kInt32));
+        }
+    }
+    // X is nxm where n is the number of features and m the number of samples
+    Classifier& Classifier::fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states)
+    {
+        Xv = X;
+        generateTensorXFromVector();
+        this->y = torch::tensor(y, kInt32);
+        yv = y;
+        return build(features, className, states);
+    }
+    void Classifier::checkFitParameters()
+    {
+        auto sizes = X.sizes();
+        m = sizes[1];
+        n = sizes[0];
+        if (m != y.size(0)) {
+            throw invalid_argument("X and y must have the same number of samples");
+        }
+        if (n != features.size()) {
+            throw invalid_argument("X and features must have the same number of features");
+        }
+        if (states.find(className) == states.end()) {
+            throw invalid_argument("className not found in states");
+        }
+        for (auto feature : features) {
+            if (states.find(feature) == states.end()) {
+                throw invalid_argument("feature [" + feature + "] not found in states");
+            }
+        }
+    }
+    Tensor Classifier::predict(Tensor& X)
+    {
+        if (!fitted) {
+            throw logic_error("Classifier has not been fitted");
+        }
+        return model.predict(X);
+    }
+    vector<int> Classifier::predict(vector<vector<int>>& X)
+    {
+        if (!fitted) {
+            throw logic_error("Classifier has not been fitted");
+        }
+        auto m_ = X[0].size();
+        auto n_ = X.size();
+        vector<vector<int>> Xd(n_, vector<int>(m_, 0));
+        for (auto i = 0; i < n_; i++) {
+            Xd[i] = vector<int>(X[i].begin(), X[i].end());
+        }
+        auto yp = model.predict(Xd);
+        return yp;
+    }
+    float Classifier::score(Tensor& X, Tensor& y)
+    {
+        if (!fitted) {
+            throw logic_error("Classifier has not been fitted");
+        }
+        Tensor y_pred = predict(X);
+        return (y_pred == y).sum().item<float>() / y.size(0);
+    }
+    float Classifier::score(vector<vector<int>>& X, vector<int>& y)
+    {
+        if (!fitted) {
+            throw logic_error("Classifier has not been fitted");
+        }
+        return model.score(X, y);
+    }
+    vector<string> Classifier::show()
+    {
+        return model.show();
+    }
+    void Classifier::addNodes()
+    {
+        // Add all nodes to the network
+        for (const auto& feature : features) {
+            model.addNode(feature);
+        }
+        model.addNode(className);
+    }
+    int Classifier::getNumberOfNodes()
+    {
+        // Features does not include class
+        return fitted ? model.getFeatures().size() + 1 : 0;
+    }
+    int Classifier::getNumberOfEdges()
+    {
+        return fitted ? model.getEdges().size() : 0;
+    }
+    int Classifier::getNumberOfStates()
+    {
+        return fitted ? model.getStates() : 0;
+    }
+    vector<string> Classifier::topological_order()
+    {
+        return model.topological_sort();
+    }
+    void Classifier::dump_cpt()
+    {
+        model.dump_cpt();
+    }
+
+}
--- a/src/BayesNet/Classifier.h
+++ b/src/BayesNet/Classifier.h
@@ -0,0 +1,53 @@
+#ifndef CLASSIFIER_H
+#define CLASSIFIER_H
+#include <torch/torch.h>
+#include "BaseClassifier.h"
+#include "Network.h"
+#include "BayesMetrics.h"
+using namespace std;
+using namespace torch;
+
+namespace bayesnet {
+    class Classifier : public BaseClassifier {
+    private:
+        bool fitted;
+        Classifier& build(vector<string>& features, string className, map<string, vector<int>>& states);
+    protected:
+        Network model;
+        int m, n; // m: number of samples, n: number of features
+        Tensor X; // nxm tensor
+        vector<vector<int>> Xv; // nxm vector
+        Tensor y;
+        vector<int> yv;
+        Tensor samples; // (n+1)xm tensor
+        Metrics metrics;
+        vector<string> features;
+        string className;
+        map<string, vector<int>> states;
+        void checkFitParameters();
+        void generateTensorXFromVector();
+        virtual void train() = 0;
+    public:
+        Classifier(Network model);
+        virtual ~Classifier() = default;
+        Classifier& fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states) override;
+        Classifier& fit(torch::Tensor& X, torch::Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states) override;
+        void addNodes();
+        int getNumberOfNodes() override;
+        int getNumberOfEdges() override;
+        int getNumberOfStates() override;
+        Tensor predict(Tensor& X) override;
+        vector<int> predict(vector<vector<int>>& X) override;
+        float score(Tensor& X, Tensor& y) override;
+        float score(vector<vector<int>>& X, vector<int>& y) override;
+        vector<string> show() override;
+        vector<string> topological_order() override;
+        void dump_cpt() override;
+    };
+}
+#endif
+
+
+
+
+
--- a/src/BayesNet/Ensemble.cc
+++ b/src/BayesNet/Ensemble.cc
@@ -1,64 +1,93 @@
 #include "Ensemble.h"

 namespace bayesnet {
-    using namespace std;
    using namespace torch;

-    Ensemble::Ensemble() : m(0), n(0), n_models(0), metrics(Metrics()), fitted(false) {}
+    Ensemble::Ensemble() : n_models(0), metrics(Metrics()), fitted(false) {}
    Ensemble& Ensemble::build(vector<string>& features, string className, map<string, vector<int>>& states)
    {
-        dataset = cat({ X, y.view({y.size(0), 1}) }, 1);
+        Tensor ytmp = torch::transpose(y.view({ y.size(0), 1 }), 0, 1);
+        samples = torch::cat({ X, ytmp }, 0);
        this->features = features;
        this->className = className;
        this->states = states;
        auto n_classes = states[className].size();
-        metrics = Metrics(dataset, features, className, n_classes);
+        metrics = Metrics(samples, features, className, n_classes);
        // Build models
        train();
        // Train models
        n_models = models.size();
        for (auto i = 0; i < n_models; ++i) {
-            models[i]->fit(Xv, yv, features, className, states);
+            if (Xv.empty()) {
+                // fit with tensors
+                models[i]->fit(X, y, features, className, states);
+            } else {
+                // fit with vectors
+                models[i]->fit(Xv, yv, features, className, states);
+            }
        }
        fitted = true;
        return *this;
    }
+    void Ensemble::generateTensorXFromVector()
+    {
+        X = torch::zeros({ static_cast<int>(Xv.size()), static_cast<int>(Xv[0].size()) }, kInt32);
+        for (int i = 0; i < Xv.size(); ++i) {
+            X.index_put_({ i, "..." }, torch::tensor(Xv[i], kInt32));
+        }
+    }
+    Ensemble& Ensemble::fit(torch::Tensor& X, torch::Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states)
+    {
+        this->X = X;
+        this->y = y;
+        Xv = vector<vector<int>>();
+        yv = vector<int>(y.data_ptr<int>(), y.data_ptr<int>() + y.size(0));
+        return build(features, className, states);
+    }
    Ensemble& Ensemble::fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states)
    {
-        this->X = torch::zeros({ static_cast<int64_t>(X[0].size()), static_cast<int64_t>(X.size()) }, kInt64);
        Xv = X;
-        for (int i = 0; i < X.size(); ++i) {
-            this->X.index_put_({ "...", i }, torch::tensor(X[i], kInt64));
-        }
-        this->y = torch::tensor(y, kInt64);
+        generateTensorXFromVector();
+        this->y = torch::tensor(y, kInt32);
        yv = y;
        return build(features, className, states);
    }
+    vector<int> Ensemble::voting(Tensor& y_pred)
+    {
+        auto y_pred_ = y_pred.accessor<int, 2>();
+        vector<int> y_pred_final;
+        for (int i = 0; i < y_pred.size(0); ++i) {
+            vector<float> votes(y_pred.size(1), 0);
+            for (int j = 0; j < y_pred.size(1); ++j) {
+                votes[y_pred_[i][j]] += 1;
+            }
+            // argsort in descending order
+            auto indices = argsort(votes);
+            y_pred_final.push_back(indices[0]);
+        }
+        return y_pred_final;
+    }
    Tensor Ensemble::predict(Tensor& X)
    {
        if (!fitted) {
            throw logic_error("Ensemble has not been fitted");
        }
-        Tensor y_pred = torch::zeros({ X.size(0), n_models }, kInt64);
+        Tensor y_pred = torch::zeros({ X.size(1), n_models }, kInt32);
+        //Create a threadpool
+        auto threads{ vector<thread>() };
+        mutex mtx;
        for (auto i = 0; i < n_models; ++i) {
-            y_pred.index_put_({ "...", i }, models[i]->predict(X));
+            threads.push_back(thread([&, i]() {
+                auto ypredict = models[i]->predict(X);
+                lock_guard<mutex> lock(mtx);
+                y_pred.index_put_({ "...", i }, ypredict);
+                }));
+        }
+        for (auto& thread : threads) {
+            thread.join();
        }
        return torch::tensor(voting(y_pred));
    }
-    vector<int> Ensemble::voting(Tensor& y_pred)
-    {
-        auto y_pred_ = y_pred.accessor<int64_t, 2>();
-        vector<int> y_pred_final;
-        for (int i = 0; i < y_pred.size(0); ++i) {
-            vector<float> votes(states[className].size(), 0);
-            for (int j = 0; j < y_pred.size(1); ++j) {
-                votes[y_pred_[i][j]] += 1;
-            }
-            auto indices = argsort(votes);
-            y_pred_final.push_back(indices[0]);
-        }
-        return y_pred_final;
-    }
    vector<int> Ensemble::predict(vector<vector<int>>& X)
    {
        if (!fitted) {
@@ -70,12 +99,26 @@ namespace bayesnet {
        for (auto i = 0; i < n_; i++) {
            Xd[i] = vector<int>(X[i].begin(), X[i].end());
        }
-        Tensor y_pred = torch::zeros({ m_, n_models }, kInt64);
+        Tensor y_pred = torch::zeros({ m_, n_models }, kInt32);
        for (auto i = 0; i < n_models; ++i) {
-            y_pred.index_put_({ "...", i }, torch::tensor(models[i]->predict(Xd), kInt64));
+            y_pred.index_put_({ "...", i }, torch::tensor(models[i]->predict(Xd), kInt32));
        }
        return voting(y_pred);
    }
+    float Ensemble::score(Tensor& X, Tensor& y)
+    {
+        if (!fitted) {
+            throw logic_error("Ensemble has not been fitted");
+        }
+        auto y_pred = predict(X);
+        int correct = 0;
+        for (int i = 0; i < y_pred.size(0); ++i) {
+            if (y_pred[i].item<int>() == y[i].item<int>()) {
+                correct++;
+            }
+        }
+        return (double)correct / y_pred.size(0);
+    }
    float Ensemble::score(vector<vector<int>>& X, vector<int>& y)
    {
        if (!fitted) {
@@ -100,7 +143,7 @@ namespace bayesnet {
        }
        return result;
    }
-    vector<string> Ensemble::graph(string title)
+    vector<string> Ensemble::graph(const string& title)
    {
        auto result = vector<string>();
        for (auto i = 0; i < n_models; ++i) {
@@ -109,4 +152,28 @@ namespace bayesnet {
        }
        return result;
    }
+    int Ensemble::getNumberOfNodes()
+    {
+        int nodes = 0;
+        for (auto i = 0; i < n_models; ++i) {
+            nodes += models[i]->getNumberOfNodes();
+        }
+        return nodes;
+    }
+    int Ensemble::getNumberOfEdges()
+    {
+        int edges = 0;
+        for (auto i = 0; i < n_models; ++i) {
+            edges += models[i]->getNumberOfEdges();
+        }
+        return edges;
+    }
+    int Ensemble::getNumberOfStates()
+    {
+        int nstates = 0;
+        for (auto i = 0; i < n_models; ++i) {
+            nstates += models[i]->getNumberOfStates();
+        }
+        return nstates;
+    }
 }
--- a/src/BayesNet/Ensemble.h
+++ b/src/BayesNet/Ensemble.h
@@ -1,42 +1,53 @@
 #ifndef ENSEMBLE_H
 #define ENSEMBLE_H
 #include <torch/torch.h>
-#include "BaseClassifier.h"
-#include "Metrics.hpp"
+#include "Classifier.h"
+#include "BayesMetrics.h"
 #include "bayesnetUtils.h"
 using namespace std;
 using namespace torch;

 namespace bayesnet {
-    class Ensemble {
+    class Ensemble : public BaseClassifier {
    private:
-        bool fitted;
-        long n_models;
        Ensemble& build(vector<string>& features, string className, map<string, vector<int>>& states);
    protected:
-        vector<unique_ptr<BaseClassifier>> models;
-        int m, n; // m: number of samples, n: number of features
+        unsigned n_models;
+        bool fitted;
+        vector<unique_ptr<Classifier>> models;
        Tensor X;
        vector<vector<int>> Xv;
        Tensor y;
        vector<int> yv;
-        Tensor dataset;
+        Tensor samples;
        Metrics metrics;
        vector<string> features;
        string className;
        map<string, vector<int>> states;
        void virtual train() = 0;
        vector<int> voting(Tensor& y_pred);
+        void generateTensorXFromVector();
    public:
        Ensemble();
        virtual ~Ensemble() = default;
-        Ensemble& fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states);
-        Tensor predict(Tensor& X);
-        vector<int> predict(vector<vector<int>>& X);
-        float score(Tensor& X, Tensor& y);
-        float score(vector<vector<int>>& X, vector<int>& y);
-        vector<string> show();
-        vector<string> graph(string title);
+        Ensemble& fit(vector<vector<int>>& X, vector<int>& y, vector<string>& features, string className, map<string, vector<int>>& states) override;
+        Ensemble& fit(torch::Tensor& X, torch::Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states) override;
+        Tensor predict(Tensor& X) override;
+        vector<int> predict(vector<vector<int>>& X) override;
+        float score(Tensor& X, Tensor& y) override;
+        float score(vector<vector<int>>& X, vector<int>& y) override;
+        int getNumberOfNodes() override;
+        int getNumberOfEdges() override;
+        int getNumberOfStates() override;
+        vector<string> show() override;
+        vector<string> graph(const string& title) override;
+        vector<string> topological_order() override
+        {
+            return vector<string>();
+        }
+        void dump_cpt() override
+        {
+        }
    };
 }
 #endif
--- a/src/BayesNet/KDB.cc
+++ b/src/BayesNet/KDB.cc
@@ -1,10 +1,9 @@
 #include "KDB.h"

 namespace bayesnet {
-    using namespace std;
    using namespace torch;

-    KDB::KDB(int k, float theta) : BaseClassifier(Network()), k(k), theta(theta) {}
+    KDB::KDB(int k, float theta) : Classifier(Network()), k(k), theta(theta) {}
    void KDB::train()
    {
        /*
@@ -28,9 +27,10 @@ namespace bayesnet {
        */
        // 1. For each feature Xi, compute mutual information, I(X;C),
        // where C is the class.
+        addNodes();
        vector <float> mi;
        for (auto i = 0; i < features.size(); i++) {
-            Tensor firstFeature = X.index({ "...", i });
+            Tensor firstFeature = X.index({ i, "..." });
            mi.push_back(metrics.mutualInformation(firstFeature, y));
        }
        // 2. Compute class conditional mutual information I(Xi;XjIC), f or each
@@ -39,14 +39,12 @@ namespace bayesnet {
        vector<int> S;
        // 4. Let the DAG network being constructed, BN, begin with a single
        // class node, C.
-        model.addNode(className, states[className].size());
        // 5. Repeat until S includes all domain features
        // 5.1. Select feature Xmax which is not in S and has the largest value
        // I(Xmax;C).
        auto order = argsort(mi);
        for (auto idx : order) {
            // 5.2. Add a node to BN representing Xmax.
-            model.addNode(features[idx], states[features[idx]].size());
            // 5.3. Add an arc from C to Xmax in BN.
            model.addEdge(className, features[idx]);
            // 5.4. Add m = min(lSl,/c) arcs from m distinct features Xj in S with
@@ -80,11 +78,12 @@ namespace bayesnet {
            exit_cond = num == n_edges || candidates.size(0) == 0;
        }
    }
-    vector<string> KDB::graph(string title)
+    vector<string> KDB::graph(const string& title)
    {
+        string header{ title };
        if (title == "KDB") {
-            title += " (k=" + to_string(k) + ", theta=" + to_string(theta) + ")";
+            header += " (k=" + to_string(k) + ", theta=" + to_string(theta) + ")";
        }
-        return model.graph(title);
+        return model.graph(header);
    }
 }
--- a/src/BayesNet/KDB.h
+++ b/src/BayesNet/KDB.h
@@ -1,11 +1,11 @@
 #ifndef KDB_H
 #define KDB_H
-#include "BaseClassifier.h"
+#include "Classifier.h"
 #include "bayesnetUtils.h"
 namespace bayesnet {
    using namespace std;
    using namespace torch;
-    class KDB : public BaseClassifier {
+    class KDB : public Classifier {
    private:
        int k;
        float theta;
@@ -13,8 +13,9 @@ namespace bayesnet {
    protected:
        void train() override;
    public:
-        KDB(int k, float theta = 0.03);
-        vector<string> graph(string name = "KDB") override;
+        explicit KDB(int k, float theta = 0.03);
+        virtual ~KDB() {};
+        vector<string> graph(const string& name = "KDB") override;
    };
 }
 #endif
--- a/src/BayesNet/KDBLd.cc
+++ b/src/BayesNet/KDBLd.cc
@@ -0,0 +1,35 @@
+#include "KDBLd.h"
+
+namespace bayesnet {
+    using namespace std;
+    KDBLd::KDBLd(int k) : KDB(k), Proposal(KDB::Xv, KDB::yv, features, className) {}
+    KDBLd& KDBLd::fit(torch::Tensor& X_, torch::Tensor& y_, vector<string>& features_, string className_, map<string, vector<int>>& states_)
+    {
+        // This first part should go in a Classifier method called fit_local_discretization o fit_float...
+        features = features_;
+        className = className_;
+        Xf = X_;
+        y = y_;
+        // Fills vectors Xv & yv with the data from tensors X_ (discretized) & y
+        fit_local_discretization(states, y);
+        generateTensorXFromVector();
+        // We have discretized the input data
+        // 1st we need to fit the model to build the normal KDB structure, KDB::fit initializes the base Bayesian network
+        KDB::fit(KDB::Xv, KDB::yv, features, className, states);
+        localDiscretizationProposal(states, model);
+        generateTensorXFromVector();
+        Tensor ytmp = torch::transpose(y.view({ y.size(0), 1 }), 0, 1);
+        samples = torch::cat({ X, ytmp }, 0);
+        model.fit(KDB::Xv, KDB::yv, features, className);
+        return *this;
+    }
+    Tensor KDBLd::predict(Tensor& X)
+    {
+        auto Xt = prepareX(X);
+        return KDB::predict(Xt);
+    }
+    vector<string> KDBLd::graph(const string& name)
+    {
+        return KDB::graph(name);
+    }
+}
--- a/src/BayesNet/KDBLd.h
+++ b/src/BayesNet/KDBLd.h
@@ -0,0 +1,19 @@
+#ifndef KDBLD_H
+#define KDBLD_H
+#include "KDB.h"
+#include "Proposal.h"
+
+namespace bayesnet {
+    using namespace std;
+    class KDBLd : public KDB, public Proposal {
+    private:
+    public:
+        explicit KDBLd(int k);
+        virtual ~KDBLd() = default;
+        KDBLd& fit(torch::Tensor& X, torch::Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states) override;
+        vector<string> graph(const string& name = "KDB") override;
+        Tensor predict(Tensor& X) override;
+        static inline string version() { return "0.0.1"; };
+    };
+}
+#endif // !KDBLD_H
--- a/src/BayesNet/Mst.cc
+++ b/src/BayesNet/Mst.cc
@@ -7,9 +7,8 @@

 namespace bayesnet {
    using namespace std;
-    Graph::Graph(int V)
+    Graph::Graph(int V) : V(V), parent(vector<int>(V))
    {
-        parent = vector<int>(V);
        for (int i = 0; i < V; i++)
            parent[i] = i;
        G.clear();
@@ -34,10 +33,10 @@ namespace bayesnet {
    }
    void Graph::kruskal_algorithm()
    {
-        int i, uSt, vEd;
        // sort the edges ordered on decreasing weight
-        sort(G.begin(), G.end(), [](auto& left, auto& right) {return left.first > right.first;});
-        for (i = 0; i < G.size(); i++) {
+        sort(G.begin(), G.end(), [](const auto& left, const auto& right) {return left.first > right.first;});
+        for (int i = 0; i < G.size(); i++) {
+            int uSt, vEd;
            uSt = find_set(G[i].second.first);
            vEd = find_set(G[i].second.second);
            if (uSt != vEd) {
@@ -103,7 +102,7 @@ namespace bayesnet {

        // Make a complete graph
        for (int i = 0; i < num_features - 1; ++i) {
-            for (int j = i; j < num_features; ++j) {
+            for (int j = i + 1; j < num_features; ++j) {
                g.addEdge(i, j, weights[i][j].item<float>());
            }
        }
--- a/src/BayesNet/Mst.h
+++ b/src/BayesNet/Mst.h
@@ -10,7 +10,7 @@ namespace bayesnet {
    private:
        Tensor weights;
        vector<string> features;
-        int root;
+        int root = 0;
    public:
        MST() = default;
        MST(vector<string>& features, Tensor& weights, int root);
@@ -23,7 +23,7 @@ namespace bayesnet {
        vector <pair<float, pair<int, int>>> T; // vector for mst
        vector<int> parent;
    public:
-        Graph(int V);
+        explicit Graph(int V);
        void addEdge(int u, int v, float wt);
        int find_set(int i);
        void union_set(int u, int v);
--- a/src/BayesNet/Network.cc
+++ b/src/BayesNet/Network.cc
@@ -1,16 +1,28 @@
 #include <thread>
 #include <mutex>
 #include "Network.h"
+#include "bayesnetUtils.h"
 namespace bayesnet {
-    Network::Network() : laplaceSmoothing(1), features(vector<string>()), className(""), classNumStates(0), maxThreads(0.8), fitted(false) {}
-    Network::Network(float maxT) : laplaceSmoothing(1), features(vector<string>()), className(""), classNumStates(0), maxThreads(maxT), fitted(false) {}
+    Network::Network() : features(vector<string>()), className(""), classNumStates(0), fitted(false) {}
+    Network::Network(float maxT) : features(vector<string>()), className(""), classNumStates(0), maxThreads(maxT), fitted(false) {}
    Network::Network(float maxT, int smoothing) : laplaceSmoothing(smoothing), features(vector<string>()), className(""), classNumStates(0), maxThreads(maxT), fitted(false) {}
-    Network::Network(Network& other) : laplaceSmoothing(other.laplaceSmoothing), features(other.features), className(other.className), classNumStates(other.getClassNumStates()), maxThreads(other.getmaxThreads()), fitted(other.fitted)
+    Network::Network(Network& other) : laplaceSmoothing(other.laplaceSmoothing), features(other.features), className(other.className), classNumStates(other.getClassNumStates()), maxThreads(other.
+        getmaxThreads()), fitted(other.fitted)
    {
-        for (auto& pair : other.nodes) {
-            nodes[pair.first] = make_unique<Node>(*pair.second);
+        for (const auto& pair : other.nodes) {
+            nodes[pair.first] = std::make_unique<Node>(*pair.second);
        }
    }
+    void Network::initialize()
+    {
+        features = vector<string>();
+        className = "";
+        classNumStates = 0;
+        fitted = false;
+        nodes.clear();
+        dataset.clear();
+        samples = torch::Tensor();
+    }
    float Network::getmaxThreads()
    {
        return maxThreads;
@@ -19,17 +31,18 @@ namespace bayesnet {
    {
        return samples;
    }
-    void Network::addNode(string name, int numStates)
+    void Network::addNode(const string& name)
    {
+        if (name == "") {
+            throw invalid_argument("Node name cannot be empty");
+        }
+        if (nodes.find(name) != nodes.end()) {
+            return;
+        }
        if (find(features.begin(), features.end(), name) == features.end()) {
            features.push_back(name);
        }
-        if (nodes.find(name) != nodes.end()) {
-            // if node exists update its number of states
-            nodes[name]->setNumStates(numStates);
-            return;
-        }
-        nodes[name] = make_unique<Node>(name, numStates);
+        nodes[name] = std::make_unique<Node>(name);
    }
    vector<string> Network::getFeatures()
    {
@@ -67,7 +80,7 @@ namespace bayesnet {
        recStack.erase(nodeId); // remove node from recursion stack before function ends
        return false;
    }
-    void Network::addEdge(const string parent, const string child)
+    void Network::addEdge(const string& parent, const string& child)
    {
        if (nodes.find(parent) == nodes.end()) {
            throw invalid_argument("Parent node " + parent + " does not exist");
@@ -87,27 +100,73 @@ namespace bayesnet {
            nodes[child]->removeParent(nodes[parent].get());
            throw invalid_argument("Adding this edge forms a cycle in the graph.");
        }
-
    }
    map<string, std::unique_ptr<Node>>& Network::getNodes()
    {
        return nodes;
    }
-    void Network::fit(const vector<vector<int>>& input_data, const vector<int>& labels, const vector<string>& featureNames, const string& className)
+    void Network::checkFitData(int n_samples, int n_features, int n_samples_y, const vector<string>& featureNames, const string& className)
    {
-        features = featureNames;
+        if (n_samples != n_samples_y) {
+            throw invalid_argument("X and y must have the same number of samples in Network::fit (" + to_string(n_samples) + " != " + to_string(n_samples_y) + ")");
+        }
+        if (n_features != featureNames.size()) {
+            throw invalid_argument("X and features must have the same number of features in Network::fit (" + to_string(n_features) + " != " + to_string(featureNames.size()) + ")");
+        }
+        if (n_features != features.size() - 1) {
+            throw invalid_argument("X and local features must have the same number of features in Network::fit (" + to_string(n_features) + " != " + to_string(features.size() - 1) + ")");
+        }
+        if (find(features.begin(), features.end(), className) == features.end()) {
+            throw invalid_argument("className not found in Network::features");
+        }
+        for (auto& feature : featureNames) {
+            if (find(features.begin(), features.end(), feature) == features.end()) {
+                throw invalid_argument("Feature " + feature + " not found in Network::features");
+            }
+        }
+    }
+    void Network::setStates()
+    {
+        // Set states to every Node in the network
+        for (int i = 0; i < features.size(); ++i) {
+            nodes[features[i]]->setNumStates(static_cast<int>(torch::max(samples.index({ i, "..." })).item<int>()) + 1);
+        }
+        classNumStates = nodes[className]->getNumStates();
+    }
+    // X comes in nxm, where n is the number of features and m the number of samples
+    void Network::fit(torch::Tensor& X, torch::Tensor& y, const vector<string>& featureNames, const string& className)
+    {
+        checkFitData(X.size(1), X.size(0), y.size(0), featureNames, className);
        this->className = className;
        dataset.clear();
-
-        // Build dataset & tensor of samples
-        samples = torch::zeros({ static_cast<int64_t>(input_data[0].size()), static_cast<int64_t>(input_data.size() + 1) }, torch::kInt64);
+        Tensor ytmp = torch::transpose(y.view({ y.size(0), 1 }), 0, 1);
+        samples = torch::cat({ X , ytmp }, 0);
+        for (int i = 0; i < featureNames.size(); ++i) {
+            auto row_feature = X.index({ i, "..." });
+            dataset[featureNames[i]] = vector<int>(row_feature.data_ptr<int>(), row_feature.data_ptr<int>() + row_feature.size(0));;
+        }
+        dataset[className] = vector<int>(y.data_ptr<int>(), y.data_ptr<int>() + y.size(0));
+        completeFit();
+    }
+    // input_data comes in nxm, where n is the number of features and m the number of samples
+    void Network::fit(const vector<vector<int>>& input_data, const vector<int>& labels, const vector<string>& featureNames, const string& className)
+    {
+        checkFitData(input_data[0].size(), input_data.size(), labels.size(), featureNames, className);
+        this->className = className;
+        dataset.clear();
+        // Build dataset & tensor of samples (nxm) (n+1 because of the class)
+        samples = torch::zeros({ static_cast<int>(input_data.size() + 1), static_cast<int>(input_data[0].size()) }, torch::kInt32);
        for (int i = 0; i < featureNames.size(); ++i) {
            dataset[featureNames[i]] = input_data[i];
-            samples.index_put_({ "...", i }, torch::tensor(input_data[i], torch::kInt64));
+            samples.index_put_({ i, "..." }, torch::tensor(input_data[i], torch::kInt32));
        }
        dataset[className] = labels;
-        samples.index_put_({ "...", -1 }, torch::tensor(labels, torch::kInt64));
-        classNumStates = *max_element(labels.begin(), labels.end()) + 1;
+        samples.index_put_({ -1, "..." }, torch::tensor(labels, torch::kInt32));
+        completeFit();
+    }
+    void Network::completeFit()
+    {
+        setStates();
        int maxThreadsRunning = static_cast<int>(std::thread::hardware_concurrency() * maxThreads);
        if (maxThreadsRunning < 1) {
            maxThreadsRunning = 1;
@@ -117,15 +176,9 @@ namespace bayesnet {
        condition_variable cv;
        int activeThreads = 0;
        int nextNodeIndex = 0;
-
        while (nextNodeIndex < nodes.size()) {
            unique_lock<mutex> lock(mtx);
            cv.wait(lock, [&activeThreads, &maxThreadsRunning]() { return activeThreads < maxThreadsRunning; });
-
-            if (nextNodeIndex >= nodes.size()) {
-                break;  // No more work remaining
-            }
-
            threads.emplace_back([this, &nextNodeIndex, &mtx, &cv, &activeThreads]() {
                while (true) {
                    unique_lock<mutex> lock(mtx);
@@ -135,7 +188,6 @@ namespace bayesnet {
                    auto& pair = *std::next(nodes.begin(), nextNodeIndex);
                    ++nextNodeIndex;
                    lock.unlock();
-
                    pair.second->computeCPT(dataset, laplaceSmoothing);
                    lock.lock();
                    nodes[pair.first] = std::move(pair.second);
@@ -145,7 +197,6 @@ namespace bayesnet {
                --activeThreads;
                cv.notify_one();
                });
-
            ++activeThreads;
        }
        for (auto& thread : threads) {
@@ -153,7 +204,39 @@ namespace bayesnet {
        }
        fitted = true;
    }
+    torch::Tensor Network::predict_tensor(const torch::Tensor& samples, const bool proba)
+    {
+        if (!fitted) {
+            throw logic_error("You must call fit() before calling predict()");
+        }
+        torch::Tensor result;
+        result = torch::zeros({ samples.size(1), classNumStates }, torch::kFloat64);
+        for (int i = 0; i < samples.size(1); ++i) {
+            auto sample = samples.index({ "...", i });
+            auto psample = predict_sample(sample);
+            auto temp = torch::tensor(psample, torch::kFloat64);
+            //            result.index_put_({ i, "..." }, torch::tensor(predict_sample(sample), torch::kFloat64));
+            result.index_put_({ i, "..." }, temp);
+        }
+        if (proba)
+            return result;
+        else
+            return result.argmax(1);
+    }
+    // Return mxn tensor of probabilities
+    Tensor Network::predict_proba(const Tensor& samples)
+    {
+        return predict_tensor(samples, true);
+    }

+    // Return mxn tensor of probabilities
+    Tensor Network::predict(const Tensor& samples)
+    {
+        return predict_tensor(samples, false);
+    }
+
+    // Return mx1 vector of predictions
+    // tsamples is nxm vector of samples
    vector<int> Network::predict(const vector<vector<int>>& tsamples)
    {
        if (!fitted) {
@@ -174,6 +257,7 @@ namespace bayesnet {
        }
        return predictions;
    }
+    // Return mxn vector of probabilities
    vector<vector<double>> Network::predict_proba(const vector<vector<int>>& tsamples)
    {
        if (!fitted) {
@@ -201,19 +285,33 @@ namespace bayesnet {
        }
        return (double)correct / y_pred.size();
    }
+    // Return 1xn vector of probabilities
    vector<double> Network::predict_sample(const vector<int>& sample)
    {
        // Ensure the sample size is equal to the number of features
-        if (sample.size() != features.size()) {
+        if (sample.size() != features.size() - 1) {
            throw invalid_argument("Sample size (" + to_string(sample.size()) +
-                ") does not match the number of features (" + to_string(features.size()) + ")");
+                ") does not match the number of features (" + to_string(features.size() - 1) + ")");
        }
        map<string, int> evidence;
        for (int i = 0; i < sample.size(); ++i) {
            evidence[features[i]] = sample[i];
        }
        return exactInference(evidence);
-
+    }
+    // Return 1xn vector of probabilities
+    vector<double> Network::predict_sample(const Tensor& sample)
+    {
+        // Ensure the sample size is equal to the number of features
+        if (sample.size(0) != features.size() - 1) {
+            throw invalid_argument("Sample size (" + to_string(sample.size(0)) +
+                ") does not match the number of features (" + to_string(features.size() - 1) + ")");
+        }
+        map<string, int> evidence;
+        for (int i = 0; i < sample.size(0); ++i) {
+            evidence[features[i]] = sample[i].item<int>();
+        }
+        return exactInference(evidence);
    }
    double Network::computeFactor(map<string, int>& completeEvidence)
    {
@@ -230,22 +328,19 @@ namespace bayesnet {
        mutex mtx;
        for (int i = 0; i < classNumStates; ++i) {
            threads.emplace_back([this, &result, &evidence, i, &mtx]() {
-                auto completeEvidence = map<string, int>(evidence);
-                completeEvidence[getClassName()] = i;
+            auto completeEvidence = map<string, int>(evidence);
+            completeEvidence[getClassName()] = i;
                double factor = computeFactor(completeEvidence);
                lock_guard<mutex> lock(mtx);
                result[i] = factor;
-                });
+            });
        }
        for (auto& thread : threads) {
            thread.join();
        }
-
        // Normalize result
        double sum = accumulate(result.begin(), result.end(), 0.0);
-        for (double& value : result) {
-            value /= sum;
-        }
+        transform(result.begin(), result.end(), result.begin(), [sum](double& value) { return value / sum; });
        return result;
    }
    vector<string> Network::show()
@@ -261,7 +356,7 @@ namespace bayesnet {
        }
        return result;
    }
-    vector<string> Network::graph(string title)
+    vector<string> Network::graph(const string& title)
    {
        auto output = vector<string>();
        auto prefix = "digraph BayesNet {\nlabel=<BayesNet ";
@@ -287,5 +382,48 @@ namespace bayesnet {
        }
        return edges;
    }
-
+    vector<string> Network::topological_sort()
+    {
+        /* Check if al the fathers of every node are before the node */
+        auto result = features;
+        result.erase(remove(result.begin(), result.end(), className), result.end());
+        bool ending{ false };
+        int idx = 0;
+        while (!ending) {
+            ending = true;
+            for (auto feature : features) {
+                auto fathers = nodes[feature]->getParents();
+                for (const auto& father : fathers) {
+                    auto fatherName = father->getName();
+                    if (fatherName == className) {
+                        continue;
+                    }
+                    // Check if father is placed before the actual feature
+                    auto it = find(result.begin(), result.end(), fatherName);
+                    if (it != result.end()) {
+                        auto it2 = find(result.begin(), result.end(), feature);
+                        if (it2 != result.end()) {
+                            if (distance(it, it2) < 0) {
+                                // if it is not, insert it before the feature
+                                result.erase(remove(result.begin(), result.end(), fatherName), result.end());
+                                result.insert(it2, fatherName);
+                                ending = false;
+                            }
+                        } else {
+                            throw logic_error("Error in topological sort because of node " + feature + " is not in result");
+                        }
+                    } else {
+                        throw logic_error("Error in topological sort because of node father " + fatherName + " is not in result");
+                    }
+                }
+            }
+        }
+        return result;
+    }
+    void Network::dump_cpt()
+    {
+        for (auto& node : nodes) {
+            cout << "* " << node.first << ": (" << node.second->getNumStates() << ") : " << node.second->getCPT().sizes() << endl;
+        }
+    }
 }
--- a/src/BayesNet/Network.h
+++ b/src/BayesNet/Network.h
@@ -7,32 +7,36 @@
 namespace bayesnet {
    class Network {
    private:
-        map<string, std::unique_ptr<Node>> nodes;
+        map<string, unique_ptr<Node>> nodes;
        map<string, vector<int>> dataset;
        bool fitted;
-        float maxThreads;
+        float maxThreads = 0.95;
        int classNumStates;
-        vector<string> features;
+        vector<string> features; // Including class
        string className;
-        int laplaceSmoothing;
-        torch::Tensor samples;
+        int laplaceSmoothing = 1;
+        torch::Tensor samples; // nxm tensor used to fit the model
        bool isCyclic(const std::string&, std::unordered_set<std::string>&, std::unordered_set<std::string>&);
        vector<double> predict_sample(const vector<int>&);
+        vector<double> predict_sample(const torch::Tensor&);
        vector<double> exactInference(map<string, int>&);
        double computeFactor(map<string, int>&);
        double mutual_info(torch::Tensor&, torch::Tensor&);
        double entropy(torch::Tensor&);
        double conditionalEntropy(torch::Tensor&, torch::Tensor&);
        double mutualInformation(torch::Tensor&, torch::Tensor&);
+        void completeFit();
+        void checkFitData(int n_features, int n_samples, int n_samples_y, const vector<string>& featureNames, const string& className);
+        void setStates();
    public:
        Network();
-        Network(float, int);
-        Network(float);
-        Network(Network&);
+        explicit Network(float, int);
+        explicit Network(float);
+        explicit Network(Network&);
        torch::Tensor& getSamples();
        float getmaxThreads();
-        void addNode(string, int);
-        void addEdge(const string, const string);
+        void addNode(const string&);
+        void addEdge(const string&, const string&);
        map<string, std::unique_ptr<Node>>& getNodes();
        vector<string> getFeatures();
        int getStates();
@@ -40,13 +44,20 @@ namespace bayesnet {
        int getClassNumStates();
        string getClassName();
        void fit(const vector<vector<int>>&, const vector<int>&, const vector<string>&, const string&);
-        vector<int> predict(const vector<vector<int>>&);
+        void fit(torch::Tensor&, torch::Tensor&, const vector<string>&, const string&);
+        vector<int> predict(const vector<vector<int>>&); // Return mx1 vector of predictions
+        torch::Tensor predict(const torch::Tensor&); // Return mx1 tensor of predictions
        //Computes the conditional edge weight of variable index u and v conditioned on class_node
        torch::Tensor conditionalEdgeWeight();
-        vector<vector<double>> predict_proba(const vector<vector<int>>&);
+        torch::Tensor predict_tensor(const torch::Tensor& samples, const bool proba);
+        vector<vector<double>> predict_proba(const vector<vector<int>>&); // Return mxn vector of probabilities
+        torch::Tensor predict_proba(const torch::Tensor&); // Return mxn tensor of probabilities
        double score(const vector<vector<int>>&, const vector<int>&);
+        vector<string> topological_sort();
        vector<string> show();
-        vector<string> graph(string title); // Returns a vector of strings representing the graph in graphviz format
+        vector<string> graph(const string& title); // Returns a vector of strings representing the graph in graphviz format
+        void initialize();
+        void dump_cpt();
        inline string version() { return "0.1.0"; }
    };
 }
--- a/src/BayesNet/Node.cc
+++ b/src/BayesNet/Node.cc
@@ -2,10 +2,18 @@

 namespace bayesnet {

-    Node::Node(const std::string& name, int numStates)
-        : name(name), numStates(numStates), cpTable(torch::Tensor()), parents(vector<Node*>()), children(vector<Node*>())
+    Node::Node(const std::string& name)
+        : name(name), numStates(0), cpTable(torch::Tensor()), parents(vector<Node*>()), children(vector<Node*>())
    {
    }
+    void Node::clear()
+    {
+        parents.clear();
+        children.clear();
+        cpTable = torch::Tensor();
+        dimensions.clear();
+        numStates = 0;
+    }
    string Node::getName() const
    {
        return name;
@@ -78,21 +86,18 @@ namespace bayesnet {
    }
    void Node::computeCPT(map<string, vector<int>>& dataset, const int laplaceSmoothing)
    {
+        dimensions.clear();
        // Get dimensions of the CPT
        dimensions.push_back(numStates);
-        for (auto father : getParents()) {
-            dimensions.push_back(father->getNumStates());
-        }
-        auto length = dimensions.size();
+        transform(parents.begin(), parents.end(), back_inserter(dimensions), [](const auto& parent) { return parent->getNumStates(); });
+
        // Create a tensor of zeros with the dimensions of the CPT
        cpTable = torch::zeros(dimensions, torch::kFloat) + laplaceSmoothing;
        // Fill table with counts
        for (int n_sample = 0; n_sample < dataset[name].size(); ++n_sample) {
            torch::List<c10::optional<torch::Tensor>> coordinates;
            coordinates.push_back(torch::tensor(dataset[name][n_sample]));
-            for (auto father : getParents()) {
-                coordinates.push_back(torch::tensor(dataset[father->getName()][n_sample]));
-            }
+            transform(parents.begin(), parents.end(), back_inserter(coordinates), [&dataset, &n_sample](const auto& parent) { return torch::tensor(dataset[parent->getName()][n_sample]); });
            // Increment the count of the corresponding coordinate
            cpTable.index_put_({ coordinates }, cpTable.index({ coordinates }) + 1);
        }
@@ -104,19 +109,15 @@ namespace bayesnet {
        torch::List<c10::optional<torch::Tensor>> coordinates;
        // following predetermined order of indices in the cpTable (see Node.h)
        coordinates.push_back(torch::tensor(evidence[name]));
-        for (auto parent : getParents()) {
-            coordinates.push_back(torch::tensor(evidence[parent->getName()]));
-        }
+        transform(parents.begin(), parents.end(), back_inserter(coordinates), [&evidence](const auto& parent) { return torch::tensor(evidence[parent->getName()]); });
        return cpTable.index({ coordinates }).item<float>();
    }
-    vector<string> Node::graph(string className)
+    vector<string> Node::graph(const string& className)
    {
        auto output = vector<string>();
        auto suffix = name == className ? ", fontcolor=red, fillcolor=lightblue, style=filled " : "";
        output.push_back(name + " [shape=circle" + suffix + "] \n");
-        for (auto& child : children) {
-            output.push_back(name + " -> " + child->getName());
-        }
+        transform(children.begin(), children.end(), back_inserter(output), [this](const auto& child) { return name + " -> " + child->getName(); });
        return output;
    }
 }
--- a/src/BayesNet/Node.h
+++ b/src/BayesNet/Node.h
@@ -16,7 +16,8 @@ namespace bayesnet {
        vector<int64_t> dimensions; // dimensions of the cpTable
    public:
        vector<pair<string, string>> combinations(const vector<string>&);
-        Node(const std::string&, int);
+        explicit Node(const string&);
+        void clear();
        void addParent(Node*);
        void addChild(Node*);
        void removeParent(Node*);
@@ -29,7 +30,7 @@ namespace bayesnet {
        int getNumStates() const;
        void setNumStates(int);
        unsigned minFill();
-        vector<string> graph(string clasName); // Returns a vector of strings representing the graph in graphviz format
+        vector<string> graph(const string& clasName); // Returns a vector of strings representing the graph in graphviz format
        float getFactorValue(map<string, int>&);
    };
 }
--- a/src/BayesNet/Proposal.cc
+++ b/src/BayesNet/Proposal.cc
@@ -0,0 +1,102 @@
+#include "Proposal.h"
+#include "ArffFiles.h"
+
+namespace bayesnet {
+    Proposal::Proposal(vector<vector<int>>& Xv_, vector<int>& yv_, vector<string>& features_, string& className_) : Xv(Xv_), yv(yv_), pFeatures(features_), pClassName(className_) {}
+    Proposal::~Proposal()
+    {
+        for (auto& [key, value] : discretizers) {
+            delete value;
+        }
+    }
+    void Proposal::localDiscretizationProposal(map<string, vector<int>>& states, Network& model)
+    {
+        // order of local discretization is important. no good 0, 1, 2...
+        // although we rediscretize features after the local discretization of every feature
+        auto order = model.topological_sort();
+        auto& nodes = model.getNodes();
+        vector<int> indicesToReDiscretize;
+        auto n_samples = Xf.size(1);
+        bool upgrade = false; // Flag to check if we need to upgrade the model
+        for (auto feature : order) {
+            auto nodeParents = nodes[feature]->getParents();
+            if (nodeParents.size() < 2) continue; // Only has class as parent
+            upgrade = true;
+            int index = find(pFeatures.begin(), pFeatures.end(), feature) - pFeatures.begin();
+            indicesToReDiscretize.push_back(index); // We need to re-discretize this feature
+            vector<string> parents;
+            transform(nodeParents.begin(), nodeParents.end(), back_inserter(parents), [](const auto& p) { return p->getName(); });
+            // Remove class as parent as it will be added later
+            parents.erase(remove(parents.begin(), parents.end(), pClassName), parents.end());
+            // Get the indices of the parents
+            vector<int> indices;
+            transform(parents.begin(), parents.end(), back_inserter(indices), [&](const auto& p) {return find(pFeatures.begin(), pFeatures.end(), p) - pFeatures.begin(); });
+            // Now we fit the discretizer of the feature, conditioned on its parents and the class i.e. discretizer.fit(X[index], X[indices] + y)
+            vector<string> yJoinParents;
+            transform(yv.begin(), yv.end(), back_inserter(yJoinParents), [&](const auto& p) {return to_string(p); });
+            for (auto idx : indices) {
+                for (int i = 0; i < n_samples; ++i) {
+                    yJoinParents[i] += to_string(Xv[idx][i]);
+                }
+            }
+            auto arff = ArffFiles();
+            auto yxv = arff.factorize(yJoinParents);
+            auto xvf_ptr = Xf.index({ index }).data_ptr<float>();
+            auto xvf = vector<mdlp::precision_t>(xvf_ptr, xvf_ptr + Xf.size(1));
+            discretizers[feature]->fit(xvf, yxv);
+            //
+            //
+            //
+            // auto tmp = discretizers[feature]->transform(xvf);
+            // Xv[index] = tmp;
+            // auto xStates = vector<int>(discretizers[pFeatures[index]]->getCutPoints().size() + 1);
+            // iota(xStates.begin(), xStates.end(), 0);
+            // //Update new states of the feature/node
+            // states[feature] = xStates;
+        }
+        if (upgrade) {
+            // Discretize again X (only the affected indices) with the new fitted discretizers
+            for (auto index : indicesToReDiscretize) {
+                auto Xt_ptr = Xf.index({ index }).data_ptr<float>();
+                auto Xt = vector<float>(Xt_ptr, Xt_ptr + Xf.size(1));
+                Xv[index] = discretizers[pFeatures[index]]->transform(Xt);
+                auto xStates = vector<int>(discretizers[pFeatures[index]]->getCutPoints().size() + 1);
+                iota(xStates.begin(), xStates.end(), 0);
+                //Update new states of the feature/node
+                states[pFeatures[index]] = xStates;
+            }
+        }
+    }
+    void Proposal::fit_local_discretization(map<string, vector<int>>& states, torch::Tensor& y)
+    {
+        // Sharing Xv and yv with Classifier
+        Xv = vector<vector<int>>();
+        yv = vector<int>(y.data_ptr<int>(), y.data_ptr<int>() + y.size(0));
+        // discretize input data by feature(row)
+        for (int i = 0; i < pFeatures.size(); ++i) {
+            auto* discretizer = new mdlp::CPPFImdlp();
+            auto Xt_ptr = Xf.index({ i }).data_ptr<float>();
+            auto Xt = vector<float>(Xt_ptr, Xt_ptr + Xf.size(1));
+            discretizer->fit(Xt, yv);
+            Xv.push_back(discretizer->transform(Xt));
+            auto xStates = vector<int>(discretizer->getCutPoints().size() + 1);
+            iota(xStates.begin(), xStates.end(), 0);
+            states[pFeatures[i]] = xStates;
+            discretizers[pFeatures[i]] = discretizer;
+        }
+        int n_classes = torch::max(y).item<int>() + 1;
+        auto yStates = vector<int>(n_classes);
+        iota(yStates.begin(), yStates.end(), 0);
+        states[pClassName] = yStates;
+    }
+    torch::Tensor Proposal::prepareX(torch::Tensor& X)
+    {
+        auto Xtd = torch::zeros_like(X, torch::kInt32);
+        for (int i = 0; i < X.size(0); ++i) {
+            auto Xt = vector<float>(X[i].data_ptr<float>(), X[i].data_ptr<float>() + X.size(1));
+            auto Xd = discretizers[pFeatures[i]]->transform(Xt);
+            Xtd.index_put_({ i }, torch::tensor(Xd, torch::kInt32));
+        }
+        return Xtd;
+    }
+}
--- a/src/BayesNet/Proposal.h
+++ b/src/BayesNet/Proposal.h
@@ -0,0 +1,29 @@
+#ifndef PROPOSAL_H
+#define PROPOSAL_H
+#include <string>
+#include <map>
+#include <torch/torch.h>
+#include "Network.h"
+#include "CPPFImdlp.h"
+#include "Classifier.h"
+
+namespace bayesnet {
+    class Proposal {
+    public:
+        Proposal(vector<vector<int>>& Xv_, vector<int>& yv_, vector<string>& features_, string& className_);
+        virtual ~Proposal();
+    protected:
+        torch::Tensor prepareX(torch::Tensor& X);
+        void localDiscretizationProposal(map<string, vector<int>>& states, Network& model);
+        void fit_local_discretization(map<string, vector<int>>& states, torch::Tensor& y);
+        torch::Tensor Xf; // X continuous nxm tensor
+        map<string, mdlp::CPPFImdlp*> discretizers;
+    private:
+        vector<string>& pFeatures;
+        string& pClassName;
+        vector<vector<int>>& Xv; // X discrete nxm vector
+        vector<int>& yv;
+    };
+}
+
+#endif
--- a/src/BayesNet/SPODE.cc
+++ b/src/BayesNet/SPODE.cc
@@ -2,7 +2,7 @@

 namespace bayesnet {

-    SPODE::SPODE(int root) : BaseClassifier(Network()), root(root) {}
+    SPODE::SPODE(int root) : Classifier(Network()), root(root) {}

    void SPODE::train()
    {
@@ -17,7 +17,7 @@ namespace bayesnet {
            }
        }
    }
-    vector<string> SPODE::graph(string name )
+    vector<string> SPODE::graph(const string& name)
    {
        return model.graph(name);
    }
--- a/src/BayesNet/SPODE.h
+++ b/src/BayesNet/SPODE.h
@@ -1,15 +1,17 @@
 #ifndef SPODE_H
 #define SPODE_H
-#include "BaseClassifier.h"
+#include "Classifier.h"
+
 namespace bayesnet {
-    class SPODE : public BaseClassifier {
+    class SPODE : public Classifier {
    private:
        int root;
    protected:
        void train() override;
    public:
-        SPODE(int root);
-        vector<string> graph(string name = "SPODE") override;
+        explicit SPODE(int root);
+        virtual ~SPODE() {};
+        vector<string> graph(const string& name = "SPODE") override;
    };
 }
 #endif
--- a/src/BayesNet/SPODELd.cc
+++ b/src/BayesNet/SPODELd.cc
@@ -0,0 +1,35 @@
+#include "SPODELd.h"
+
+namespace bayesnet {
+    using namespace std;
+    SPODELd::SPODELd(int root) : SPODE(root), Proposal(SPODE::Xv, SPODE::yv, features, className) {}
+    SPODELd& SPODELd::fit(torch::Tensor& X_, torch::Tensor& y_, vector<string>& features_, string className_, map<string, vector<int>>& states_)
+    {
+        // This first part should go in a Classifier method called fit_local_discretization o fit_float...
+        features = features_;
+        className = className_;
+        Xf = X_;
+        y = y_;
+        // Fills vectors Xv & yv with the data from tensors X_ (discretized) & y
+        fit_local_discretization(states, y);
+        generateTensorXFromVector();
+        // We have discretized the input data
+        // 1st we need to fit the model to build the normal SPODE structure, SPODE::fit initializes the base Bayesian network
+        SPODE::fit(SPODE::Xv, SPODE::yv, features, className, states);
+        localDiscretizationProposal(states, model);
+        generateTensorXFromVector();
+        Tensor ytmp = torch::transpose(y.view({ y.size(0), 1 }), 0, 1);
+        samples = torch::cat({ X, ytmp }, 0);
+        model.fit(SPODE::Xv, SPODE::yv, features, className);
+        return *this;
+    }
+    Tensor SPODELd::predict(Tensor& X)
+    {
+        auto Xt = prepareX(X);
+        return SPODE::predict(Xt);
+    }
+    vector<string> SPODELd::graph(const string& name)
+    {
+        return SPODE::graph(name);
+    }
+}
--- a/src/BayesNet/SPODELd.h
+++ b/src/BayesNet/SPODELd.h
@@ -0,0 +1,19 @@
+#ifndef SPODELD_H
+#define SPODELD_H
+#include "SPODE.h"
+#include "Proposal.h"
+
+namespace bayesnet {
+    using namespace std;
+    class SPODELd : public SPODE, public Proposal {
+    private:
+    public:
+        explicit SPODELd(int root);
+        virtual ~SPODELd() = default;
+        SPODELd& fit(torch::Tensor& X, torch::Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states) override;
+        vector<string> graph(const string& name = "SPODE") override;
+        Tensor predict(Tensor& X) override;
+        static inline string version() { return "0.0.1"; };
+    };
+}
+#endif // !SPODELD_H
--- a/src/BayesNet/TAN.cc
+++ b/src/BayesNet/TAN.cc
@@ -1,10 +1,9 @@
 #include "TAN.h"

 namespace bayesnet {
-    using namespace std;
    using namespace torch;

-    TAN::TAN() : BaseClassifier(Network()) {}
+    TAN::TAN() : Classifier(Network()) {}

    void TAN::train()
    {
@@ -13,13 +12,13 @@ namespace bayesnet {
        // 1. Compute mutual information between each feature and the class and set the root node
        // as the highest mutual information with the class
        auto mi = vector <pair<int, float >>();
-        Tensor class_dataset = dataset.index({ "...", -1 });
+        Tensor class_dataset = samples.index({ -1, "..." });
        for (int i = 0; i < static_cast<int>(features.size()); ++i) {
-            Tensor feature_dataset = dataset.index({ "...", i });
+            Tensor feature_dataset = samples.index({ i, "..." });
            auto mi_value = metrics.mutualInformation(class_dataset, feature_dataset);
            mi.push_back({ i, mi_value });
        }
-        sort(mi.begin(), mi.end(), [](auto& left, auto& right) {return left.second < right.second;});
+        sort(mi.begin(), mi.end(), [](const auto& left, const auto& right) {return left.second < right.second;});
        auto root = mi[mi.size() - 1].first;
        // 2. Compute mutual information between each feature and the class
        auto weights = metrics.conditionalEdge();
@@ -35,7 +34,7 @@ namespace bayesnet {
            model.addEdge(className, feature);
        }
    }
-    vector<string> TAN::graph(string title)
+    vector<string> TAN::graph(const string& title)
    {
        return model.graph(title);
    }
--- a/src/BayesNet/TAN.h
+++ b/src/BayesNet/TAN.h
@@ -1,16 +1,17 @@
 #ifndef TAN_H
 #define TAN_H
-#include "BaseClassifier.h"
+#include "Classifier.h"
 namespace bayesnet {
    using namespace std;
    using namespace torch;
-    class TAN : public BaseClassifier {
+    class TAN : public Classifier {
    private:
    protected:
        void train() override;
    public:
        TAN();
-        vector<string> graph(string name = "TAN") override;
+        virtual ~TAN() {};
+        vector<string> graph(const string& name = "TAN") override;
    };
 }
 #endif
--- a/src/BayesNet/TANLd.cc
+++ b/src/BayesNet/TANLd.cc
@@ -0,0 +1,35 @@
+#include "TANLd.h"
+
+namespace bayesnet {
+    using namespace std;
+    TANLd::TANLd() : TAN(), Proposal(TAN::Xv, TAN::yv, features, className) {}
+    TANLd& TANLd::fit(torch::Tensor& X_, torch::Tensor& y_, vector<string>& features_, string className_, map<string, vector<int>>& states_)
+    {
+        // This first part should go in a Classifier method called fit_local_discretization o fit_float...
+        features = features_;
+        className = className_;
+        Xf = X_;
+        y = y_;
+        // Fills vectors Xv & yv with the data from tensors X_ (discretized) & y
+        fit_local_discretization(states, y);
+        generateTensorXFromVector();
+        // We have discretized the input data
+        // 1st we need to fit the model to build the normal TAN structure, TAN::fit initializes the base Bayesian network
+        TAN::fit(TAN::Xv, TAN::yv, features, className, states);
+        localDiscretizationProposal(states, model);
+        generateTensorXFromVector();
+        Tensor ytmp = torch::transpose(y.view({ y.size(0), 1 }), 0, 1);
+        samples = torch::cat({ X, ytmp }, 0);
+        model.fit(TAN::Xv, TAN::yv, features, className);
+        return *this;
+    }
+    Tensor TANLd::predict(Tensor& X)
+    {
+        auto Xt = prepareX(X);
+        return TAN::predict(Xt);
+    }
+    vector<string> TANLd::graph(const string& name)
+    {
+        return TAN::graph(name);
+    }
+}
--- a/src/BayesNet/TANLd.h
+++ b/src/BayesNet/TANLd.h
@@ -0,0 +1,19 @@
+#ifndef TANLD_H
+#define TANLD_H
+#include "TAN.h"
+#include "Proposal.h"
+
+namespace bayesnet {
+    using namespace std;
+    class TANLd : public TAN, public Proposal {
+    private:
+    public:
+        TANLd();
+        virtual ~TANLd() = default;
+        TANLd& fit(torch::Tensor& X, torch::Tensor& y, vector<string>& features, string className, map<string, vector<int>>& states) override;
+        vector<string> graph(const string& name = "TAN") override;
+        Tensor predict(Tensor& X) override;
+        static inline string version() { return "0.0.1"; };
+    };
+}
+#endif // !TANLD_H
--- a/src/BayesNet/bayesnetUtils.cc
+++ b/src/BayesNet/bayesnetUtils.cc
@@ -3,6 +3,7 @@
 namespace bayesnet {
    using namespace std;
    using namespace torch;
+    // Return the indices in descending order
    vector<int> argsort(vector<float>& nums)
    {
        int n = nums.size();
@@ -11,21 +12,16 @@ namespace bayesnet {
        sort(indices.begin(), indices.end(), [&nums](int i, int j) {return nums[i] > nums[j];});
        return indices;
    }
-    vector<vector<int>> tensorToVector(const Tensor& tensor)
+    vector<vector<int>> tensorToVector(Tensor& tensor)
    {
        // convert mxn tensor to nxm vector
        vector<vector<int>> result;
-        auto tensor_accessor = tensor.accessor<int, 2>();
-
-        // Iterate over columns and rows of the tensor
-        for (int j = 0; j < tensor.size(1); ++j) {
-            vector<int> column;
-            for (int i = 0; i < tensor.size(0); ++i) {
-                column.push_back(tensor_accessor[i][j]);
-            }
-            result.push_back(column);
+        // Iterate over cols
+        for (int i = 0; i < tensor.size(1); ++i) {
+            auto col_tensor = tensor.index({ "...", i });
+            auto col = vector<int>(col_tensor.data_ptr<int>(), col_tensor.data_ptr<int>() + tensor.size(0));
+            result.push_back(col);
        }
-
        return result;
    }
 }
--- a/src/BayesNet/bayesnetUtils.h
+++ b/src/BayesNet/bayesnetUtils.h
@@ -6,6 +6,6 @@ namespace bayesnet {
    using namespace std;
    using namespace torch;
    vector<int> argsort(vector<float>& nums);
-    vector<vector<int>> tensorToVector(const Tensor& tensor);
+    vector<vector<int>> tensorToVector(Tensor& tensor);
 }
 #endif //BAYESNET_UTILS_H
--- a/src/Platform/CMakeLists.txt
+++ b/src/Platform/CMakeLists.txt
@@ -1,4 +1,8 @@
 include_directories(${BayesNet_SOURCE_DIR}/src/BayesNet)
 include_directories(${BayesNet_SOURCE_DIR}/src/Platform)
-add_executable(main Experiment.cc ArffFiles.cc CPPFImdlp.cpp Metrics.cpp platformUtils.cc)
-target_link_libraries(main BayesNet "${TORCH_LIBRARIES}")
+include_directories(${BayesNet_SOURCE_DIR}/lib/Files)
+include_directories(${BayesNet_SOURCE_DIR}/lib/mdlp)
+include_directories(${BayesNet_SOURCE_DIR}/lib/argparse/include)
+include_directories(${BayesNet_SOURCE_DIR}/lib/json/include)
+add_executable(main main.cc Folding.cc platformUtils.cc Experiment.cc Datasets.cc Models.cc Report.cc)
+target_link_libraries(main BayesNet ArffFiles mdlp "${TORCH_LIBRARIES}")
--- a/src/Platform/CPPFImdlp.cpp
+++ b/src/Platform/CPPFImdlp.cpp
@@ -1,221 +0,0 @@
-#include <numeric>
-#include <algorithm>
-#include <set>
-#include <cmath>
-#include "CPPFImdlp.h"
-#include "Metrics.h"
-
-namespace mdlp {
-
-    CPPFImdlp::CPPFImdlp(size_t min_length_, int max_depth_, float proposed) : min_length(min_length_),
-        max_depth(max_depth_),
-        proposed_cuts(proposed)
-    {
-    }
-
-    CPPFImdlp::CPPFImdlp() = default;
-
-    CPPFImdlp::~CPPFImdlp() = default;
-
-    size_t CPPFImdlp::compute_max_num_cut_points() const
-    {
-        // Set the actual maximum number of cut points as a number or as a percentage of the number of samples
-        if (proposed_cuts == 0) {
-            return numeric_limits<size_t>::max();
-        }
-        if (proposed_cuts < 0 || proposed_cuts > static_cast<float>(X.size())) {
-            throw invalid_argument("wrong proposed num_cuts value");
-        }
-        if (proposed_cuts < 1)
-            return static_cast<size_t>(round(static_cast<float>(X.size()) * proposed_cuts));
-        return static_cast<size_t>(proposed_cuts);
-    }
-
-    void CPPFImdlp::fit(samples_t& X_, labels_t& y_)
-    {
-        X = X_;
-        y = y_;
-        num_cut_points = compute_max_num_cut_points();
-        depth = 0;
-        discretizedData.clear();
-        cutPoints.clear();
-        if (X.size() != y.size()) {
-            throw invalid_argument("X and y must have the same size");
-        }
-        if (X.empty() || y.empty()) {
-            throw invalid_argument("X and y must have at least one element");
-        }
-        if (min_length < 3) {
-            throw invalid_argument("min_length must be greater than 2");
-        }
-        if (max_depth < 1) {
-            throw invalid_argument("max_depth must be greater than 0");
-        }
-        indices = sortIndices(X_, y_);
-        metrics.setData(y, indices);
-        computeCutPoints(0, X.size(), 1);
-        sort(cutPoints.begin(), cutPoints.end());
-        if (num_cut_points > 0) {
-            // Select the best (with lower entropy) cut points
-            while (cutPoints.size() > num_cut_points) {
-                resizeCutPoints();
-            }
-        }
-    }
-
-    pair<precision_t, size_t> CPPFImdlp::valueCutPoint(size_t start, size_t cut, size_t end)
-    {
-        size_t n;
-        size_t m;
-        size_t idxPrev = cut - 1 >= start ? cut - 1 : cut;
-        size_t idxNext = cut + 1 < end ? cut + 1 : cut;
-        bool backWall; // true if duplicates reach beginning of the interval
-        precision_t previous;
-        precision_t actual;
-        precision_t next;
-        previous = X[indices[idxPrev]];
-        actual = X[indices[cut]];
-        next = X[indices[idxNext]];
-        // definition 2 of the paper => X[t-1] < X[t]
-        // get the first equal value of X in the interval
-        while (idxPrev > start && actual == previous) {
-            previous = X[indices[--idxPrev]];
-        }
-        backWall = idxPrev == start && actual == previous;
-        // get the last equal value of X in the interval
-        while (idxNext < end - 1 && actual == next) {
-            next = X[indices[++idxNext]];
-        }
-        // # of duplicates before cutpoint
-        n = cut - 1 - idxPrev;
-        // # of duplicates after cutpoint
-        m = idxNext - cut - 1;
-        // Decide which values to use
-        cut = cut + (backWall ? m + 1 : -n);
-        actual = X[indices[cut]];
-        return { (actual + previous) / 2, cut };
-    }
-
-    void CPPFImdlp::computeCutPoints(size_t start, size_t end, int depth_)
-    {
-        size_t cut;
-        pair<precision_t, size_t> result;
-        // Check if the interval length and the depth are Ok
-        if (end - start < min_length || depth_ > max_depth)
-            return;
-        depth = depth_ > depth ? depth_ : depth;
-        cut = getCandidate(start, end);
-        if (cut == numeric_limits<size_t>::max())
-            return;
-        if (mdlp(start, cut, end)) {
-            result = valueCutPoint(start, cut, end);
-            cut = result.second;
-            cutPoints.push_back(result.first);
-            computeCutPoints(start, cut, depth_ + 1);
-            computeCutPoints(cut, end, depth_ + 1);
-        }
-    }
-
-    size_t CPPFImdlp::getCandidate(size_t start, size_t end)
-    {
-        /* Definition 1: A binary discretization for A is determined by selecting the cut point TA for which
-        E(A, TA; S) is minimal amongst all the candidate cut points. */
-        size_t candidate = numeric_limits<size_t>::max();
-        size_t elements = end - start;
-        bool sameValues = true;
-        precision_t entropy_left;
-        precision_t entropy_right;
-        precision_t minEntropy;
-        // Check if all the values of the variable in the interval are the same
-        for (size_t idx = start + 1; idx < end; idx++) {
-            if (X[indices[idx]] != X[indices[start]]) {
-                sameValues = false;
-                break;
-            }
-        }
-        if (sameValues)
-            return candidate;
-        minEntropy = metrics.entropy(start, end);
-        for (size_t idx = start + 1; idx < end; idx++) {
-            // Cutpoints are always on boundaries (definition 2)
-            if (y[indices[idx]] == y[indices[idx - 1]])
-                continue;
-            entropy_left = precision_t(idx - start) / static_cast<precision_t>(elements) * metrics.entropy(start, idx);
-            entropy_right = precision_t(end - idx) / static_cast<precision_t>(elements) * metrics.entropy(idx, end);
-            if (entropy_left + entropy_right < minEntropy) {
-                minEntropy = entropy_left + entropy_right;
-                candidate = idx;
-            }
-        }
-        return candidate;
-    }
-
-    bool CPPFImdlp::mdlp(size_t start, size_t cut, size_t end)
-    {
-        int k;
-        int k1;
-        int k2;
-        precision_t ig;
-        precision_t delta;
-        precision_t ent;
-        precision_t ent1;
-        precision_t ent2;
-        auto N = precision_t(end - start);
-        k = metrics.computeNumClasses(start, end);
-        k1 = metrics.computeNumClasses(start, cut);
-        k2 = metrics.computeNumClasses(cut, end);
-        ent = metrics.entropy(start, end);
-        ent1 = metrics.entropy(start, cut);
-        ent2 = metrics.entropy(cut, end);
-        ig = metrics.informationGain(start, cut, end);
-        delta = static_cast<precision_t>(log2(pow(3, precision_t(k)) - 2) -
-            (precision_t(k) * ent - precision_t(k1) * ent1 - precision_t(k2) * ent2));
-        precision_t term = 1 / N * (log2(N - 1) + delta);
-        return ig > term;
-    }
-
-    // Argsort from https://stackoverflow.com/questions/1577475/c-sorting-and-keeping-track-of-indexes
-    indices_t CPPFImdlp::sortIndices(samples_t& X_, labels_t& y_)
-    {
-        indices_t idx(X_.size());
-        iota(idx.begin(), idx.end(), 0);
-        stable_sort(idx.begin(), idx.end(), [&X_, &y_](size_t i1, size_t i2) {
-            if (X_[i1] == X_[i2])
-                return y_[i1] < y_[i2];
-            else
-                return X_[i1] < X_[i2];
-            });
-        return idx;
-    }
-
-    void CPPFImdlp::resizeCutPoints()
-    {
-        //Compute entropy of each of the whole cutpoint set and discards the biggest value
-        precision_t maxEntropy = 0;
-        precision_t entropy;
-        size_t maxEntropyIdx = 0;
-        size_t begin = 0;
-        size_t end;
-        for (size_t idx = 0; idx < cutPoints.size(); idx++) {
-            end = begin;
-            while (X[indices[end]] < cutPoints[idx] && end < X.size())
-                end++;
-            entropy = metrics.entropy(begin, end);
-            if (entropy > maxEntropy) {
-                maxEntropy = entropy;
-                maxEntropyIdx = idx;
-            }
-            begin = end;
-        }
-        cutPoints.erase(cutPoints.begin() + static_cast<long>(maxEntropyIdx));
-    }
-    labels_t& CPPFImdlp::transform(const samples_t& data)
-    {
-        discretizedData.reserve(data.size());
-        for (const precision_t& item : data) {
-            auto upper = upper_bound(cutPoints.begin(), cutPoints.end(), item);
-            discretizedData.push_back(upper - cutPoints.begin());
-        }
-        return discretizedData;
-    }
-}
--- a/src/Platform/CPPFImdlp.h
+++ b/src/Platform/CPPFImdlp.h
@@ -1,45 +0,0 @@
-#ifndef CPPFIMDLP_H
-#define CPPFIMDLP_H
-
-#include "typesFImdlp.h"
-#include "Metrics.h"
-#include <limits>
-#include <utility>
-#include <string>
-
-namespace mdlp {
-    class CPPFImdlp {
-    protected:
-        size_t min_length = 3;
-        int depth = 0;
-        int max_depth = numeric_limits<int>::max();
-        float proposed_cuts = 0;
-        indices_t indices = indices_t();
-        samples_t X = samples_t();
-        labels_t y = labels_t();
-        Metrics metrics = Metrics(y, indices);
-        cutPoints_t cutPoints;
-        size_t num_cut_points = numeric_limits<size_t>::max();
-        labels_t discretizedData = labels_t();
-
-        static indices_t sortIndices(samples_t&, labels_t&);
-
-        void computeCutPoints(size_t, size_t, int);
-        void resizeCutPoints();
-        bool mdlp(size_t, size_t, size_t);
-        size_t getCandidate(size_t, size_t);
-        size_t compute_max_num_cut_points() const;
-        pair<precision_t, size_t> valueCutPoint(size_t, size_t, size_t);
-
-    public:
-        CPPFImdlp();
-        CPPFImdlp(size_t, int, float);
-        ~CPPFImdlp();
-        void fit(samples_t&, labels_t&);
-        inline cutPoints_t getCutPoints() const { return cutPoints; };
-        labels_t& transform(const samples_t&);
-        inline int get_depth() const { return depth; };
-        static inline string version() { return "1.1.2"; };
-    };
-}
-#endif
--- a/src/Platform/Datasets.cc
+++ b/src/Platform/Datasets.cc
@@ -0,0 +1,231 @@
+#include "Datasets.h"
+#include "platformUtils.h"
+#include "ArffFiles.h"
+namespace platform {
+    void Datasets::load()
+    {
+        ifstream catalog(path + "/all.txt");
+        if (catalog.is_open()) {
+            string line;
+            while (getline(catalog, line)) {
+                vector<string> tokens = split(line, ',');
+                string name = tokens[0];
+                string className = tokens[1];
+                datasets[name] = make_unique<Dataset>(path, name, className, discretize, fileType);
+            }
+            catalog.close();
+        } else {
+            throw invalid_argument("Unable to open catalog file. [" + path + "/all.txt" + "]");
+        }
+    }
+    vector<string> Datasets::getNames()
+    {
+        vector<string> result;
+        transform(datasets.begin(), datasets.end(), back_inserter(result), [](const auto& d) { return d.first; });
+        return result;
+    }
+    vector<string> Datasets::getFeatures(string name)
+    {
+        if (datasets[name]->isLoaded()) {
+            return datasets[name]->getFeatures();
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    map<string, vector<int>> Datasets::getStates(string name)
+    {
+        if (datasets[name]->isLoaded()) {
+            return datasets[name]->getStates();
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    string Datasets::getClassName(string name)
+    {
+        if (datasets[name]->isLoaded()) {
+            return datasets[name]->getClassName();
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    int Datasets::getNSamples(string name)
+    {
+        if (datasets[name]->isLoaded()) {
+            return datasets[name]->getNSamples();
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    pair<vector<vector<float>>&, vector<int>&> Datasets::getVectors(string name)
+    {
+        if (!datasets[name]->isLoaded()) {
+            datasets[name]->load();
+        }
+        return datasets[name]->getVectors();
+    }
+    pair<vector<vector<int>>&, vector<int>&> Datasets::getVectorsDiscretized(string name)
+    {
+        if (!datasets[name]->isLoaded()) {
+            datasets[name]->load();
+        }
+        return datasets[name]->getVectorsDiscretized();
+    }
+    pair<torch::Tensor&, torch::Tensor&> Datasets::getTensors(string name)
+    {
+        if (!datasets[name]->isLoaded()) {
+            datasets[name]->load();
+        }
+        return datasets[name]->getTensors();
+    }
+    bool Datasets::isDataset(const string& name)
+    {
+        return datasets.find(name) != datasets.end();
+    }
+    Dataset::Dataset(const Dataset& dataset) : path(dataset.path), name(dataset.name), className(dataset.className), n_samples(dataset.n_samples), n_features(dataset.n_features), features(dataset.features), states(dataset.states), loaded(dataset.loaded), discretize(dataset.discretize), X(dataset.X), y(dataset.y), Xv(dataset.Xv), Xd(dataset.Xd), yv(dataset.yv), fileType(dataset.fileType)
+    {
+    }
+    string Dataset::getName()
+    {
+        return name;
+    }
+    string Dataset::getClassName()
+    {
+        return className;
+    }
+    vector<string> Dataset::getFeatures()
+    {
+        if (loaded) {
+            return features;
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    int Dataset::getNFeatures()
+    {
+        if (loaded) {
+            return n_features;
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    int Dataset::getNSamples()
+    {
+        if (loaded) {
+            return n_samples;
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    map<string, vector<int>> Dataset::getStates()
+    {
+        if (loaded) {
+            return states;
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    pair<vector<vector<float>>&, vector<int>&> Dataset::getVectors()
+    {
+        if (loaded) {
+            return { Xv, yv };
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    pair<vector<vector<int>>&, vector<int>&> Dataset::getVectorsDiscretized()
+    {
+        if (loaded) {
+            return { Xd, yv };
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    pair<torch::Tensor&, torch::Tensor&> Dataset::getTensors()
+    {
+        if (loaded) {
+            buildTensors();
+            return { X, y };
+        } else {
+            throw invalid_argument("Dataset not loaded.");
+        }
+    }
+    void Dataset::load_csv()
+    {
+        ifstream file(path + "/" + name + ".csv");
+        if (file.is_open()) {
+            string line;
+            getline(file, line);
+            vector<string> tokens = split(line, ',');
+            features = vector<string>(tokens.begin(), tokens.end() - 1);
+            className = tokens.back();
+            for (auto i = 0; i < features.size(); ++i) {
+                Xv.push_back(vector<float>());
+            }
+            while (getline(file, line)) {
+                tokens = split(line, ',');
+                for (auto i = 0; i < features.size(); ++i) {
+                    Xv[i].push_back(stof(tokens[i]));
+                }
+                yv.push_back(stoi(tokens.back()));
+            }
+            file.close();
+        } else {
+            throw invalid_argument("Unable to open dataset file.");
+        }
+    }
+    void Dataset::computeStates()
+    {
+        for (int i = 0; i < features.size(); ++i) {
+            states[features[i]] = vector<int>(*max_element(Xd[i].begin(), Xd[i].end()) + 1);
+            iota(begin(states[features[i]]), end(states[features[i]]), 0);
+        }
+        states[className] = vector<int>(*max_element(yv.begin(), yv.end()) + 1);
+        iota(begin(states[className]), end(states[className]), 0);
+    }
+    void Dataset::load_arff()
+    {
+        auto arff = ArffFiles();
+        arff.load(path + "/" + name + ".arff", className);
+        // Get Dataset X, y
+        Xv = arff.getX();
+        yv = arff.getY();
+        // Get className & Features
+        className = arff.getClassName();
+        auto attributes = arff.getAttributes();
+        transform(attributes.begin(), attributes.end(), back_inserter(features), [](const auto& attribute) { return attribute.first; });
+    }
+    void Dataset::load()
+    {
+        if (loaded) {
+            return;
+        }
+        if (fileType == CSV) {
+            load_csv();
+        } else if (fileType == ARFF) {
+            load_arff();
+        }
+        if (discretize) {
+            Xd = discretizeDataset(Xv, yv);
+            computeStates();
+        }
+        n_samples = Xv[0].size();
+        n_features = Xv.size();
+        loaded = true;
+    }
+    void Dataset::buildTensors()
+    {
+        if (discretize) {
+            X = torch::zeros({ static_cast<int>(n_features), static_cast<int>(n_samples) }, torch::kInt32);
+        } else {
+            X = torch::zeros({ static_cast<int>(n_features), static_cast<int>(n_samples) }, torch::kFloat32);
+        }
+        for (int i = 0; i < features.size(); ++i) {
+            if (discretize) {
+                X.index_put_({ i,  "..." }, torch::tensor(Xd[i], torch::kInt32));
+            } else {
+                X.index_put_({ i,  "..." }, torch::tensor(Xv[i], torch::kFloat32));
+            }
+        }
+        y = torch::tensor(yv, torch::kInt32);
+    }
+}
--- a/src/Platform/Datasets.h
+++ b/src/Platform/Datasets.h
@@ -0,0 +1,65 @@
+#ifndef DATASETS_H
+#define DATASETS_H
+#include <torch/torch.h>
+#include <map>
+#include <vector>
+#include <string>
+namespace platform {
+    using namespace std;
+    enum fileType_t { CSV, ARFF };
+    class Dataset {
+    private:
+        string path;
+        string name;
+        fileType_t fileType;
+        string className;
+        int n_samples{ 0 }, n_features{ 0 };
+        vector<string> features;
+        map<string, vector<int>> states;
+        bool loaded;
+        bool discretize;
+        torch::Tensor X, y;
+        vector<vector<float>> Xv;
+        vector<vector<int>> Xd;
+        vector<int> yv;
+        void buildTensors();
+        void load_csv();
+        void load_arff();
+        void computeStates();
+    public:
+        Dataset(const string& path, const string& name, const string& className, bool discretize, fileType_t fileType) : path(path), name(name), className(className), discretize(discretize), loaded(false), fileType(fileType) {};
+        explicit Dataset(const Dataset&);
+        string getName();
+        string getClassName();
+        vector<string> getFeatures();
+        map<string, vector<int>> getStates();
+        pair<vector<vector<float>>&, vector<int>&> getVectors();
+        pair<vector<vector<int>>&, vector<int>&> getVectorsDiscretized();
+        pair<torch::Tensor&, torch::Tensor&> getTensors();
+        int getNFeatures();
+        int getNSamples();
+        void load();
+        const bool inline isLoaded() const { return loaded; };
+    };
+    class Datasets {
+    private:
+        string path;
+        fileType_t fileType;
+        map<string, unique_ptr<Dataset>> datasets;
+        bool discretize;
+        void load(); // Loads the list of datasets
+    public:
+        explicit Datasets(const string& path, bool discretize = false, fileType_t fileType = ARFF) : path(path), discretize(discretize), fileType(fileType) { load(); };
+        vector<string> getNames();
+        vector<string> getFeatures(string name);
+        int getNSamples(string name);
+        string getClassName(string name);
+        map<string, vector<int>> getStates(string name);
+        pair<vector<vector<float>>&, vector<int>&> getVectors(string name);
+        pair<vector<vector<int>>&, vector<int>&> getVectorsDiscretized(string name);
+        pair<torch::Tensor&, torch::Tensor&> getTensors(string name);
+        bool isDataset(const string& name);
+    };
+};
+
+#endif
--- a/src/Platform/DotEnv.h
+++ b/src/Platform/DotEnv.h
@@ -0,0 +1,62 @@
+#ifndef DOTENV_H
+#define DOTENV_H
+#include <string>
+#include <map>
+#include <fstream>
+#include <sstream>
+#include "platformUtils.h"
+namespace platform {
+    class DotEnv {
+    private:
+        std::map<std::string, std::string> env;
+        std::string trim(const std::string& str)
+        {
+            std::string result = str;
+            result.erase(result.begin(), std::find_if(result.begin(), result.end(), [](int ch) {
+                return !std::isspace(ch);
+                }));
+            result.erase(std::find_if(result.rbegin(), result.rend(), [](int ch) {
+                return !std::isspace(ch);
+                }).base(), result.end());
+            return result;
+        }
+    public:
+        DotEnv()
+        {
+            std::ifstream file(".env");
+            if (!file.is_open()) {
+                std::cerr << "File .env not found" << std::endl;
+                exit(1);
+            }
+            std::string line;
+            while (std::getline(file, line)) {
+                line = trim(line);
+                if (line.empty() || line[0] == '#') {
+                    continue;
+                }
+                std::istringstream iss(line);
+                std::string key, value;
+                if (std::getline(iss, key, '=') && std::getline(iss, value)) {
+                    env[key] = value;
+                }
+            }
+        }
+        std::string get(const std::string& key)
+        {
+            return env[key];
+        }
+        std::vector<int> getSeeds()
+        {
+            auto seeds = std::vector<int>();
+            auto seeds_str = env["seeds"];
+            seeds_str = trim(seeds_str);
+            seeds_str = seeds_str.substr(1, seeds_str.size() - 2);
+            auto seeds_str_split = split(seeds_str, ',');
+            transform(seeds_str_split.begin(), seeds_str_split.end(), back_inserter(seeds), [](const std::string& str) {
+                return stoi(str);
+                });
+            return seeds;
+        }
+    };
+}
+#endif
--- a/src/Platform/Experiment.cc
+++ b/src/Platform/Experiment.cc
@@ -1,201 +1,184 @@
-#include <iostream>
-#include <string>
-#include <torch/torch.h>
-#include <thread>
-#include <getopt.h>
-#include "ArffFiles.h"
-#include "Network.h"
-#include "Metrics.hpp"
-#include "CPPFImdlp.h"
-#include "KDB.h"
-#include "SPODE.h"
-#include "AODE.h"
-#include "TAN.h"
-#include "platformUtils.h"
+#include "Experiment.h"
+#include "Datasets.h"
+#include "Models.h"
+#include "Report.h"

+namespace platform {
+    using json = nlohmann::json;
+    string get_date()
+    {
+        time_t rawtime;
+        tm* timeinfo;
+        time(&rawtime);
+        timeinfo = std::localtime(&rawtime);
+        std::ostringstream oss;
+        oss << std::put_time(timeinfo, "%Y-%m-%d");
+        return oss.str();
+    }
+    string get_time()
+    {
+        time_t rawtime;
+        tm* timeinfo;
+        time(&rawtime);
+        timeinfo = std::localtime(&rawtime);
+        std::ostringstream oss;
+        oss << std::put_time(timeinfo, "%H:%M:%S");
+        return oss.str();
+    }
+    string Experiment::get_file_name()
+    {
+        string result = "results_" + score_name + "_" + model + "_" + platform + "_" + get_date() + "_" + get_time() + "_" + (stratified ? "1" : "0") + ".json";
+        return result;
+    }

-using namespace std;
+    json Experiment::build_json()
+    {
+        json result;
+        result["title"] = title;
+        result["date"] = get_date();
+        result["time"] = get_time();
+        result["model"] = model;
+        result["version"] = model_version;
+        result["platform"] = platform;
+        result["score_name"] = score_name;
+        result["language"] = language;
+        result["language_version"] = language_version;
+        result["discretized"] = discretized;
+        result["stratified"] = stratified;
+        result["folds"] = nfolds;
+        result["seeds"] = randomSeeds;
+        result["duration"] = duration;
+        result["results"] = json::array();
+        for (const auto& r : results) {
+            json j;
+            j["dataset"] = r.getDataset();
+            j["hyperparameters"] = r.getHyperparameters();
+            j["samples"] = r.getSamples();
+            j["features"] = r.getFeatures();
+            j["classes"] = r.getClasses();
+            j["score_train"] = r.getScoreTrain();
+            j["score_test"] = r.getScoreTest();
+            j["score"] = r.getScoreTest();
+            j["score_std"] = r.getScoreTestStd();
+            j["score_train_std"] = r.getScoreTrainStd();
+            j["score_test_std"] = r.getScoreTestStd();
+            j["train_time"] = r.getTrainTime();
+            j["train_time_std"] = r.getTrainTimeStd();
+            j["test_time"] = r.getTestTime();
+            j["test_time_std"] = r.getTestTimeStd();
+            j["time"] = r.getTestTime() + r.getTrainTime();
+            j["time_std"] = r.getTestTimeStd() + r.getTrainTimeStd();
+            j["scores_train"] = r.getScoresTrain();
+            j["scores_test"] = r.getScoresTest();
+            j["times_train"] = r.getTimesTrain();
+            j["times_test"] = r.getTimesTest();
+            j["nodes"] = r.getNodes();
+            j["leaves"] = r.getLeaves();
+            j["depth"] = r.getDepth();
+            result["results"].push_back(j);
+        }
+        return result;
+    }
+    void Experiment::save(const string& path)
+    {
+        json data = build_json();
+        ofstream file(path + "/" + get_file_name());
+        file << data;
+        file.close();
+    }

-/* print a description of all supported options */
-void usage(const char* path)
-{
-    /* take only the last portion of the path */
-    const char* basename = strrchr(path, '/');
-    basename = basename ? basename + 1 : path;
+    void Experiment::report()
+    {
+        json data = build_json();
+        Report report(data);
+        report.show();
+    }

-    cout << "usage: " << basename << "[OPTION]" << endl;
-    cout << "  -h, --help\t\t Print this help and exit." << endl;
-    cout
-        << "  -f, --file[=FILENAME]\t {diabetes, glass, iris, kdd_JapaneseVowels, letter, liver-disorders, mfeat-factors}."
-        << endl;
-    cout << "  -p, --path[=FILENAME]\t folder where the data files are located, default " << PATH << endl;
-    cout << "  -m, --model={AODE, KDB, SPODE, TAN}\t " << endl;
-}
+    void Experiment::show()
+    {
+        json data = build_json();
+        cout << data.dump(4) << endl;
+    }

-tuple<string, string, string> parse_arguments(int argc, char** argv)
-{
-    string file_name;
-    string model_name;
-    string path = PATH;
-    const vector<struct option> long_options = {
-            {"help",          no_argument,       nullptr, 'h'},
-            {"file",          required_argument, nullptr, 'f'},
-            {"path",          required_argument, nullptr, 'p'},
-            {"model",         required_argument, nullptr, 'm'},
-            {nullptr,         no_argument,       nullptr, 0}
-    };
-    while (true) {
-        const auto c = getopt_long(argc, argv, "hf:p:m:", long_options.data(), nullptr);
-        if (c == -1)
-            break;
-        switch (c) {
-            case 'h':
-                usage(argv[0]);
-                exit(0);
-            case 'f':
-                file_name = string(optarg);
-                break;
-            case 'm':
-                model_name = string(optarg);
-                break;
-            case 'p':
-                path = optarg;
-                if (path.back() != '/')
-                    path += '/';
-                break;
-            case '?':
-                usage(argv[0]);
-                exit(1);
-            default:
-                abort();
+    void Experiment::go(vector<string> filesToProcess, const string& path)
+    {
+        cout << "*** Starting experiment: " << title << " ***" << endl;
+        for (auto fileName : filesToProcess) {
+            cout << "- " << setw(20) << left << fileName << " " << right << flush;
+            cross_validation(path, fileName);
+            cout << endl;
        }
    }
-    if (file_name.empty()) {
-        usage(argv[0]);
-        exit(1);
-    }
-    return make_tuple(file_name, path, model_name);
-}

-inline constexpr auto hash_conv(const std::string_view sv)
-{
-    unsigned long hash{ 5381 };
-    for (unsigned char c : sv) {
-        hash = ((hash << 5) + hash) ^ c;
+    void Experiment::cross_validation(const string& path, const string& fileName)
+    {
+        auto datasets = platform::Datasets(path, discretized, platform::ARFF);
+        // Get dataset
+        auto [X, y] = datasets.getTensors(fileName);
+        auto states = datasets.getStates(fileName);
+        auto features = datasets.getFeatures(fileName);
+        auto samples = datasets.getNSamples(fileName);
+        auto className = datasets.getClassName(fileName);
+        cout << " (" << setw(5) << samples << "," << setw(3) << features.size() << ") " << flush;
+        // Prepare Result
+        auto result = Result();
+        auto [values, counts] = at::_unique(y);
+        result.setSamples(X.size(1)).setFeatures(X.size(0)).setClasses(values.size(0));
+        int nResults = nfolds * static_cast<int>(randomSeeds.size());
+        auto accuracy_test = torch::zeros({ nResults }, torch::kFloat64);
+        auto accuracy_train = torch::zeros({ nResults }, torch::kFloat64);
+        auto train_time = torch::zeros({ nResults }, torch::kFloat64);
+        auto test_time = torch::zeros({ nResults }, torch::kFloat64);
+        auto nodes = torch::zeros({ nResults }, torch::kFloat64);
+        auto edges = torch::zeros({ nResults }, torch::kFloat64);
+        auto num_states = torch::zeros({ nResults }, torch::kFloat64);
+        Timer train_timer, test_timer;
+        int item = 0;
+        for (auto seed : randomSeeds) {
+            cout << "(" << seed << ") doing Fold: " << flush;
+            Fold* fold;
+            if (stratified)
+                fold = new StratifiedKFold(nfolds, y, seed);
+            else
+                fold = new KFold(nfolds, y.size(0), seed);
+            for (int nfold = 0; nfold < nfolds; nfold++) {
+                auto clf = Models::instance()->create(model);
+                setModelVersion(clf->getVersion());
+                train_timer.start();
+                auto [train, test] = fold->getFold(nfold);
+                auto train_t = torch::tensor(train);
+                auto test_t = torch::tensor(test);
+                auto X_train = X.index({ "...", train_t });
+                auto y_train = y.index({ train_t });
+                auto X_test = X.index({ "...", test_t });
+                auto y_test = y.index({ test_t });
+                cout << nfold + 1 << ", " << flush;
+                clf->fit(X_train, y_train, features, className, states);
+                nodes[item] = clf->getNumberOfNodes();
+                edges[item] = clf->getNumberOfEdges();
+                num_states[item] = clf->getNumberOfStates();
+                train_time[item] = train_timer.getDuration();
+                auto accuracy_train_value = clf->score(X_train, y_train);
+                test_timer.start();
+                auto accuracy_test_value = clf->score(X_test, y_test);
+                test_time[item] = test_timer.getDuration();
+                accuracy_train[item] = accuracy_train_value;
+                accuracy_test[item] = accuracy_test_value;
+                // Store results and times in vector
+                result.addScoreTrain(accuracy_train_value);
+                result.addScoreTest(accuracy_test_value);
+                result.addTimeTrain(train_time[item].item<double>());
+                result.addTimeTest(test_time[item].item<double>());
+                item++;
+            }
+            cout << "end. " << flush;
+            delete fold;
+        }
+        result.setScoreTest(torch::mean(accuracy_test).item<double>()).setScoreTrain(torch::mean(accuracy_train).item<double>());
+        result.setScoreTestStd(torch::std(accuracy_test).item<double>()).setScoreTrainStd(torch::std(accuracy_train).item<double>());
+        result.setTrainTime(torch::mean(train_time).item<double>()).setTestTime(torch::mean(test_time).item<double>());
+        result.setNodes(torch::mean(nodes).item<double>()).setLeaves(torch::mean(edges).item<double>()).setDepth(torch::mean(num_states).item<double>());
+        result.setDataset(fileName);
+        addResult(result);
    }
-    return hash;
-}
-
-inline constexpr auto operator"" _sh(const char* str, size_t len)
-{
-    return hash_conv(std::string_view{ str, len });
-}
-
-
-
-tuple<string, string, string> get_options(int argc, char** argv)
-{
-    map<string, bool> datasets = {
-            {"diabetes",           true},
-            {"ecoli",              true},
-            {"glass",              true},
-            {"iris",               true},
-            {"kdd_JapaneseVowels", false},
-            {"letter",             true},
-            {"liver-disorders",    true},
-            {"mfeat-factors",      true},
-    };
-    vector <string> models = { "AODE", "KDB", "SPODE", "TAN" };
-    string file_name;
-    string path;
-    string model_name;
-    tie(file_name, path, model_name) = parse_arguments(argc, argv);
-    if (datasets.find(file_name) == datasets.end()) {
-        cout << "Invalid file name: " << file_name << endl;
-        usage(argv[0]);
-        exit(1);
-    }
-    if (!file_exists(path + file_name + ".arff")) {
-        cout << "Data File " << path + file_name + ".arff" << " does not exist" << endl;
-        usage(argv[0]);
-        exit(1);
-    }
-    if (find(models.begin(), models.end(), model_name) == models.end()) {
-        cout << "Invalid model name: " << model_name << endl;
-        usage(argv[0]);
-        exit(1);
-    }
-    return { file_name, path, model_name };
-}
-
-int main(int argc, char** argv)
-{
-    string file_name, path, model_name;
-    tie(file_name, path, model_name) = get_options(argc, argv);
-    auto handler = ArffFiles();
-    handler.load(path + file_name + ".arff");
-    // Get Dataset X, y
-    vector<mdlp::samples_t>& X = handler.getX();
-    mdlp::labels_t& y = handler.getY();
-    // Get className & Features
-    auto className = handler.getClassName();
-    vector<string> features;
-    for (auto feature : handler.getAttributes()) {
-        features.push_back(feature.first);
-    }
-    // Discretize Dataset
-    vector<mdlp::labels_t> Xd;
-    map<string, int> maxes;
-    tie(Xd, maxes) = discretize(X, y, features);
-    maxes[className] = *max_element(y.begin(), y.end()) + 1;
-    map<string, vector<int>> states;
-    for (auto feature : features) {
-        states[feature] = vector<int>(maxes[feature]);
-    }
-    states[className] = vector<int>(
-        maxes[className]);
-    double score;
-    vector<string> lines;
-    vector<string> graph;
-    auto kdb = bayesnet::KDB(2);
-    auto aode = bayesnet::AODE();
-    auto spode = bayesnet::SPODE(2);
-    auto tan = bayesnet::TAN();
-    switch (hash_conv(model_name)) {
-        case "AODE"_sh:
-            aode.fit(Xd, y, features, className, states);
-            lines = aode.show();
-            score = aode.score(Xd, y);
-            graph = aode.graph();
-            break;
-        case "KDB"_sh:
-            kdb.fit(Xd, y, features, className, states);
-            lines = kdb.show();
-            score = kdb.score(Xd, y);
-            graph = kdb.graph();
-            break;
-        case "SPODE"_sh:
-            spode.fit(Xd, y, features, className, states);
-            lines = spode.show();
-            score = spode.score(Xd, y);
-            graph = spode.graph();
-            break;
-        case "TAN"_sh:
-            tan.fit(Xd, y, features, className, states);
-            lines = tan.show();
-            score = tan.score(Xd, y);
-            graph = tan.graph();
-            break;
-    }
-    for (auto line : lines) {
-        cout << line << endl;
-    }
-    cout << "Score: " << score << endl;
-    auto dot_file = model_name + "_" + file_name;
-    ofstream file(dot_file + ".dot");
-    file << graph;
-    file.close();
-    cout << "Graph saved in " << model_name << "_" << file_name << ".dot" << endl;
-    cout << "dot -Tpng -o " + dot_file + ".png " + dot_file + ".dot " << endl;
-    return 0;
 }
--- a/src/Platform/Experiment.h
+++ b/src/Platform/Experiment.h
@@ -0,0 +1,114 @@
+#ifndef EXPERIMENT_H
+#define EXPERIMENT_H
+#include <torch/torch.h>
+#include <nlohmann/json.hpp>
+#include <string>
+#include <chrono>
+#include "Folding.h"
+#include "BaseClassifier.h"
+#include "TAN.h"
+#include "KDB.h"
+#include "AODE.h"
+
+using namespace std;
+namespace platform {
+    using json = nlohmann::json;
+    class Timer {
+    private:
+        chrono::high_resolution_clock::time_point begin;
+    public:
+        Timer() = default;
+        ~Timer() = default;
+        void start() { begin = chrono::high_resolution_clock::now(); }
+        double getDuration()
+        {
+            chrono::high_resolution_clock::time_point end = chrono::high_resolution_clock::now();
+            chrono::duration<double> time_span = chrono::duration_cast<chrono::duration<double>>(end - begin);
+            return time_span.count();
+        }
+    };
+    class Result {
+    private:
+        string dataset, hyperparameters, model_version;
+        int samples{ 0 }, features{ 0 }, classes{ 0 };
+        double score_train{ 0 }, score_test{ 0 }, score_train_std{ 0 }, score_test_std{ 0 }, train_time{ 0 }, train_time_std{ 0 }, test_time{ 0 }, test_time_std{ 0 };
+        float nodes{ 0 }, leaves{ 0 }, depth{ 0 };
+        vector<double> scores_train, scores_test, times_train, times_test;
+    public:
+        Result() = default;
+        Result& setDataset(const string& dataset) { this->dataset = dataset; return *this; }
+        Result& setHyperparameters(const string& hyperparameters) { this->hyperparameters = hyperparameters; return *this; }
+        Result& setSamples(int samples) { this->samples = samples; return *this; }
+        Result& setFeatures(int features) { this->features = features; return *this; }
+        Result& setClasses(int classes) { this->classes = classes; return *this; }
+        Result& setScoreTrain(double score) { this->score_train = score; return *this; }
+        Result& setScoreTest(double score) { this->score_test = score; return *this; }
+        Result& setScoreTrainStd(double score_std) { this->score_train_std = score_std; return *this; }
+        Result& setScoreTestStd(double score_std) { this->score_test_std = score_std; return *this; }
+        Result& setTrainTime(double train_time) { this->train_time = train_time; return *this; }
+        Result& setTrainTimeStd(double train_time_std) { this->train_time_std = train_time_std; return *this; }
+        Result& setTestTime(double test_time) { this->test_time = test_time; return *this; }
+        Result& setTestTimeStd(double test_time_std) { this->test_time_std = test_time_std; return *this; }
+        Result& setNodes(float nodes) { this->nodes = nodes; return *this; }
+        Result& setLeaves(float leaves) { this->leaves = leaves; return *this; }
+        Result& setDepth(float depth) { this->depth = depth; return *this; }
+        Result& addScoreTrain(double score) { scores_train.push_back(score); return *this; }
+        Result& addScoreTest(double score) { scores_test.push_back(score); return *this; }
+        Result& addTimeTrain(double time) { times_train.push_back(time); return *this; }
+        Result& addTimeTest(double time) { times_test.push_back(time); return *this; }
+        const float get_score_train() const { return score_train; }
+        float get_score_test() { return score_test; }
+        const string& getDataset() const { return dataset; }
+        const string& getHyperparameters() const { return hyperparameters; }
+        const int getSamples() const { return samples; }
+        const int getFeatures() const { return features; }
+        const int getClasses() const { return classes; }
+        const double getScoreTrain() const { return score_train; }
+        const double getScoreTest() const { return score_test; }
+        const double getScoreTrainStd() const { return score_train_std; }
+        const double getScoreTestStd() const { return score_test_std; }
+        const double getTrainTime() const { return train_time; }
+        const double getTrainTimeStd() const { return train_time_std; }
+        const double getTestTime() const { return test_time; }
+        const double getTestTimeStd() const { return test_time_std; }
+        const float getNodes() const { return nodes; }
+        const float getLeaves() const { return leaves; }
+        const float getDepth() const { return depth; }
+        const vector<double>& getScoresTrain() const { return scores_train; }
+        const vector<double>& getScoresTest() const { return scores_test; }
+        const vector<double>& getTimesTrain() const { return times_train; }
+        const vector<double>& getTimesTest() const { return times_test; }
+    };
+    class Experiment {
+    private:
+        string title, model, platform, score_name, model_version, language_version, language;
+        bool discretized{ false }, stratified{ false };
+        vector<Result> results;
+        vector<int> randomSeeds;
+        int nfolds{ 0 };
+        float duration{ 0 };
+        json build_json();
+    public:
+        Experiment() = default;
+        Experiment& setTitle(const string& title) { this->title = title; return *this; }
+        Experiment& setModel(const string& model) { this->model = model; return *this; }
+        Experiment& setPlatform(const string& platform) { this->platform = platform; return *this; }
+        Experiment& setScoreName(const string& score_name) { this->score_name = score_name; return *this; }
+        Experiment& setModelVersion(const string& model_version) { this->model_version = model_version; return *this; }
+        Experiment& setLanguage(const string& language) { this->language = language; return *this; }
+        Experiment& setLanguageVersion(const string& language_version) { this->language_version = language_version; return *this; }
+        Experiment& setDiscretized(bool discretized) { this->discretized = discretized; return *this; }
+        Experiment& setStratified(bool stratified) { this->stratified = stratified; return *this; }
+        Experiment& setNFolds(int nfolds) { this->nfolds = nfolds; return *this; }
+        Experiment& addResult(Result result) { results.push_back(result); return *this; }
+        Experiment& addRandomSeed(int randomSeed) { randomSeeds.push_back(randomSeed); return *this; }
+        Experiment& setDuration(float duration) { this->duration = duration; return *this; }
+        string get_file_name();
+        void save(const string& path);
+        void cross_validation(const string& path, const string& fileName);
+        void go(vector<string> filesToProcess, const string& path);
+        void show();
+        void report();
+    };
+}
+#endif
--- a/src/Platform/Folding.cc
+++ b/src/Platform/Folding.cc
@@ -0,0 +1,95 @@
+#include "Folding.h"
+#include <algorithm>
+#include <map>
+Fold::Fold(int k, int n, int seed) : k(k), n(n), seed(seed)
+{
+    random_device rd;
+    random_seed = default_random_engine(seed == -1 ? rd() : seed);
+    srand(seed == -1 ? time(0) : seed);
+}
+KFold::KFold(int k, int n, int seed) : Fold(k, n, seed), indices(vector<int>(n))
+{
+    iota(begin(indices), end(indices), 0); // fill with 0, 1, ..., n - 1
+    shuffle(indices.begin(), indices.end(), random_seed);
+}
+pair<vector<int>, vector<int>> KFold::getFold(int nFold)
+{
+    if (nFold >= k || nFold < 0) {
+        throw out_of_range("nFold (" + to_string(nFold) + ") must be less than k (" + to_string(k) + ")");
+    }
+    int nTest = n / k;
+    auto train = vector<int>();
+    auto test = vector<int>();
+    for (int i = 0; i < n; i++) {
+        if (i >= nTest * nFold && i < nTest * (nFold + 1)) {
+            test.push_back(indices[i]);
+        } else {
+            train.push_back(indices[i]);
+        }
+    }
+    return { train, test };
+}
+StratifiedKFold::StratifiedKFold(int k, torch::Tensor& y, int seed) : Fold(k, y.numel(), seed)
+{
+    n = y.numel();
+    this->y = vector<int>(y.data_ptr<int>(), y.data_ptr<int>() + n);
+    build();
+}
+StratifiedKFold::StratifiedKFold(int k, const vector<int>& y, int seed)
+    : Fold(k, y.size(), seed)
+{
+    this->y = y;
+    n = y.size();
+    build();
+}
+void StratifiedKFold::build()
+{
+    stratified_indices = vector<vector<int>>(k);
+    int fold_size = n / k;
+    // Compute class counts and indices
+    auto class_indices = map<int, vector<int>>();
+    vector<int> class_counts(*max_element(y.begin(), y.end()) + 1, 0);
+    for (auto i = 0; i < n; ++i) {
+        class_counts[y[i]]++;
+        class_indices[y[i]].push_back(i);
+    }
+    // Shuffle class indices
+    for (auto& [cls, indices] : class_indices) {
+        shuffle(indices.begin(), indices.end(), random_seed);
+    }
+    // Assign indices to folds
+    for (auto label = 0; label < class_counts.size(); ++label) {
+        auto num_samples_to_take = class_counts[label] / k;
+        if (num_samples_to_take == 0)
+            continue;
+        auto remainder_samples_to_take = class_counts[label] % k;
+        for (auto fold = 0; fold < k; ++fold) {
+            auto it = next(class_indices[label].begin(), num_samples_to_take);
+            move(class_indices[label].begin(), it, back_inserter(stratified_indices[fold]));  // ##
+            class_indices[label].erase(class_indices[label].begin(), it);
+        }
+        while (remainder_samples_to_take > 0) {
+            int fold = (rand() % static_cast<int>(k));
+            if (stratified_indices[fold].size() == fold_size + 1) {
+                continue;
+            }
+            auto it = next(class_indices[label].begin(), 1);
+            stratified_indices[fold].push_back(*class_indices[label].begin());
+            class_indices[label].erase(class_indices[label].begin(), it);
+            remainder_samples_to_take--;
+        }
+    }
+}
+pair<vector<int>, vector<int>> StratifiedKFold::getFold(int nFold)
+{
+    if (nFold >= k || nFold < 0) {
+        throw out_of_range("nFold (" + to_string(nFold) + ") must be less than k (" + to_string(k) + ")");
+    }
+    vector<int> test_indices = stratified_indices[nFold];
+    vector<int> train_indices;
+    for (int i = 0; i < k; ++i) {
+        if (i == nFold) continue;
+        train_indices.insert(train_indices.end(), stratified_indices[i].begin(), stratified_indices[i].end());
+    }
+    return { train_indices, test_indices };
+}
--- a/src/Platform/Folding.h
+++ b/src/Platform/Folding.h
@@ -0,0 +1,37 @@
+#ifndef FOLDING_H
+#define FOLDING_H
+#include <torch/torch.h>
+#include <vector>
+#include <random> 
+using namespace std;
+
+class Fold {
+protected:
+    int k;
+    int n;
+    int seed;
+    default_random_engine random_seed;
+public:
+    Fold(int k, int n, int seed = -1);
+    virtual pair<vector<int>, vector<int>> getFold(int nFold) = 0;
+    virtual ~Fold() = default;
+    int getNumberOfFolds() { return k; }
+};
+class KFold : public Fold {
+private:
+    vector<int> indices;
+public:
+    KFold(int k, int n, int seed = -1);
+    pair<vector<int>, vector<int>> getFold(int nFold) override;
+};
+class StratifiedKFold : public Fold {
+private:
+    vector<int> y;
+    vector<vector<int>> stratified_indices;
+    void build();
+public:
+    StratifiedKFold(int k, const vector<int>& y, int seed = -1);
+    StratifiedKFold(int k, torch::Tensor& y, int seed = -1);
+    pair<vector<int>, vector<int>> getFold(int nFold) override;
+};
+#endif
--- a/src/Platform/Metrics.cpp
+++ b/src/Platform/Metrics.cpp
@@ -1,78 +0,0 @@
-#include "Metrics.h"
-#include <set>
-#include <cmath>
-
-using namespace std;
-namespace mdlp {
-    Metrics::Metrics(labels_t& y_, indices_t& indices_): y(y_), indices(indices_),
-        numClasses(computeNumClasses(0, indices.size()))
-    {
-    }
-
-    int Metrics::computeNumClasses(size_t start, size_t end)
-    {
-        set<int> nClasses;
-        for (auto i = start; i < end; ++i) {
-            nClasses.insert(y[indices[i]]);
-        }
-        return static_cast<int>(nClasses.size());
-    }
-
-    void Metrics::setData(const labels_t& y_, const indices_t& indices_)
-    {
-        indices = indices_;
-        y = y_;
-        numClasses = computeNumClasses(0, indices.size());
-        entropyCache.clear();
-        igCache.clear();
-    }
-
-    precision_t Metrics::entropy(size_t start, size_t end)
-    {
-        precision_t p;
-        precision_t ventropy = 0;
-        int nElements = 0;
-        labels_t counts(numClasses + 1, 0);
-        if (end - start < 2)
-            return 0;
-        if (entropyCache.find({ start, end }) != entropyCache.end()) {
-            return entropyCache[{start, end}];
-        }
-        for (auto i = &indices[start]; i != &indices[end]; ++i) {
-            counts[y[*i]]++;
-            nElements++;
-        }
-        for (auto count : counts) {
-            if (count > 0) {
-                p = static_cast<precision_t>(count) / static_cast<precision_t>(nElements);
-                ventropy -= p * log2(p);
-            }
-        }
-        entropyCache[{start, end}] = ventropy;
-        return ventropy;
-    }
-
-    precision_t Metrics::informationGain(size_t start, size_t cut, size_t end)
-    {
-        precision_t iGain;
-        precision_t entropyInterval;
-        precision_t entropyLeft;
-        precision_t entropyRight;
-        size_t nElementsLeft = cut - start;
-        size_t nElementsRight = end - cut;
-        size_t nElements = end - start;
-        if (igCache.find(make_tuple(start, cut, end)) != igCache.end()) {
-            return igCache[make_tuple(start, cut, end)];
-        }
-        entropyInterval = entropy(start, end);
-        entropyLeft = entropy(start, cut);
-        entropyRight = entropy(cut, end);
-        iGain = entropyInterval -
-            (static_cast<precision_t>(nElementsLeft) * entropyLeft +
-                static_cast<precision_t>(nElementsRight) * entropyRight) /
-            static_cast<precision_t>(nElements);
-        igCache[make_tuple(start, cut, end)] = iGain;
-        return iGain;
-    }
-
-}
--- a/src/Platform/Metrics.h
+++ b/src/Platform/Metrics.h
@@ -1,22 +0,0 @@
-#ifndef CCMETRICS_H
-#define CCMETRICS_H
-
-#include "typesFImdlp.h"
-
-namespace mdlp {
-    class Metrics {
-    protected:
-        labels_t& y;
-        indices_t& indices;
-        int numClasses;
-        cacheEnt_t entropyCache = cacheEnt_t();
-        cacheIg_t igCache = cacheIg_t();
-    public:
-        Metrics(labels_t&, indices_t&);
-        void setData(const labels_t&, const indices_t&);
-        int computeNumClasses(size_t, size_t);
-        precision_t entropy(size_t, size_t);
-        precision_t informationGain(size_t, size_t, size_t);
-    };
-}
-#endif
--- a/src/Platform/Models.cc
+++ b/src/Platform/Models.cc
@@ -0,0 +1,54 @@
+#include "Models.h"
+namespace platform {
+    using namespace std;
+    // Idea from: https://www.codeproject.com/Articles/567242/AplusC-2b-2bplusObjectplusFactory
+    Models* Models::factory = nullptr;;
+    Models* Models::instance()
+    {
+        //manages singleton
+        if (factory == nullptr)
+            factory = new Models();
+        return factory;
+    }
+    void Models::registerFactoryFunction(const string& name,
+        function<bayesnet::BaseClassifier* (void)> classFactoryFunction)
+    {
+        // register the class factory function
+        functionRegistry[name] = classFactoryFunction;
+    }
+    shared_ptr<bayesnet::BaseClassifier> Models::create(const string& name)
+    {
+        bayesnet::BaseClassifier* instance = nullptr;
+
+        // find name in the registry and call factory method.
+        auto it = functionRegistry.find(name);
+        if (it != functionRegistry.end())
+            instance = it->second();
+        // wrap instance in a shared ptr and return
+        if (instance != nullptr)
+            return shared_ptr<bayesnet::BaseClassifier>(instance);
+        else
+            return nullptr;
+    }
+    vector<string> Models::getNames()
+    {
+        vector<string> names;
+        transform(functionRegistry.begin(), functionRegistry.end(), back_inserter(names),
+            [](const pair<string, function<bayesnet::BaseClassifier* (void)>>& pair) { return pair.first; });
+        return names;
+    }
+    string Models::toString()
+    {
+        string result = "";
+        for (const auto& pair : functionRegistry) {
+            result += pair.first + ", ";
+        }
+        return "{" + result.substr(0, result.size() - 2) + "}";
+    }
+
+    Registrar::Registrar(const string& name, function<bayesnet::BaseClassifier* (void)> classFactoryFunction)
+    {
+        // register the class factory function 
+        Models::instance()->registerFactoryFunction(name, classFactoryFunction);
+    }
+}
--- a/src/Platform/Models.h
+++ b/src/Platform/Models.h
@@ -0,0 +1,36 @@
+#ifndef MODELS_H
+#define MODELS_H
+#include <map>
+#include "BaseClassifier.h"
+#include "AODE.h"
+#include "TAN.h"
+#include "KDB.h"
+#include "SPODE.h"
+#include "TANLd.h"
+#include "KDBLd.h"
+#include "SPODELd.h"
+#include "AODELd.h"
+namespace platform {
+    class Models {
+    private:
+        map<string, function<bayesnet::BaseClassifier* (void)>> functionRegistry;
+        static Models* factory; //singleton
+        Models() {};
+    public:
+        Models(Models&) = delete;
+        void operator=(const Models&) = delete;
+        // Idea from: https://www.codeproject.com/Articles/567242/AplusC-2b-2bplusObjectplusFactory
+        static Models* instance();
+        shared_ptr<bayesnet::BaseClassifier> create(const string& name);
+        void registerFactoryFunction(const string& name,
+            function<bayesnet::BaseClassifier* (void)> classFactoryFunction);
+        vector<string> getNames();
+        string toString();
+
+    };
+    class Registrar {
+    public:
+        Registrar(const string& className, function<bayesnet::BaseClassifier* (void)> classFactoryFunction);
+    };
+}
+#endif
--- a/src/Platform/Report.cc
+++ b/src/Platform/Report.cc
@@ -0,0 +1,66 @@
+#include "Report.h"
+
+namespace platform {
+    string headerLine(const string& text)
+    {
+        int n = MAXL - text.length() - 3;
+        return "* " + text + string(n, ' ') + "*\n";
+    }
+    string Report::fromVector(const string& key)
+    {
+        string result = "";
+
+        for (auto& item : data[key]) {
+            result += to_string(item) + ", ";
+        }
+        return "[" + result.substr(0, result.length() - 2) + "]";
+    }
+    string fVector(const json& data)
+    {
+        string result = "";
+        for (const auto& item : data) {
+            result += to_string(item) + ", ";
+        }
+        return "[" + result.substr(0, result.length() - 2) + "]";
+    }
+    void Report::show()
+    {
+        header();
+        body();
+    }
+    void Report::header()
+    {
+        cout << string(MAXL, '*') << endl;
+        cout << headerLine("Report " + data["model"].get<string>() + " ver. " + data["version"].get<string>() + " with " + to_string(data["folds"].get<int>()) + " Folds cross validation and " + to_string(data["seeds"].size()) + " random seeds. " + data["date"].get<string>() + " " + data["time"].get<string>());
+        cout << headerLine(data["title"].get<string>());
+        cout << headerLine("Random seeds: " + fromVector("seeds") + " Stratified: " + (data["stratified"].get<bool>() ? "True" : "False"));
+        cout << headerLine("Execution took  " + to_string(data["duration"].get<float>()) + " seconds,   " + to_string(data["duration"].get<float>() / 3600) + " hours, on " + data["platform"].get<string>());
+        cout << headerLine("Score is " + data["score_name"].get<string>());
+        cout << string(MAXL, '*') << endl;
+        cout << endl;
+    }
+    void Report::body()
+    {
+        cout << "Dataset                        Sampl. Feat. Cls Nodes   Edges   States  Score           Time              Hyperparameters" << endl;
+        cout << "============================== ====== ===== === ======= ======= ======= =============== ================= ===============" << endl;
+        for (const auto& r : data["results"]) {
+            cout << setw(30) << left << r["dataset"].get<string>() << " ";
+            cout << setw(6) << right << r["samples"].get<int>() << " ";
+            cout << setw(5) << right << r["features"].get<int>() << " ";
+            cout << setw(3) << right << r["classes"].get<int>() << " ";
+            cout << setw(7) << setprecision(2) << fixed << r["nodes"].get<float>() << " ";
+            cout << setw(7) << setprecision(2) << fixed << r["leaves"].get<float>() << " ";
+            cout << setw(7) << setprecision(2) << fixed << r["depth"].get<float>() << " ";
+            cout << setw(8) << right << setprecision(6) << fixed << r["score_test"].get<double>() << "±" << setw(6) << setprecision(4) << fixed << r["score_test_std"].get<double>() << " ";
+            cout << setw(10) << right << setprecision(6) << fixed << r["test_time"].get<double>() << "±" << setw(6) << setprecision(4) << fixed << r["test_time_std"].get<double>() << " ";
+            cout << " " << r["hyperparameters"].get<string>();
+            cout << endl;
+            cout << string(MAXL, '*') << endl;
+            cout << headerLine("Train scores: " + fVector(r["scores_train"]));
+            cout << headerLine("Test  scores: " + fVector(r["scores_test"]));
+            cout << headerLine("Train  times: " + fVector(r["times_train"]));
+            cout << headerLine("Test   times: " + fVector(r["times_test"]));
+            cout << string(MAXL, '*') << endl;
+        }
+    }
+}
--- a/src/Platform/Report.h
+++ b/src/Platform/Report.h
@@ -0,0 +1,23 @@
+#ifndef REPORT_H
+#define REPORT_H
+#include <string>
+#include <iostream>
+#include <nlohmann/json.hpp>
+
+using json = nlohmann::json;
+const int MAXL = 121;
+namespace platform {
+    using namespace std;
+    class Report {
+    public:
+        explicit Report(json data_) { data = data_; };
+        virtual ~Report() = default;
+        void show();
+    private:
+        void header();
+        void body();
+        string fromVector(const string& key);
+        json data;
+    };
+};
+#endif
--- a/src/Platform/main.cc
+++ b/src/Platform/main.cc
@@ -0,0 +1,123 @@
+#include <iostream>
+#include <argparse/argparse.hpp>
+#include "platformUtils.h"
+#include "Experiment.h"
+#include "Datasets.h"
+#include "DotEnv.h"
+#include "Models.h"
+#include "modelRegister.h"
+
+using namespace std;
+const string PATH_RESULTS = "results";
+const string PATH_DATASETS = "datasets";
+
+argparse::ArgumentParser manageArguments(int argc, char** argv)
+{
+    auto env = platform::DotEnv();
+    argparse::ArgumentParser program("BayesNetSample");
+    program.add_argument("-d", "--dataset").default_value("").help("Dataset file name");
+    program.add_argument("-p", "--path")
+        .help("folder where the data files are located, default")
+        .default_value(string{ PATH_DATASETS }
+    );
+    program.add_argument("-m", "--model")
+        .help("Model to use " + platform::Models::instance()->toString())
+        .action([](const std::string& value) {
+        static const vector<string> choices = platform::Models::instance()->getNames();
+        if (find(choices.begin(), choices.end(), value) != choices.end()) {
+            return value;
+        }
+        throw runtime_error("Model must be one of " + platform::Models::instance()->toString());
+            }
+    );
+    program.add_argument("--title").default_value("").help("Experiment title");
+    program.add_argument("--discretize").help("Discretize input dataset").default_value((bool)stoi(env.get("discretize"))).implicit_value(true);
+    program.add_argument("--stratified").help("If Stratified KFold is to be done").default_value((bool)stoi(env.get("stratified"))).implicit_value(true);
+    program.add_argument("-f", "--folds").help("Number of folds").default_value(stoi(env.get("n_folds"))).scan<'i', int>().action([](const string& value) {
+        try {
+            auto k = stoi(value);
+            if (k < 2) {
+                throw runtime_error("Number of folds must be greater than 1");
+            }
+            return k;
+        }
+        catch (const runtime_error& err) {
+            throw runtime_error(err.what());
+        }
+        catch (...) {
+            throw runtime_error("Number of folds must be an integer");
+        }});
+    auto seed_values = env.getSeeds();
+    program.add_argument("-s", "--seeds").nargs(1, 10).help("Random seeds. Set to -1 to have pseudo random").scan<'i', int>().default_value(seed_values);
+    try {
+        program.parse_args(argc, argv);
+        auto file_name = program.get<string>("dataset");
+        auto path = program.get<string>("path");
+        auto model_name = program.get<string>("model");
+        auto discretize_dataset = program.get<bool>("discretize");
+        auto stratified = program.get<bool>("stratified");
+        auto n_folds = program.get<int>("folds");
+        auto seeds = program.get<vector<int>>("seeds");
+        auto complete_file_name = path + file_name + ".arff";
+        auto title = program.get<string>("title");
+        if (title == "" && file_name == "") {
+            throw runtime_error("title is mandatory if dataset is not provided");
+        }
+    }
+    catch (const exception& err) {
+        cerr << err.what() << endl;
+        cerr << program;
+        exit(1);
+    }
+    return program;
+}
+
+int main(int argc, char** argv)
+{
+    auto program = manageArguments(argc, argv);
+    bool saveResults = false;
+    auto file_name = program.get<string>("dataset");
+    auto path = program.get<string>("path");
+    auto model_name = program.get<string>("model");
+    auto discretize_dataset = program.get<bool>("discretize");
+    auto stratified = program.get<bool>("stratified");
+    auto n_folds = program.get<int>("folds");
+    auto seeds = program.get<vector<int>>("seeds");
+    vector<string> filesToTest;
+    auto datasets = platform::Datasets(path, true, platform::ARFF);
+    auto title = program.get<string>("title");
+    if (file_name != "") {
+        if (!datasets.isDataset(file_name)) {
+            cerr << "Dataset " << file_name << " not found" << endl;
+            exit(1);
+        }
+        if (title == "") {
+            title = "Test " + file_name + " " + model_name + " " + to_string(n_folds) + " folds";
+        }
+        filesToTest.push_back(file_name);
+    } else {
+        filesToTest = platform::Datasets(path, true, platform::ARFF).getNames();
+        saveResults = true;
+    }
+    /*
+    * Begin Processing
+    */
+    auto env = platform::DotEnv();
+    auto experiment = platform::Experiment();
+    experiment.setTitle(title).setLanguage("cpp").setLanguageVersion("1.0.0");
+    experiment.setDiscretized(discretize_dataset).setModel(model_name).setPlatform(env.get("platform"));
+    experiment.setStratified(stratified).setNFolds(n_folds).setScoreName("accuracy");
+    for (auto seed : seeds) {
+        experiment.addRandomSeed(seed);
+    }
+    platform::Timer timer;
+    timer.start();
+    experiment.go(filesToTest, path);
+    experiment.setDuration(timer.getDuration());
+    if (saveResults)
+        experiment.save(PATH_RESULTS);
+    else
+        experiment.report();
+    cout << "Done!" << endl;
+    return 0;
+}
--- a/src/Platform/modelRegister.h
+++ b/src/Platform/modelRegister.h
@@ -0,0 +1,19 @@
+#ifndef MODEL_REGISTER_H
+#define MODEL_REGISTER_H
+static platform::Registrar registrarT("TAN",
+    [](void) -> bayesnet::BaseClassifier* { return new bayesnet::TAN();});
+static platform::Registrar registrarTLD("TANLd",
+    [](void) -> bayesnet::BaseClassifier* { return new bayesnet::TANLd();});
+static platform::Registrar registrarS("SPODE",
+    [](void) -> bayesnet::BaseClassifier* { return new bayesnet::SPODE(2);});
+static platform::Registrar registrarSLD("SPODELd",
+    [](void) -> bayesnet::BaseClassifier* { return new bayesnet::SPODELd(2);});
+static platform::Registrar registrarK("KDB",
+    [](void) -> bayesnet::BaseClassifier* { return new bayesnet::KDB(2);});
+static platform::Registrar registrarKLD("KDBLd",
+    [](void) -> bayesnet::BaseClassifier* { return new bayesnet::KDBLd(2);});
+static platform::Registrar registrarA("AODE",
+    [](void) -> bayesnet::BaseClassifier* { return new bayesnet::AODE();});
+static platform::Registrar registrarALD("AODELd",
+    [](void) -> bayesnet::BaseClassifier* { return new bayesnet::AODELd();});
+#endif
--- a/src/Platform/platformUtils.cc
+++ b/src/Platform/platformUtils.cc
@@ -1,5 +1,18 @@
 #include "platformUtils.h"

+using namespace torch;
+
+vector<string> split(const string& text, char delimiter)
+{
+    vector<string> result;
+    stringstream ss(text);
+    string token;
+    while (getline(ss, token, delimiter)) {
+        result.push_back(token);
+    }
+    return result;
+}
+
 pair<vector<mdlp::labels_t>, map<string, int>> discretize(vector<mdlp::samples_t>& X, mdlp::labels_t& y, vector<string> features)
 {
    vector<mdlp::labels_t> Xd;
@@ -14,7 +27,19 @@ pair<vector<mdlp::labels_t>, map<string, int>> discretize(vector<mdlp::samples_t
    return { Xd, maxes };
 }

-bool file_exists(const std::string& name)
+vector<mdlp::labels_t> discretizeDataset(vector<mdlp::samples_t>& X, mdlp::labels_t& y)
+{
+    vector<mdlp::labels_t> Xd;
+    auto fimdlp = mdlp::CPPFImdlp();
+    for (int i = 0; i < X.size(); i++) {
+        fimdlp.fit(X[i], y);
+        mdlp::labels_t& xd = fimdlp.transform(X[i]);
+        Xd.push_back(xd);
+    }
+    return Xd;
+}
+
+bool file_exists(const string& name)
 {
    if (FILE* file = fopen(name.c_str(), "r")) {
        fclose(file);
@@ -24,7 +49,40 @@ bool file_exists(const std::string& name)
    }
 }

-tuple<vector<vector<int>>, vector<int>, vector<string>, string, map<string, vector<int>>> loadFile(string name)
+tuple<Tensor, Tensor, vector<string>, string, map<string, vector<int>>> loadDataset(const string& path, const string& name, bool class_last, bool discretize_dataset)
+{
+    auto handler = ArffFiles();
+    handler.load(path + static_cast<string>(name) + ".arff", class_last);
+    // Get Dataset X, y
+    vector<mdlp::samples_t>& X = handler.getX();
+    mdlp::labels_t& y = handler.getY();
+    // Get className & Features
+    auto className = handler.getClassName();
+    vector<string> features;
+    auto attributes = handler.getAttributes();
+    transform(attributes.begin(), attributes.end(), back_inserter(features), [](const auto& pair) { return pair.first; });
+    Tensor Xd;
+    auto states = map<string, vector<int>>();
+    if (discretize_dataset) {
+        auto Xr = discretizeDataset(X, y);
+        Xd = torch::zeros({ static_cast<int>(Xr[0].size()), static_cast<int>(Xr.size()) }, torch::kInt32);
+        for (int i = 0; i < features.size(); ++i) {
+            states[features[i]] = vector<int>(*max_element(Xr[i].begin(), Xr[i].end()) + 1);
+            iota(begin(states[features[i]]), end(states[features[i]]), 0);
+            Xd.index_put_({ "...", i }, torch::tensor(Xr[i], torch::kInt32));
+        }
+        states[className] = vector<int>(*max_element(y.begin(), y.end()) + 1);
+        iota(begin(states[className]), end(states[className]), 0);
+    } else {
+        Xd = torch::zeros({ static_cast<int>(X[0].size()), static_cast<int>(X.size()) }, torch::kFloat32);
+        for (int i = 0; i < features.size(); ++i) {
+            Xd.index_put_({ "...", i }, torch::tensor(X[i]));
+        }
+    }
+    return { Xd, torch::tensor(y, torch::kInt32), features, className, states };
+}
+
+tuple<vector<vector<int>>, vector<int>, vector<string>, string, map<string, vector<int>>> loadFile(const string& name)
 {
    auto handler = ArffFiles();
    handler.load(PATH + static_cast<string>(name) + ".arff");
@@ -34,9 +92,8 @@ tuple<vector<vector<int>>, vector<int>, vector<string>, string, map<string, vect
    // Get className & Features
    auto className = handler.getClassName();
    vector<string> features;
-    for (auto feature : handler.getAttributes()) {
-        features.push_back(feature.first);
-    }
+    auto attributes = handler.getAttributes();
+    transform(attributes.begin(), attributes.end(), back_inserter(features), [](const auto& pair) { return pair.first; });
    // Discretize Dataset
    vector<mdlp::labels_t> Xd;
    map<string, int> maxes;
--- a/src/Platform/platformUtils.h
+++ b/src/Platform/platformUtils.h
@@ -1,5 +1,6 @@
 #ifndef PLATFORM_UTILS_H
 #define PLATFORM_UTILS_H
+#include <torch/torch.h>
 #include <string>
 #include <vector>
 #include <map>
@@ -10,6 +11,11 @@ using namespace std;
 const string PATH = "../../data/";

 bool file_exists(const std::string& name);
+vector<string> split(const string& text, char delimiter);
 pair<vector<mdlp::labels_t>, map<string, int>> discretize(vector<mdlp::samples_t>& X, mdlp::labels_t& y, vector<string> features);
-tuple<vector<vector<int>>, vector<int>, vector<string>, string, map<string, vector<int>>> loadFile(string name);
+vector<mdlp::labels_t> discretizeDataset(vector<mdlp::samples_t>& X, mdlp::labels_t& y);
+pair<torch::Tensor, map<string, vector<int>>> discretizeTorch(torch::Tensor& X, torch::Tensor& y, vector<string>& features, const string& className);
+tuple<vector<vector<int>>, vector<int>, vector<string>, string, map<string, vector<int>>> loadFile(const string& name);
+tuple<torch::Tensor, torch::Tensor, vector<string>, string, map<string, vector<int>>> loadDataset(const string& path, const string& name, bool class_last, bool discretize_dataset);
+map<string, vector<int>> get_states(vector<string>& features, string className, map<string, int>& maxes);
 #endif //PLATFORM_UTILS_H
--- a/src/Platform/typesFImdlp.h
+++ b/src/Platform/typesFImdlp.h
@@ -1,18 +0,0 @@
-#ifndef TYPES_H
-#define TYPES_H
-
-#include <vector>
-#include <map>
-#include <stdexcept>
-
-using namespace std;
-namespace mdlp {
-    typedef float precision_t;
-    typedef vector<precision_t> samples_t;
-    typedef vector<int> labels_t;
-    typedef vector<size_t> indices_t;
-    typedef vector<precision_t> cutPoints_t;
-    typedef map<pair<int, int>, precision_t> cacheEnt_t;
-    typedef map<tuple<int, int, int>, precision_t> cacheIg_t;
-}
-#endif
--- a/tests/BayesNetwork.cc
+++ b/tests/BayesNetwork.cc
@@ -9,29 +9,21 @@ TEST_CASE("Test Bayesian Network")
 {
    auto [Xd, y, features, className, states] = loadFile("iris");

-    SECTION("Test Update Nodes")
-    {
-        auto net = bayesnet::Network();
-        net.addNode("A", 3);
-        REQUIRE(net.getStates() == 3);
-        net.addNode("A", 5);
-        REQUIRE(net.getStates() == 5);
-    }
    SECTION("Test get features")
    {
        auto net = bayesnet::Network();
-        net.addNode("A", 3);
-        net.addNode("B", 5);
+        net.addNode("A");
+        net.addNode("B");
        REQUIRE(net.getFeatures() == vector<string>{"A", "B"});
-        net.addNode("C", 2);
+        net.addNode("C");
        REQUIRE(net.getFeatures() == vector<string>{"A", "B", "C"});
    }
    SECTION("Test get edges")
    {
        auto net = bayesnet::Network();
-        net.addNode("A", 3);
-        net.addNode("B", 5);
-        net.addNode("C", 2);
+        net.addNode("A");
+        net.addNode("B");
+        net.addNode("C");
        net.addEdge("A", "B");
        net.addEdge("B", "C");
        REQUIRE(net.getEdges() == vector<pair<string, string>>{ {"A", "B"}, { "B", "C" } });
--- a/tests/CMakeLists.txt
+++ b/tests/CMakeLists.txt
@@ -2,8 +2,10 @@ if(ENABLE_TESTING)
    set(TEST_MAIN "unit_tests")
    include_directories(${BayesNet_SOURCE_DIR}/src/BayesNet)
    include_directories(${BayesNet_SOURCE_DIR}/src/Platform)
-    set(TEST_SOURCES BayesModels.cc BayesNetwork.cc ${BayesNet_SOURCES} ${Platform_SOURCES})
+    include_directories(${BayesNet_SOURCE_DIR}/lib/Files)
+    include_directories(${BayesNet_SOURCE_DIR}/lib/mdlp)
+    set(TEST_SOURCES BayesModels.cc BayesNetwork.cc ${BayesNet_SOURCE_DIR}/src/Platform/platformUtils.cc ${BayesNet_SOURCES})
    add_executable(${TEST_MAIN} ${TEST_SOURCES})
-    target_link_libraries(${TEST_MAIN} PUBLIC "${TORCH_LIBRARIES}"  Catch2::Catch2WithMain)
+    target_link_libraries(${TEST_MAIN} PUBLIC "${TORCH_LIBRARIES}" ArffFiles mdlp Catch2::Catch2WithMain)
    add_test(NAME ${TEST_MAIN} COMMAND ${TEST_MAIN})
 endif(ENABLE_TESTING)
Author	SHA1	Message	Date
Ricardo Montañana	2da0fb5d8f	Merge branch 'main' into TANNew	2023-08-06 11:40:10 +02:00
Ricardo Montañana	14ea51648a	Complete AODELd	2023-08-06 11:31:44 +02:00
Ricardo Montañana	9e94f4e140	Rename suffix of proposal classifier to Ld	2023-08-05 23:23:31 +02:00
Ricardo Montañana	1d0fd629c9	Add SPODENew to models	2023-08-05 23:11:36 +02:00
Ricardo Montañana	506ef34c6f	Add report output to main	2023-08-05 20:29:05 +02:00
Ricardo Montañana	7f45495837	Refactor New classifiers to extract predict	2023-08-05 18:39:48 +02:00
Ricardo Montañana	1a09ccca4c	Add KDBNew fix computeCPT error	2023-08-05 14:40:42 +02:00
Ricardo Montañana	a1c6ab18f3	TANNew restructured with poor results	2023-08-04 20:11:22 +02:00
Ricardo Montañana	64ac8fb4f2	TANNew as a TAN variant working	2023-08-04 19:42:18 +02:00
Ricardo Montañana	c568ba111d	Add Proposal class	2023-08-04 13:05:12 +02:00
Ricardo Montañana	45c1d052ac	Compile TANNew with poor accuracy	2023-08-04 01:35:45 +02:00
Ricardo Montañana	eb1cec58a3	Complete nxm	2023-08-03 20:22:33 +02:00
Ricardo Montañana	f520b40016	Almost complete proposal in TANNew	2023-08-02 02:21:55 +02:00
Ricardo Montañana	cdfb45d2cb	Add topological order to Network	2023-08-02 00:56:52 +02:00
Ricardo Montañana	f63a9a64f9	Update Makefile to add Release & Debug build	2023-08-01 19:02:37 +02:00
Ricardo Montañana	285f0938a6	Update mdlp library	2023-08-01 17:33:01 +02:00
Ricardo Montañana	8f8f9773ce	Make TANNew same as TAN with local discretization	2023-08-01 13:17:12 +02:00
Ricardo Montañana	a9ba21560d	Add environment platform to experiment result	2023-08-01 10:55:53 +02:00
Ricardo Montañana	a18fbe5594	Begin implementation	2023-07-31 19:53:55 +02:00
Ricardo Montañana	adf650d257	Max threading	2023-07-31 18:49:18 +02:00
Ricardo Montañana	43bb017d5d	Fix problem with tensors way	2023-07-30 19:00:02 +02:00
Ricardo Montañana	53697648e7	Merge branch 'aftermath' into main	2023-07-30 01:05:31 +02:00
Ricardo Montañana	4ebc9c2013	Complete fixing the linter warnings	2023-07-30 00:16:58 +02:00
Ricardo Montañana	b882569169	Fix some more lint warnings	2023-07-30 00:04:18 +02:00
Ricardo Montañana	8b2ed26ab7	Fix some lint warnings	2023-07-29 20:37:51 +02:00
Ricardo Montañana	5efa3beaee	Fix some lint warnings	2023-07-29 20:20:38 +02:00
Ricardo Montañana	9a0449c12d	Fix some lint warnings	2023-07-29 19:38:42 +02:00
Ricardo Montañana	7222119dfb	Refactor experiment crossvalidation	2023-07-29 19:00:39 +02:00
Ricardo Montañana	cb54f61a69	Refactor Models to be a singleton factory Add Registrar of models	2023-07-29 18:22:15 +02:00
Ricardo Montañana	07d572a98c	Add Model factory	2023-07-29 17:27:43 +02:00
Ricardo Montañana	c4f3e6f19a	Refactor crossvalidation to remove unneeded params	2023-07-29 16:49:06 +02:00
Ricardo Montañana	adc0ca238f	Refactor cross_validation	2023-07-29 16:44:07 +02:00
Ricardo Montañana	b9e76becce	Add show experiment	2023-07-29 16:31:36 +02:00
Ricardo Montañana	85cb447283	Add Dataset, Models and DotEnv	2023-07-29 16:21:38 +02:00
Ricardo Montañana	b03e84044a	Fix some mistakes in timer and output format	2023-07-27 18:40:04 +02:00
Ricardo Montañana	7f7ddad36a	Fix stratified folding mistake in remainders	2023-07-27 16:51:27 +02:00
Ricardo Montañana	3d8fea7a37	Complete Experiment	2023-07-27 15:49:58 +02:00
Ricardo Montañana	bc214a496c	Adding Datasets management	2023-07-27 01:56:06 +02:00
Ricardo Montañana	3e954ba841	Complete json output compatible with benchmark	2023-07-26 19:01:39 +02:00
Ricardo Montañana	6f7fb290b0	Add json lib and json result generation	2023-07-26 17:49:03 +02:00
Ricardo Montañana	49a49a9dcd	Fix Experiment	2023-07-26 14:11:49 +02:00
Ricardo Montañana	af7a1d2b40	Fix score with tensors and finis sample	2023-07-26 13:29:47 +02:00
Ricardo Montañana	4a54bd42a2	Fix some mistakes	2023-07-26 12:53:01 +02:00
Ricardo Montañana	099b4bea09	Fix some mistakes in tensors treatment	2023-07-26 01:39:01 +02:00
Ricardo Montañana	be06e475f0	Refactor tensor2vector	2023-07-24 13:22:53 +02:00
Ricardo Montañana	c10ebca0e0	Add Experiment, Result and Timer classes	2023-07-24 01:15:12 +02:00
Ricardo Montañana	0c226371cc	Ensemble Experiment, Folding, Classifiers and Network together	2023-07-23 14:10:28 +02:00
Ricardo Montañana	644b6c9be0	Begin experiment	2023-07-23 01:47:57 +02:00
Ricardo Montañana	9981ad1811	Refactor Library renaming Base classes	2023-07-22 23:07:56 +02:00
Ricardo Montañana	41cceece20	Complete Stratified K Fold	2023-07-22 11:23:35 +02:00
Ricardo Montañana	f6e154bc6e	Begin Stratified KFold	2023-07-21 21:49:02 +02:00
Ricardo Montañana	a2622a4fb6	Begin Folding	2023-07-21 16:07:50 +02:00
Ricardo Montañana	d8218f9713	refactor sample to use new argparse library	2023-07-21 02:12:47 +02:00
Ricardo Montañana	48bfa02e1d	Add clang-tidy conf	2023-07-20 23:55:01 +02:00
Ricardo Montañana	f519003766	Remove unneeded files	2023-07-20 18:56:10 +02:00
Ricardo Montañana	8ddfd58a50	Fix some mistakes to correct tests	2023-07-20 18:55:56 +02:00