#include #include #include #include #include "TestUtils.h" #include "results/Result.h" #include "common/DotEnv.h" #include "common/Datasets.h" #include "common/Paths.h" #include "main/Scores.h" #include "config.h" auto epsilon = 1e-4; void make_test_bin(int TP, int TN, int FP, int FN, std::vector& y_test, std::vector& y_pred) { // TP for (int i = 0; i < TP; i++) { y_test.push_back(1); y_pred.push_back(1); } // TN for (int i = 0; i < TN; i++) { y_test.push_back(0); y_pred.push_back(0); } // FP for (int i = 0; i < FP; i++) { y_test.push_back(0); y_pred.push_back(1); } // FN for (int i = 0; i < FN; i++) { y_test.push_back(1); y_pred.push_back(0); } } TEST_CASE("Scores binary", "[Scores]") { std::vector y_test; std::vector y_pred; make_test_bin(197, 210, 52, 41, y_test, y_pred); auto y_test_tensor = torch::tensor(y_test, torch::kInt32); auto y_pred_tensor = torch::tensor(y_pred, torch::kInt32); platform::Scores scores(y_test_tensor, y_pred_tensor, 2); REQUIRE(scores.accuracy() == Catch::Approx(0.814).epsilon(epsilon)); REQUIRE(scores.f1_score(0) == Catch::Approx(0.818713)); REQUIRE(scores.f1_score(1) == Catch::Approx(0.809035)); REQUIRE(scores.precision(0) == Catch::Approx(0.836653)); REQUIRE(scores.precision(1) == Catch::Approx(0.791165)); REQUIRE(scores.recall(0) == Catch::Approx(0.801527)); REQUIRE(scores.recall(1) == Catch::Approx(0.827731)); REQUIRE(scores.f1_weighted() == Catch::Approx(0.814106)); REQUIRE(scores.f1_macro() == Catch::Approx(0.813874)); auto confusion_matrix = scores.get_confusion_matrix(); REQUIRE(confusion_matrix[0][0].item() == 210); REQUIRE(confusion_matrix[0][1].item() == 52); REQUIRE(confusion_matrix[1][0].item() == 41); REQUIRE(confusion_matrix[1][1].item() == 197); } TEST_CASE("Scores multiclass", "[Scores]") { std::vector y_test = { 0, 2, 2, 2, 2, 0, 1, 2, 0, 2 }; std::vector y_pred = { 0, 1, 2, 2, 1, 1, 1, 0, 0, 2 }; auto y_test_tensor = torch::tensor(y_test, torch::kInt32); auto y_pred_tensor = torch::tensor(y_pred, torch::kInt32); platform::Scores scores(y_test_tensor, y_pred_tensor, 3); REQUIRE(scores.accuracy() == Catch::Approx(0.6).epsilon(epsilon)); REQUIRE(scores.f1_score(0) == Catch::Approx(0.666667)); REQUIRE(scores.f1_score(1) == Catch::Approx(0.4)); REQUIRE(scores.f1_score(2) == Catch::Approx(0.666667)); REQUIRE(scores.precision(0) == Catch::Approx(0.666667)); REQUIRE(scores.precision(1) == Catch::Approx(0.25)); REQUIRE(scores.precision(2) == Catch::Approx(1.0)); REQUIRE(scores.recall(0) == Catch::Approx(0.666667)); REQUIRE(scores.recall(1) == Catch::Approx(1.0)); REQUIRE(scores.recall(2) == Catch::Approx(0.5)); REQUIRE(scores.f1_weighted() == Catch::Approx(0.64)); REQUIRE(scores.f1_macro() == Catch::Approx(0.577778)); } TEST_CASE("Test Confusion Matrix Values", "[Scores]") { std::vector y_test = { 0, 2, 2, 2, 2, 0, 1, 2, 0, 2 }; std::vector y_pred = { 0, 1, 2, 2, 1, 1, 1, 0, 0, 2 }; auto y_test_tensor = torch::tensor(y_test, torch::kInt32); auto y_pred_tensor = torch::tensor(y_pred, torch::kInt32); platform::Scores scores(y_test_tensor, y_pred_tensor, 3); auto confusion_matrix = scores.get_confusion_matrix(); REQUIRE(confusion_matrix[0][0].item() == 2); REQUIRE(confusion_matrix[0][1].item() == 1); REQUIRE(confusion_matrix[0][2].item() == 0); REQUIRE(confusion_matrix[1][0].item() == 0); REQUIRE(confusion_matrix[1][1].item() == 1); REQUIRE(confusion_matrix[1][2].item() == 0); REQUIRE(confusion_matrix[2][0].item() == 1); REQUIRE(confusion_matrix[2][1].item() == 2); REQUIRE(confusion_matrix[2][2].item() == 3); } TEST_CASE("Confusion Matrix JSON", "[Scores]") { std::vector y_test = { 0, 2, 2, 2, 2, 0, 1, 2, 0, 2 }; std::vector y_pred = { 0, 1, 2, 2, 1, 1, 1, 0, 0, 2 }; auto y_test_tensor = torch::tensor(y_test, torch::kInt32); auto y_pred_tensor = torch::tensor(y_pred, torch::kInt32); std::vector labels = { "Aeroplane", "Boat", "Car" }; platform::Scores scores(y_test_tensor, y_pred_tensor, 3, labels); auto res_json_int = scores.get_confusion_matrix_json(); REQUIRE(res_json_int[0][0] == 2); REQUIRE(res_json_int[0][1] == 1); REQUIRE(res_json_int[0][2] == 0); REQUIRE(res_json_int[1][0] == 0); REQUIRE(res_json_int[1][1] == 1); REQUIRE(res_json_int[1][2] == 0); REQUIRE(res_json_int[2][0] == 1); REQUIRE(res_json_int[2][1] == 2); REQUIRE(res_json_int[2][2] == 3); auto res_json_str = scores.get_confusion_matrix_json(true); REQUIRE(res_json_str["Aeroplane"][0] == 2); REQUIRE(res_json_str["Aeroplane"][1] == 1); REQUIRE(res_json_str["Aeroplane"][2] == 0); REQUIRE(res_json_str["Boat"][0] == 0); REQUIRE(res_json_str["Boat"][1] == 1); REQUIRE(res_json_str["Boat"][2] == 0); REQUIRE(res_json_str["Car"][0] == 1); REQUIRE(res_json_str["Car"][1] == 2); REQUIRE(res_json_str["Car"][2] == 3); } TEST_CASE("Classification Report", "[Scores]") { std::vector y_test = { 0, 2, 2, 2, 2, 0, 1, 2, 0, 2 }; std::vector y_pred = { 0, 1, 2, 2, 1, 1, 1, 0, 0, 2 }; auto y_test_tensor = torch::tensor(y_test, torch::kInt32); auto y_pred_tensor = torch::tensor(y_pred, torch::kInt32); std::vector labels = { "Aeroplane", "Boat", "Car" }; platform::Scores scores(y_test_tensor, y_pred_tensor, 3, labels); std::string expected = R"(Classification Report ===================== precision recall f1-score support ========= ========= ========= ========= Aeroplane 0.6666667 0.6666667 0.6666667 3 Boat 0.2500000 1.0000000 0.4000000 1 Car 1.0000000 0.5000000 0.6666667 6 accuracy 0.6000000 10 macro avg 0.6388889 0.7222223 0.5777778 10 weighted avg 0.8250000 0.6000000 0.6400000 10 )"; REQUIRE(scores.classification_report() == expected); auto json_matrix = scores.get_confusion_matrix_json(true); platform::Scores scores2(json_matrix); REQUIRE(scores.classification_report() == scores2.classification_report()); } TEST_CASE("JSON constructor", "[Scores]") { std::vector y_test = { 0, 2, 2, 2, 2, 0, 1, 2, 0, 2 }; std::vector y_pred = { 0, 1, 2, 2, 1, 1, 1, 0, 0, 2 }; auto y_test_tensor = torch::tensor(y_test, torch::kInt32); auto y_pred_tensor = torch::tensor(y_pred, torch::kInt32); std::vector labels = { "Aeroplane", "Boat", "Car" }; platform::Scores scores(y_test_tensor, y_pred_tensor, 3, labels); auto res_json_int = scores.get_confusion_matrix_json(); platform::Scores scores2(res_json_int); REQUIRE(scores.accuracy() == scores2.accuracy()); for (int i = 0; i < 2; ++i) { REQUIRE(scores.f1_score(i) == scores2.f1_score(i)); REQUIRE(scores.precision(i) == scores2.precision(i)); REQUIRE(scores.recall(i) == scores2.recall(i)); } REQUIRE(scores.f1_weighted() == scores2.f1_weighted()); REQUIRE(scores.f1_macro() == scores2.f1_macro()); auto res_json_key = scores.get_confusion_matrix_json(true); platform::Scores scores3(res_json_key); REQUIRE(scores.accuracy() == scores3.accuracy()); for (int i = 0; i < 2; ++i) { REQUIRE(scores.f1_score(i) == scores3.f1_score(i)); REQUIRE(scores.precision(i) == scores3.precision(i)); REQUIRE(scores.recall(i) == scores3.recall(i)); } REQUIRE(scores.f1_weighted() == scores3.f1_weighted()); REQUIRE(scores.f1_macro() == scores3.f1_macro()); } TEST_CASE("Aggregate", "[Scores]") { std::vector y_test; std::vector y_pred; make_test_bin(197, 210, 52, 41, y_test, y_pred); auto y_test_tensor = torch::tensor(y_test, torch::kInt32); auto y_pred_tensor = torch::tensor(y_pred, torch::kInt32); platform::Scores scores(y_test_tensor, y_pred_tensor, 2); y_test.clear(); y_pred.clear(); make_test_bin(227, 187, 39, 47, y_test, y_pred); auto y_test_tensor2 = torch::tensor(y_test, torch::kInt32); auto y_pred_tensor2 = torch::tensor(y_pred, torch::kInt32); platform::Scores scores2(y_test_tensor2, y_pred_tensor2, 2); scores.aggregate(scores2); REQUIRE(scores.accuracy() == Catch::Approx(0.821).epsilon(epsilon)); REQUIRE(scores.f1_score(0) == Catch::Approx(0.8160329)); REQUIRE(scores.f1_score(1) == Catch::Approx(0.8257059)); REQUIRE(scores.precision(0) == Catch::Approx(0.8185567)); REQUIRE(scores.precision(1) == Catch::Approx(0.8233010)); REQUIRE(scores.recall(0) == Catch::Approx(0.8135246)); REQUIRE(scores.recall(1) == Catch::Approx(0.8281250)); REQUIRE(scores.f1_weighted() == Catch::Approx(0.8209856)); REQUIRE(scores.f1_macro() == Catch::Approx(0.8208694)); y_test.clear(); y_pred.clear(); make_test_bin(197 + 227, 210 + 187, 52 + 39, 41 + 47, y_test, y_pred); y_test_tensor = torch::tensor(y_test, torch::kInt32); y_pred_tensor = torch::tensor(y_pred, torch::kInt32); platform::Scores scores3(y_test_tensor, y_pred_tensor, 2); for (int i = 0; i < 2; ++i) { REQUIRE(scores3.f1_score(i) == scores.f1_score(i)); REQUIRE(scores3.precision(i) == scores.precision(i)); REQUIRE(scores3.recall(i) == scores.recall(i)); } REQUIRE(scores3.f1_weighted() == scores.f1_weighted()); REQUIRE(scores3.f1_macro() == scores.f1_macro()); REQUIRE(scores3.accuracy() == scores.accuracy()); }