#include #include #include "best/BestScore.h" #include "ReportExcel.h" namespace platform { ReportExcel::ReportExcel(json data_, bool compare, lxw_workbook* workbook, lxw_worksheet* worksheet) : ReportBase(data_, compare), ExcelFile(workbook, worksheet) { createFile(); createFormats(); } void ReportExcel::formatColumns() { worksheet_freeze_panes(worksheet, 6, 1); std::vector columns_sizes = { 22, 10, 9, 7, 12, 12, 12, 12, 12, 3, 15, 12, 23 }; for (int i = 0; i < columns_sizes.size(); ++i) { worksheet_set_column(worksheet, i, i, columns_sizes.at(i), NULL); } } void ReportExcel::createFile() { if (workbook == NULL) { workbook = workbook_new((Paths::excel() + Paths::excelResults()).c_str()); } if (worksheet == NULL) { const std::string name = data["model"].get(); worksheet = createWorksheet(name); } setProperties(data["title"].get()); formatColumns(); } void ReportExcel::closeFile() { workbook_close(workbook); } void ReportExcel::header() { auto loc = std::locale("es_ES"); std::cout.imbue(loc); std::stringstream oss; std::string message = data["model"].get() + " ver. " + data["version"].get() + " " + data["language"].get() + " ver. " + data["language_version"].get() + " with " + std::to_string(data["folds"].get()) + " Folds cross validation and " + std::to_string(data["seeds"].size()) + " random seeds. " + data["date"].get() + " " + data["time"].get(); worksheet_merge_range(worksheet, 0, 0, 0, 12, message.c_str(), styles["headerFirst"]); worksheet_merge_range(worksheet, 1, 0, 1, 12, data["title"].get().c_str(), styles["headerRest"]); worksheet_merge_range(worksheet, 2, 0, 3, 0, ("Score is " + data["score_name"].get()).c_str(), styles["headerRest"]); writeString(2, 1, "Smooth", "headerRest"); std::string smooth = data.find("smooth_strategy") != data.end() ? data["smooth_strategy"].get() : "ORIGINAL"; writeString(3, 1, smooth, "headerSmall"); worksheet_merge_range(worksheet, 2, 2, 3, 3, "Execution time", styles["headerRest"]); oss << std::setprecision(2) << std::fixed << data["duration"].get() << " s"; worksheet_merge_range(worksheet, 2, 4, 2, 5, oss.str().c_str(), styles["headerRest"]); oss.str(""); oss.clear(); oss << std::setprecision(2) << std::fixed << data["duration"].get() / 3600 << " h"; worksheet_merge_range(worksheet, 3, 4, 3, 5, oss.str().c_str(), styles["headerRest"]); worksheet_merge_range(worksheet, 2, 6, 3, 7, "Platform", styles["headerRest"]); worksheet_merge_range(worksheet, 2, 8, 3, 9, data["platform"].get().c_str(), styles["headerRest"]); worksheet_merge_range(worksheet, 2, 10, 2, 12, ("Random seeds: " + fromVector("seeds")).c_str(), styles["headerSmall"]); oss.str(""); oss.clear(); oss << "Stratified: " << (data["stratified"].get() ? "True" : "False"); worksheet_merge_range(worksheet, 3, 10, 3, 11, oss.str().c_str(), styles["headerSmall"]); oss.str(""); oss.clear(); std::string discretize_algo = data.find("discretization_algorithm") != data.end() ? data["discretization_algorithm"].get() : "mdlp"; std::string algorithm = data["discretized"].get() ? " (" + discretize_algo + ")" : ""; oss << "Discretized: " << (data["discretized"].get() ? "True" : "False") << algorithm; worksheet_write_string(worksheet, 3, 12, oss.str().c_str(), styles["headerSmall"]); } void ReportExcel::header_notes(int row) { writeString(row, 0, "Dataset", "bodyHeader"); worksheet_merge_range(worksheet, row, 1, row, 6, "Note", styles["bodyHeader_even"]); } void ReportExcel::append_notes(const json& r, int row) { static bool even_note = true; std::string suffix; if (even_note) { even_note = false; suffix = "_even"; } else { even_note = true; suffix = "_odd"; } lxw_format* style = NULL; style = styles.at("text" + suffix); auto initial_row = row; for (const auto& note : r["notes"]) { worksheet_merge_range(worksheet, row, 1, row, 6, note.get().c_str(), style); row++; } if (row - 1 == initial_row) { writeString(initial_row, 0, r["dataset"].get(), "text"); } else { worksheet_merge_range(worksheet, initial_row, 0, row - 1, 0, r["dataset"].get().c_str(), style); } } void ReportExcel::body() { auto head = std::vector( { "Dataset", "Samples", "Features", "Classes", "Nodes", "Edges", "States", "Score", "Score Std.", "St.", "Time", "Time Std.", "Hyperparameters" }); int col = 0; for (const auto& item : head) { writeString(5, col++, item, "bodyHeader"); } row = 6; col = 0; int hypSize = 22; json lastResult; double totalScore = 0.0; std::string hyperparameters; bool only_one_result = data["results"].size() == 1; bool first_note = true; int notes_row = 15 + data["results"].size(); for (const auto& r : data["results"]) { writeString(row, col, r["dataset"].get(), "text"); writeInt(row, col + 1, r["samples"].get(), "ints"); writeInt(row, col + 2, r["features"].get(), "ints"); writeInt(row, col + 3, r["classes"].get(), "ints"); writeDouble(row, col + 4, r["nodes"].get(), "floats"); writeDouble(row, col + 5, r["leaves"].get(), "floats"); writeDouble(row, col + 6, r["depth"].get(), "floats"); writeDouble(row, col + 7, r["score"].get(), "result"); writeDouble(row, col + 8, r["score_std"].get(), "result"); const std::string status = compareResult(r["dataset"].get(), r["score"].get()); writeString(row, col + 9, status, "textCentered"); writeDouble(row, col + 10, r["time"].get(), "time"); writeDouble(row, col + 11, r["time_std"].get(), "time"); hyperparameters = r["hyperparameters"].dump(); if (hyperparameters.size() > hypSize) { hypSize = hyperparameters.size(); } writeString(row, col + 12, hyperparameters, "text"); lastResult = r; totalScore += r["score"].get(); row++; if (!only_one_result) { // take care of the possible notes if (r.find("notes") != r.end()) { if (r["notes"].size() > 0) { if (first_note) { first_note = false; header_notes(notes_row++); } append_notes(r, notes_row); notes_row += r["notes"].size(); } } } } // Set the right column width of hyperparameters with the maximum length worksheet_set_column(worksheet, 12, 12, hypSize + 5, NULL); // Show totals if only one dataset is present in the result if (only_one_result) { row++; if (lastResult.find("notes") != lastResult.end()) { if (lastResult["notes"].size() > 0) { writeString(row++, 1, "Notes: ", "bodyHeader"); for (const auto& note : lastResult["notes"]) { worksheet_merge_range(worksheet, row, 2, row, 5, note.get().c_str(), efectiveStyle("text")); row++; } } } for (const std::string& group : { "scores_train", "scores_test", "times_train", "times_test" }) { row++; col = 1; writeString(row, col, group, "text"); for (double item : lastResult[group]) { std::string style = group.find("scores") != std::string::npos ? "result" : "time"; writeDouble(row, ++col, item, style); } } // Classificacion report if (lastResult.find("confusion_matrices") != lastResult.end()) { create_classification_report(lastResult); } // Set with of columns to show those totals completely worksheet_set_column(worksheet, 1, 1, 12, NULL); for (int i = 2; i < 7; ++i) { // doesn't work with from col to col, so... worksheet_set_column(worksheet, i, i, 15, NULL); } } else { footer(totalScore, row); } } void ReportExcel::create_classification_report(const json& result) { auto matrix_sheet = createWorksheet("clf_report"); lxw_worksheet* tmp = worksheet; worksheet = matrix_sheet; if (matrix_sheet == NULL) { throw std::invalid_argument("Couldn't create sheet classif_report"); } row = 1; int col = 0; if (result.find("confusion_matrices_train") != result.end()) { // Train classification report auto score = Scores::create_aggregate(result, "confusion_matrices_train"); auto train = score.classification_report_json("Train"); std::tie(row, col) = write_classification_report(train, row, 0); int new_row = 0; int new_col = col + 1; for (int i = 0; i < result["confusion_matrices_train"].size(); ++i) { auto item = result["confusion_matrices_train"][i]; auto score_item = Scores(item); auto title = "Train Fold " + std::to_string(i); std::tie(new_row, new_col) = write_classification_report(score_item.classification_report_json(title), 1, new_col); new_col++; } col = new_col; worksheet_merge_range(matrix_sheet, 0, 0, 0, col - 1, "Train Classification Report", efectiveStyle("headerRest")); } // Test classification report worksheet_merge_range(matrix_sheet, row, 0, row, col - 1, "Test Classification Report", efectiveStyle("headerRest")); auto score = Scores::create_aggregate(result, "confusion_matrices"); auto test = score.classification_report_json("Test"); int init_row = ++row; std::tie(row, col) = write_classification_report(test, init_row, 0); int new_row = 0; int new_col = col + 1; for (int i = 0; i < result["confusion_matrices"].size(); ++i) { auto item = result["confusion_matrices"][i]; auto score_item = Scores(item); auto title = "Test Fold " + std::to_string(i); std::tie(new_row, new_col) = write_classification_report(score_item.classification_report_json(title), init_row, new_col); new_col++; } // Format columns (change size to fit the content) for (int i = 0; i < new_col; ++i) { // doesn't work with from col to col, so... worksheet_set_column(worksheet, i, i, 12, NULL); } worksheet = tmp; } std::pair ReportExcel::write_classification_report(const json& result, int init_row, int init_col) { row = init_row; auto text = result["title"].get(); worksheet_merge_range(worksheet, row, init_col, row + 1, init_col + 5, text.c_str(), efectiveStyle("bodyHeader")); row += 2; int col = init_col + 2; // Headers bool first_item = true; for (const auto& item : result["headers"]) { auto text = item.get(); if (first_item) { first_item = false; worksheet_merge_range(worksheet, row, init_col, row, init_col + 1, text.c_str(), efectiveStyle("bodyHeader")); } else { writeString(row, col++, text, "bodyHeader"); } } row++; // Classes f1-score for (const auto& item : result["body"]) { col = init_col + 2; for (const auto& value : item) { if (value.is_string()) { worksheet_merge_range(worksheet, row, init_col, row, init_col + 1, value.get().c_str(), efectiveStyle("text")); } else { if (value.is_number_integer()) { writeInt(row, col++, value.get(), "ints"); } else { writeDouble(row, col++, value.get(), "result"); } } } row++; } // Accuracy and average f1-score for (const auto& item : { "accuracy", "averages", "weighted" }) { col = init_col + 2; for (const auto& value : result[item]) { if (value.is_string()) { worksheet_merge_range(worksheet, row, init_col, row, init_col + 1, value.get().c_str(), efectiveStyle("text")); } else { if (value.is_number_integer()) { writeInt(row, col++, value.get(), "ints"); } else { writeDouble(row, col++, value.get(), "result"); } } } row++; } // Confusion matrix auto n_items = result["confusion_matrix"].size(); worksheet_merge_range(worksheet, row, init_col, row, init_col + n_items + 1, "Confusion Matrix", efectiveStyle("bodyHeader")); row++; boldGreen(); for (int i = 0; i < n_items; ++i) { col = init_col + 2; auto label = result["body"][i][0].get(); worksheet_merge_range(worksheet, row, init_col, row, init_col + 1, label.c_str(), efectiveStyle("text")); for (int j = 0; j < result["confusion_matrix"][i].size(); ++j) { auto value = result["confusion_matrix"][i][j]; if (i == j) { writeInt(row, col++, value.get(), "ints_bold"); } else { writeInt(row, col++, value.get(), "ints"); } } row++; } int maxcol = std::max(init_col + 5, int(init_col + n_items + 1)); return { row, maxcol }; } void ReportExcel::showSummary() { for (const auto& item : summary) { worksheet_write_string(worksheet, row + 2, 1, item.first.c_str(), styles["summaryStyle"]); worksheet_write_number(worksheet, row + 2, 2, item.second, styles["summaryStyle"]); worksheet_merge_range(worksheet, row + 2, 3, row + 2, 5, meaning.at(item.first).c_str(), styles["summaryStyle"]); row += 1; } } void ReportExcel::footer(double totalScore, int row) { showSummary(); row += 4 + summary.size(); auto score = data["score_name"].get(); auto best = BestScore::getScore(score); if (best.first != "") { worksheet_merge_range(worksheet, row, 1, row, 5, (score + " compared to " + best.first + " .:").c_str(), efectiveStyle("text")); writeDouble(row, 6, totalScore / best.second, "result"); } if (!getExistBestFile() && compare) { worksheet_write_string(worksheet, row + 1, 0, "*** Best Results File not found. Couldn't compare any result!", styles["summaryStyle"]); } } }