Add consistent comparative results to reports

2022-10-25 15:00:37 +02:00
parent 29c4b4ceef
commit b24a508d1c
18 changed files with 75 additions and 29 deletions


@@ -9,16 +9,37 @@ import xlsxwriter
 import numpy as np
 from .Experiments import BestResults
 from .Datasets import Datasets
 from .Arguments import EnvData, ALL_METRICS
 from .Utils import (
     Folders,
     Files,
     Symbols,
     BEST_ACCURACY_STREE,
     TextColor,
     NO_RESULTS,
 )
+class BestResultsEver:
+    def __init__(self):
+        self.data = {}
+        for i in ["Tanveer", "Surcov", "Arff"]:
+            self.data[i] = {}
+            for metric in ALL_METRICS:
+                self.data[i][metric.replace("-", "_")] = ["self", 1.0]
+                self.data[i][metric] = ["self", 1.0]
+        self.data["Tanveer"]["accuracy"] = [
+            "STree_default (liblinear-ovr)",
+            40.282203,
+        ]
+        self.data["Arff"]["accuracy"] = [
+            "STree_default (linear-ovo)",
+            21.9765,
+        ]
+    def get_name_value(self, key, score):
+        return self.data[key][score]
 class BaseReport(abc.ABC):
     def __init__(self, file_name, best_file=False):
         self.file_name = file_name
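Note (not part of the commit): a minimal sketch of how the new lookup behaves, using only values copied from the constructor above. Every (source, metric) pair defaults to ["self", 1.0]; only the Tanveer and Arff accuracy entries point at an external reference.

    # Illustrative sketch; assumes it runs in the same module as BestResultsEver
    # and that "accuracy" is one of the ALL_METRICS entries.
    best = BestResultsEver()
    best.get_name_value("Tanveer", "accuracy")  # ["STree_default (liblinear-ovr)", 40.282203]
    best.get_name_value("Arff", "accuracy")     # ["STree_default (linear-ovo)", 21.9765]
    best.get_name_value("Surcov", "accuracy")   # ["self", 1.0] -- the default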
@@ -30,7 +51,20 @@ class BaseReport(abc.ABC):
         with open(self.file_name) as f:
             self.data = json.load(f)
         self.best_acc_file = best_file
-        self.lines = self.data if best_file else self.data["results"]
+        if best_file:
+            self.lines = self.data
+        else:
+            self.lines = self.data["results"]
         self.score_name = self.data["score_name"]
+        self.__compute_best_results_ever()
+    def __compute_best_results_ever(self):
+        args = EnvData.load()
+        key = args["source_data"]
+        best = BestResultsEver()
+        self.best_score_name, self.best_score_value = best.get_name_value(
+            key, self.score_name
+        )
     def _get_accuracy(self, item):
         return self.data[item][0] if self.best_acc_file else item["score"]
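Note (not part of the commit): the private helper added above resolves the reference from the environment. A hedged sketch of its effect, assuming the configured source_data is "Tanveer" and the report was scored with accuracy:

    # Illustrative only.
    args = EnvData.load()                 # e.g. {"source_data": "Tanveer", ...}
    best = BestResultsEver()
    name, value = best.get_name_value(args["source_data"], "accuracy")
    # name == "STree_default (liblinear-ovr)", value == 40.282203
    # These land in self.best_score_name / self.best_score_value.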
@@ -69,6 +103,12 @@
         }
         return meaning[status]
+    def _get_best_accuracy(self):
+        return self.best_score_value
+    def _get_message_best_accuracy(self):
+        return f"{self.score_name} compared to {self.best_score_name} .:"
     @abc.abstractmethod
     def header(self) -> None:
         pass
@@ -188,8 +228,8 @@ class Report(BaseReport):
                 f" {key} {self._status_meaning(key)} .....: {value:2d}"
             )
         self.header_line(
-            f" Accuracy compared to stree_default (liblinear-ovr) .: "
-            f"{accuracy/BEST_ACCURACY_STREE:7.4f}"
+            f" {self._get_message_best_accuracy()} "
+            f"{accuracy/self._get_best_accuracy():7.4f}"
         )
         self.header_line("*")
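Note (not part of the commit): with the two helpers in place, the footer text is built from the loaded report instead of the hard-coded STree reference. A hedged sketch of the pieces for an accuracy report under the Tanveer source:

    # Illustrative only; values taken from the BestResultsEver table above.
    msg = self._get_message_best_accuracy()
    # msg == "accuracy compared to STree_default (liblinear-ovr) .:"
    ref = self._get_best_accuracy()
    # ref == 40.282203, so the printed figure is accuracy / 40.282203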
@@ -209,12 +249,12 @@ class ReportBest(BaseReport):
             if best
             else Files.grid_output(score, model)
         )
-        file_name = os.path.join(Folders.results, name)
         self.best = best
         self.grid = grid
+        file_name = os.path.join(Folders.results, name)
-        super().__init__(file_name, best_file=True)
         self.score_name = score
         self.model = model
+        super().__init__(file_name, best_file=True)
     def header_line(self, text: str) -> None:
         length = sum(self.header_lengths) + len(self.header_lengths) - 3
@@ -254,8 +294,8 @@
     def footer(self, accuracy):
         self.header_line("*")
         self.header_line(
-            f" Scores compared to stree_default accuracy (liblinear-ovr) .: "
-            f"{accuracy/BEST_ACCURACY_STREE:7.4f}"
+            f" {self._get_message_best_accuracy()} "
+            f"{accuracy/self._get_best_accuracy():7.4f}"
        )
         self.header_line("*")
@@ -509,8 +549,8 @@ class Excel(BaseReport):
             self.sheet.write(self.row, 3, self._status_meaning(key), bold)
             self.row += 1
         message = (
-            f"** Accuracy compared to stree_default (liblinear-ovr) .: "
-            f"{accuracy/BEST_ACCURACY_STREE:7.4f}"
+            f"** {self._get_message_best_accuracy()} "
+            f"{accuracy/self._get_best_accuracy():7.4f}"
         )
         bold = self.book.add_format({"bold": True, "font_size": 14})
         # set width of the hyperparams column with the maximum width
@@ -634,6 +674,13 @@ class Benchmark:
         self._report = {}
         self._datasets = set()
         self.visualize = visualize
+        self.__compute_best_results_ever()
+    def __compute_best_results_ever(self):
+        args = EnvData.load()
+        key = args["source_data"]
+        best = BestResultsEver()
+        _, self.best_score_value = best.get_name_value(key, self._score)
     def get_result_file_name(self):
         return os.path.join(Folders.exreport, Files.exreport(self._score))
@@ -971,7 +1018,7 @@
         sheet.write_formula(
             row,
             col + 1,
-            f"=sum({range_metric})/{BEST_ACCURACY_STREE}",
+            f"=sum({range_metric})/{self.best_score_value}",
             decimal_total,
         )
         range_rank = (
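Note (not part of the commit): the exported spreadsheet total now divides by the same per-source reference value instead of the BEST_ACCURACY_STREE constant. A hedged sketch of the formula string that gets written, with a hypothetical range_metric of "E4:E25" on a Tanveer run:

    # Illustrative only: best_score_value == 40.282203 for the Tanveer source,
    # so the written formula reads "=sum(E4:E25)/40.282203".
    formula = f"=sum({range_metric})/{self.best_score_value}"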
@@ -1063,7 +1110,7 @@ class StubReport(BaseReport):
     def footer(self, accuracy: float) -> None:
         self.accuracy = accuracy
-        self.score = accuracy / BEST_ACCURACY_STREE
+        self.score = accuracy / self._get_best_accuracy()
 class Summary: