# Mirror of https://github.com/Doctorado-ML/mufs.git
# (synced 2025-08-18 00:55:53 +00:00)
# 202 lines, 6.8 KiB, Python, executable file
import unittest
|
|
import os
|
|
import pandas as pd
|
|
import numpy as np
|
|
from mdlp import MDLP
|
|
from sklearn.datasets import load_wine, load_iris
|
|
from ..Selection import MUFS
|
|
from .._version import __version__
|
|
|
|
|
|
class MUFSTest(unittest.TestCase):
    """Regression tests for the ``cfs``, ``fcbf`` and ``iwss`` methods of MUFS.

    Shared fixtures (available through ``self`` in every test):

    * ``X_wc`` / ``y_w``: wine data as returned by ``load_wine``.
    * ``X_w``: ``X_wc`` discretized with MDLP and cast to ``int64``.
    * ``X_ic`` / ``y_i``: iris data as returned by ``load_iris``.
    * ``X_i``: ``X_ic`` discretized with MDLP and cast to ``int64``.
    """

    @classmethod
    def setUpClass(cls):
        """Load and discretize the datasets once for the whole class.

        Test runners create a new TestCase instance for every test method,
        so doing this work in ``__init__`` repeats both MDLP fits for each
        test. Building the fixtures here runs them a single time.

        NOTE(review): the fixtures are now shared between tests; this
        assumes MUFS does not modify the arrays it receives -- confirm.
        """
        super().setUpClass()
        cls.X_wc, cls.y_w = load_wine(return_X_y=True)
        cls.X_w = cls._discretize(cls.X_wc, cls.y_w)
        cls.X_ic, cls.y_i = load_iris(return_X_y=True)
        cls.X_i = cls._discretize(cls.X_ic, cls.y_i)

    @staticmethod
    def _discretize(X, y):
        """Return ``X`` discretized by a fresh ``MDLP(random_state=1)``."""
        return MDLP(random_state=1).fit_transform(X, y).astype("int64")

    def test_version(self):
        """Check package version."""
        mufs = MUFS()
        self.assertEqual(__version__, mufs.version())

    def assertListAlmostEqual(self, list1, list2, tol=7):
        """Assert two sequences have equal length and almost-equal items.

        ``tol`` is forwarded to ``assertAlmostEqual`` as ``places`` (number
        of decimal places). The position of the first differing pair is
        appended to the failure message.
        """
        self.assertEqual(len(list1), len(list2))
        for index, (first, second) in enumerate(zip(list1, list2)):
            self.assertAlmostEqual(
                first,
                second,
                places=tol,
                msg="lists differ at index {}".format(index),
            )

    def test_initialize(self):
        """``_initialize`` after a run leaves no results, scores or SU data."""
        mufs = MUFS()
        mufs.fcbf(self.X_w, self.y_w, 0.05)
        mufs._initialize(self.X_w, self.y_w)
        self.assertIsNone(mufs.get_results())
        self.assertListEqual([], mufs.get_scores())
        self.assertDictEqual({}, mufs._su_features)
        self.assertIsNone(mufs._su_labels)

    def test_csf_wine(self):
        """``cfs`` on discretized wine (method name keeps the 'csf' typo)."""
        mufs = MUFS()
        expected = [6, 12, 9, 4, 10, 0]
        self.assertListEqual(
            expected, mufs.cfs(self.X_w, self.y_w).get_results()
        )
        expected = [
            0.5218299405215557,
            0.602513857132804,
            0.4877384978817362,
            0.3743688234383051,
            0.28795671854246285,
            0.2309165735173175,
        ]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_csf_wine_cont(self):
        """``cfs`` with ``discrete=False`` on the raw wine features."""
        mufs = MUFS(discrete=False)
        expected = [10, 6, 0, 2, 11, 9]
        self.assertListEqual(
            expected, mufs.cfs(self.X_wc, self.y_w).get_results()
        )
        expected = [
            0.735264150416997,
            0.8321684551546848,
            0.7439915858469107,
            0.6238883340158233,
            0.513637402071709,
            0.41596400981378984,
        ]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_csf_max_features(self):
        """``cfs`` with ``max_features=3`` on discretized wine."""
        mufs = MUFS(max_features=3)
        expected = [6, 12, 9]
        self.assertListAlmostEqual(
            expected, mufs.cfs(self.X_w, self.y_w).get_results()
        )
        expected = [
            0.5218299405215557,
            0.602513857132804,
            0.4877384978817362,
        ]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_csf_iris(self):
        """``cfs`` on discretized iris."""
        mufs = MUFS()
        expected = [3, 2, 0, 1]
        computed = mufs.cfs(self.X_i, self.y_i).get_results()
        self.assertListEqual(expected, computed)
        expected = [
            0.870521418179061,
            0.8968651482682227,
            0.5908278453318913,
            0.40371971570693366,
        ]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_fcbf_wine(self):
        """``fcbf`` on discretized wine with ``threshold=0.05``."""
        mufs = MUFS()
        computed = mufs.fcbf(self.X_w, self.y_w, threshold=0.05).get_results()
        expected = [6, 9, 12, 0, 11, 4]
        self.assertListAlmostEqual(expected, computed)
        expected = [
            0.5218299405215557,
            0.46224298637417455,
            0.44518278979085646,
            0.38942355544213786,
            0.3790082191220976,
            0.24972405134844652,
        ]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_fcbf_max_features(self):
        """``fcbf`` with ``max_features=3`` on discretized wine."""
        mufs = MUFS(max_features=3)
        computed = mufs.fcbf(self.X_w, self.y_w, threshold=0.05).get_results()
        expected = [6, 9, 12]
        self.assertListAlmostEqual(expected, computed)
        expected = [
            0.5218299405215557,
            0.46224298637417455,
            0.44518278979085646,
        ]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_fcbf_iris(self):
        """``fcbf`` on discretized iris with ``threshold=0.05``."""
        mufs = MUFS()
        computed = mufs.fcbf(self.X_i, self.y_i, threshold=0.05).get_results()
        expected = [3, 2]
        self.assertListAlmostEqual(expected, computed)
        expected = [0.870521418179061, 0.810724587460511]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_compute_su_labels(self):
        """``_compute_su_labels`` after ``fcbf``, then with a preset value."""
        mufs = MUFS()
        mufs.fcbf(self.X_i, self.y_i, threshold=0.05)
        expected = [0.0, 0.0, 0.810724587460511, 0.870521418179061]
        self.assertListAlmostEqual(
            expected, mufs._compute_su_labels().tolist()
        )
        # With _su_labels already set, the same values are expected back.
        mufs._su_labels = [1, 2, 3, 4]
        self.assertListAlmostEqual([1, 2, 3, 4], mufs._compute_su_labels())

    def test_invalid_threshold(self):
        """``fcbf`` raises ``ValueError`` for ``threshold=1e-15``."""
        mufs = MUFS()
        with self.assertRaises(ValueError):
            mufs.fcbf(self.X_i, self.y_i, threshold=1e-15)

    def test_fcbf_exit_threshold(self):
        """``fcbf`` on discretized wine with ``threshold=0.4``."""
        mufs = MUFS()
        computed = mufs.fcbf(self.X_w, self.y_w, threshold=0.4).get_results()
        expected = [6, 9, 12]
        self.assertListAlmostEqual(expected, computed)
        expected = [
            0.5218299405215557,
            0.46224298637417455,
            0.44518278979085646,
        ]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_iwss_wine(self):
        """``iwss`` on discretized wine with a third argument of 0.2."""
        mufs = MUFS()
        expected = [6, 9, 12]
        self.assertListEqual(
            expected, mufs.iwss(self.X_w, self.y_w, 0.2).get_results()
        )
        expected = [0.5218299405215557, 0.5947822876110085, 0.4877384978817362]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_iwss_wine_max_features(self):
        """``iwss`` with ``max_features=3`` and a third argument of 0.4."""
        mufs = MUFS(max_features=3)
        expected = [6, 9, 12]
        self.assertListEqual(
            expected, mufs.iwss(self.X_w, self.y_w, 0.4).get_results()
        )
        expected = [0.5218299405215557, 0.5947822876110085, 0.4877384978817362]
        self.assertListAlmostEqual(expected, mufs.get_scores())

    def test_iwss_exception(self):
        """``iwss`` raises ``ValueError`` for third arguments 0.51 and -0.01."""
        mufs = MUFS()
        with self.assertRaises(ValueError):
            mufs.iwss(self.X_w, self.y_w, 0.51)
        with self.assertRaises(ValueError):
            mufs.iwss(self.X_w, self.y_w, -0.01)

    def test_iwss_better_merit_condition(self):
        """``iwss`` on the ``balloons_R.dat`` file stored next to this module."""
        folder = os.path.dirname(os.path.abspath(__file__))
        data = pd.read_csv(
            os.path.join(folder, "balloons_R.dat"),
            sep="\t",
            index_col=0,
        )
        # The "clase" column holds the labels; the other columns are features.
        X = data.drop("clase", axis=1).to_numpy()
        y = data["clase"].to_numpy()
        mufs = MUFS()
        expected = [0, 2, 3, 1]
        self.assertListEqual(expected, mufs.iwss(X, y, 0.3).get_results())

    def test_iwss_empty(self):
        """``iwss`` on discretized iris with columns 0 and 1 removed."""
        mufs = MUFS()
        X = np.delete(self.X_i, [0, 1], 1)
        expected = [1, 0]
        # Expected value first, matching the other assertions in this class.
        self.assertListEqual(expected, mufs.iwss(X, self.y_i, 0.3).get_results())