mirror of
https://github.com/Doctorado-ML/Stree_datasets.git
synced 2025-08-15 23:46:03 +00:00
Commit Inicial
This commit is contained in:
32
analysis.py
Normal file
32
analysis.py
Normal file
@@ -0,0 +1,32 @@
|
||||
from pathlib import Path

import numpy as np
import pandas as pd
import sweetviz as sv

from experimentation import Dataset
|
||||
|
||||
|
||||
def dataframe(X, y):
    """Join a feature matrix and its labels into a single DataFrame.

    Parameters
    ----------
    X : array-like, 2-D
        Feature matrix, one row per sample.
    y : array-like
        Labels, one per row of ``X``. Any array-like is accepted (ndarray,
        list, ...); it is reshaped into a single column.

    Returns
    -------
    pandas.DataFrame
        The columns of ``X`` followed by the labels as the last column,
        with pandas' default integer column names.
    """
    # np.asarray makes the reshape work for plain sequences as well as
    # ndarrays; ndarray input is passed through without copying.
    label = np.asarray(y).reshape(-1, 1)
    return pd.DataFrame(np.concatenate((X, label), axis=1))
|
||||
|
||||
|
||||
# datasets = Dataset()
|
||||
# for dataset in datasets:
|
||||
# if dataset[0] > "usps" and dataset[0] != "usps":
|
||||
# data = dataframe(*datasets.load(dataset[0]))
|
||||
# print(dataset[0], data.shape)
|
||||
# report = sv.analyze(source=[data, dataset[0]])
|
||||
# report.show_html(f"html/{dataset[0]}.html")
|
||||
|
||||
# datasets = Dataset()
|
||||
# for dataset in ['mnist', 'protein', 'usps', 'shuttle']:
|
||||
# data = dataframe(*datasets.load(dataset))
|
||||
# print(dataset, data.shape)
|
||||
# report = sv.analyze(source=[data, dataset], pairwise_analysis="off")
|
||||
# report.show_html(f"html/{dataset}.html")
|
||||
|
||||
# Generate a sweetviz HTML report for each dataset listed below.
datasets = Dataset(normalize=True)
# Reports are written under html/; create the folder up front so a fresh
# checkout does not fail when the first report is saved.
Path("html").mkdir(parents=True, exist_ok=True)
for dataset in ["shuttle"]:
    # datasets.load(...) is unpacked straight into dataframe(X, y).
    data = dataframe(*datasets.load(dataset))
    print(dataset, data.shape)
    # NOTE(review): pairwise analysis is switched off here, presumably to
    # keep the run time manageable on large datasets - confirm.
    report = sv.analyze(source=[data, dataset], pairwise_analysis="off")
    report.show_html(f"html/{dataset}.html")
|
Reference in New Issue
Block a user