datasets removed, debug output added

2024-04-23 16:30:17 +02:00 · 2024-04-23 16:30:17 +02:00 · ecfc175622
parent 522d074087
commit ecfc175622
1 changed files with 13 additions and 8 deletions
--- a/quapy/data/datasets.py
+++ b/quapy/data/datasets.py
@ -79,7 +79,6 @@ UCI_MULTICLASS_DATASETS = [
    'room',
    'phishing2',
    'rt-iot22',
    'support2',
    'image_seg',
    'steel_plates',
    'hcv',
@ -703,7 +702,6 @@ def fetch_UCIMulticlassLabelledCollection(dataset_name, data_home=None, min_clas
        'room': 864,
        'phishing2': 379,
        'rt-iot22': 942,
        'support2': 880,
        'image_seg': 147,
        'steel_plates': 198,
        'hcv': 503,
@ -737,7 +735,6 @@ def fetch_UCIMulticlassLabelledCollection(dataset_name, data_home=None, min_clas
        'room': 'Room Occupancy Estimation',
        'phishing2': 'Website Phishing',
        'rt-iot22': 'RT-IoT2022',
        'support2': 'SUPPORT2',
        'image_seg': 'Statlog (Image Segmentation)',
        'steel_plates': 'Steel Plates Faults',
        'hcv': 'Hepatitis C Virus (HCV) for Egyptian patients',
@ -753,17 +750,25 @@ def fetch_UCIMulticlassLabelledCollection(dataset_name, data_home=None, min_clas
    def download(id, name):
        df = fetch_ucirepo(id=id)
        df.data.features = pd.get_dummies(df.data.features, drop_first=True)
        X, y = df.data.features.to_numpy(), df.data.targets.to_numpy().squeeze()
-        # classes represented as arrays are transformed to tuples to treat them as single objects
+
-        if name == 'support2':
+        with open(f"var/{name}_Xy.txt", "w") as f:
-            y[:, 2] = np.fromiter((str(elm) for elm in y[:, 2]), dtype='object')
+            for row in X:
-            raise ValueError('this is support 2')
+                f.write(str(row) + "\n")
            f.write("\n\n")
            if y.ndim > 1:
                unique_y = np.unique(np.fromiter((tuple(elm) for elm in y), dtype='object'))
            else:
                unique_y = np.unique(y)
            f.write(str(unique_y) + "\n\n")
            for row in y:
                f.write(str(row) + "\n")
        if y.ndim > 1:
            y = np.fromiter((tuple(elm) for elm in y), dtype='object')
            raise ValueError('more than one y')
        classes = np.sort(np.unique(y))