Remove the 'support2' dataset; add debug output that dumps X, the unique labels, and y to var/{name}_Xy.txt
This commit is contained in:
parent
522d074087
commit
ecfc175622
|
@ -79,7 +79,6 @@ UCI_MULTICLASS_DATASETS = [
|
||||||
'room',
|
'room',
|
||||||
'phishing2',
|
'phishing2',
|
||||||
'rt-iot22',
|
'rt-iot22',
|
||||||
'support2',
|
|
||||||
'image_seg',
|
'image_seg',
|
||||||
'steel_plates',
|
'steel_plates',
|
||||||
'hcv',
|
'hcv',
|
||||||
|
@ -703,7 +702,6 @@ def fetch_UCIMulticlassLabelledCollection(dataset_name, data_home=None, min_clas
|
||||||
'room': 864,
|
'room': 864,
|
||||||
'phishing2': 379,
|
'phishing2': 379,
|
||||||
'rt-iot22': 942,
|
'rt-iot22': 942,
|
||||||
'support2': 880,
|
|
||||||
'image_seg': 147,
|
'image_seg': 147,
|
||||||
'steel_plates': 198,
|
'steel_plates': 198,
|
||||||
'hcv': 503,
|
'hcv': 503,
|
||||||
|
@ -737,7 +735,6 @@ def fetch_UCIMulticlassLabelledCollection(dataset_name, data_home=None, min_clas
|
||||||
'room': 'Room Occupancy Estimation',
|
'room': 'Room Occupancy Estimation',
|
||||||
'phishing2': 'Website Phishing',
|
'phishing2': 'Website Phishing',
|
||||||
'rt-iot22': 'RT-IoT2022',
|
'rt-iot22': 'RT-IoT2022',
|
||||||
'support2': 'SUPPORT2',
|
|
||||||
'image_seg': 'Statlog (Image Segmentation)',
|
'image_seg': 'Statlog (Image Segmentation)',
|
||||||
'steel_plates': 'Steel Plates Faults',
|
'steel_plates': 'Steel Plates Faults',
|
||||||
'hcv': 'Hepatitis C Virus (HCV) for Egyptian patients',
|
'hcv': 'Hepatitis C Virus (HCV) for Egyptian patients',
|
||||||
|
@ -753,17 +750,25 @@ def fetch_UCIMulticlassLabelledCollection(dataset_name, data_home=None, min_clas
|
||||||
|
|
||||||
def download(id, name):
|
def download(id, name):
|
||||||
df = fetch_ucirepo(id=id)
|
df = fetch_ucirepo(id=id)
|
||||||
|
|
||||||
|
|
||||||
df.data.features = pd.get_dummies(df.data.features, drop_first=True)
|
df.data.features = pd.get_dummies(df.data.features, drop_first=True)
|
||||||
|
|
||||||
X, y = df.data.features.to_numpy(), df.data.targets.to_numpy().squeeze()
|
X, y = df.data.features.to_numpy(), df.data.targets.to_numpy().squeeze()
|
||||||
# classes represented as arrays are transformed to tuples to treat them as single objects
|
|
||||||
if name == 'support2':
|
with open(f"var/{name}_Xy.txt", "w") as f:
|
||||||
y[:, 2] = np.fromiter((str(elm) for elm in y[:, 2]), dtype='object')
|
for row in X:
|
||||||
raise ValueError('this is support 2')
|
f.write(str(row) + "\n")
|
||||||
|
f.write("\n\n")
|
||||||
|
if y.ndim > 1:
|
||||||
|
unique_y = np.unique(np.fromiter((tuple(elm) for elm in y), dtype='object'))
|
||||||
|
else:
|
||||||
|
unique_y = np.unique(y)
|
||||||
|
f.write(str(unique_y) + "\n\n")
|
||||||
|
for row in y:
|
||||||
|
f.write(str(row) + "\n")
|
||||||
|
|
||||||
if y.ndim > 1:
|
if y.ndim > 1:
|
||||||
y = np.fromiter((tuple(elm) for elm in y), dtype='object')
|
|
||||||
raise ValueError('more than one y')
|
raise ValueError('more than one y')
|
||||||
|
|
||||||
classes = np.sort(np.unique(y))
|
classes = np.sort(np.unique(y))
|
||||||
|
|
Loading…
Reference in New Issue