# Mirror of https://github.com/aladdinpersson/Machine-Learning-Collection.git
# Synced 2026-02-21 11:18:01 +00:00 (Python, 55 lines, 1.3 KiB)
import csv
import os
import random
import shutil

# Split the ISIC images into train / validation / test folders.
#
# Reads "ISIC/labels.csv" (first line is a header; column 0 is the image name
# without extension, column 1 is a numeric label: 0 = benign, 1 = malignant),
# assigns every row to a split at random (roughly 80% train, 10% validation,
# 10% test) and copies the matching .jpg into
# "data/<split>/<benign|malignant>/".

seed = 1
random.seed(seed)  # fixed seed so the same rows land in the same split each run

directory = "ISIC/images/"
train = "data/train/"
test = "data/test/"
validation = "data/validation/"

# exist_ok=True lets the script be re-run without failing on folders that a
# previous run already created.
for split_dir in (train, test, validation):
    for class_dir in ("benign/", "malignant/"):
        os.makedirs(split_dir + class_dir, exist_ok=True)

test_examples = train_examples = validation_examples = 0

# Integer label from the CSV -> class sub-folder.
class_dirs = {0: "benign/", 1: "malignant/"}

# newline="" is what the csv module expects for files handed to csv.reader.
with open("ISIC/labels.csv", newline="") as labels_file:
    rows = csv.reader(labels_file)
    next(rows, None)  # skip the header line

    for row in rows:
        if len(row) < 2:
            # Blank or truncated line: nothing to copy.
            continue

        img_file, benign_malign = row[0], row[1]

        # Drawn for every data row, before the label is inspected, so the
        # split assignment of each row does not depend on other rows' labels.
        random_num = random.random()

        # Labels are stored as floats ("0.0" / "1.0"), hence int(float(...)).
        # A non-numeric label still raises ValueError, as it did before.
        class_dir = class_dirs.get(int(float(benign_malign)))
        if class_dir is None:
            # Unknown label: no file is copied, so the row is not counted.
            continue

        if random_num < 0.8:
            location = train
            train_examples += 1
        elif random_num < 0.9:
            location = validation
            validation_examples += 1
        else:
            location = test
            test_examples += 1

        shutil.copy(
            directory + img_file + ".jpg",
            location + class_dir + img_file + ".jpg",
        )

print(f"Number of training examples {train_examples}")
print(f"Number of test examples {test_examples}")
print(f"Number of validation examples {validation_examples}")