# split_dataset.py
import os
from shutil import copyfile
def split_fixed_test_count(dataset='fma_final/', trainset='fma_train/',
                           testset='fma_test/', test_count=1000):
    """Copy a fixed number of files per class folder to test, the rest to train.

    Every immediate subdirectory of ``dataset`` is treated as one class
    folder.  A subdirectory of the same name is created under both
    ``trainset`` and ``testset``; the first ``test_count`` files (in sorted
    name order) are copied to the test folder and all remaining files are
    copied to the train folder.  Source files are copied, never moved.

    This function is not called at import time or when the script is run;
    it has to be invoked explicitly.

    Args:
        dataset: Directory containing one subdirectory per class.
        trainset: Output root for the training copies.
        testset: Output root for the test copies.
        test_count: Number of files per class folder sent to ``testset``.

    Returns:
        A dict mapping each class folder name to a
        ``(train_file_count, test_file_count)`` tuple.

    Raises:
        OSError: If ``dataset`` cannot be listed or a copy fails.
    """
    counts = {}
    # os.listdir returns entries in arbitrary order; sorting makes the split
    # reproducible from one run (and one machine) to the next.
    for class_name in sorted(os.listdir(dataset)):
        source_dir = os.path.join(dataset, class_name)
        if not os.path.isdir(source_dir):
            # A stray file next to the class folders is not a class.
            continue

        train_dir = os.path.join(trainset, class_name)
        test_dir = os.path.join(testset, class_name)
        # exist_ok lets the split be re-run over a partially populated output
        # tree; makedirs also creates the output roots when they are missing.
        os.makedirs(train_dir, exist_ok=True)
        os.makedirs(test_dir, exist_ok=True)

        file_names = sorted(
            name for name in os.listdir(source_dir)
            if os.path.isfile(os.path.join(source_dir, name))
        )
        for index, file_name in enumerate(file_names):
            target_dir = test_dir if index < test_count else train_dir
            copyfile(os.path.join(source_dir, file_name),
                     os.path.join(target_dir, file_name))

        test_total = max(0, min(test_count, len(file_names)))
        counts[class_name] = (len(file_names) - test_total, test_total)
    return counts
def split_by_ratio(dataset='fma_medium_final/', trainset='fma_medium_train/',
                   testset='fma_medium_test/', train_percent=80):
    """Copy each class folder's files into train/test sets by percentage.

    Every immediate subdirectory of ``dataset`` is treated as one class
    folder.  A subdirectory of the same name is created under both
    ``trainset`` and ``testset``; the first ``train_percent`` percent of the
    files (in sorted name order, rounded down) are copied to the train
    folder and the remainder to the test folder.  Source files are copied,
    never moved.  A progress line is printed after each class folder.

    This function is not called at import time or when the script is run;
    it has to be invoked explicitly.

    Args:
        dataset: Directory containing one subdirectory per class.
        trainset: Output root for the training copies.
        testset: Output root for the test copies.
        train_percent: Percentage (0-100) of each class folder's files that
            goes to ``trainset``.

    Returns:
        A dict mapping each class folder name to a
        ``(train_file_count, test_file_count)`` tuple.

    Raises:
        ValueError: If ``train_percent`` is outside 0-100.
        OSError: If ``dataset`` cannot be listed or a copy fails.
    """
    if not 0 <= train_percent <= 100:
        raise ValueError('train_percent must be between 0 and 100')

    # os.listdir returns entries in arbitrary order; sorting makes the split
    # reproducible.  Stray files next to the class folders are ignored.
    class_names = sorted(
        name for name in os.listdir(dataset)
        if os.path.isdir(os.path.join(dataset, name))
    )

    counts = {}
    for n, class_name in enumerate(class_names, start=1):
        source_dir = os.path.join(dataset, class_name)
        train_dir = os.path.join(trainset, class_name)
        test_dir = os.path.join(testset, class_name)
        # exist_ok lets the split be re-run over an existing output tree.
        os.makedirs(train_dir, exist_ok=True)
        os.makedirs(test_dir, exist_ok=True)

        # List the folder once; the same list gives both the count and the
        # files to copy.
        file_names = sorted(
            name for name in os.listdir(source_dir)
            if os.path.isfile(os.path.join(source_dir, name))
        )
        # Integer arithmetic with a zero-based index: exactly train_count
        # files land in train.  (Comparing a one-based index with a strict
        # "<" would put one file too few in the training set.)
        train_count = int(len(file_names) * train_percent // 100)
        for index, file_name in enumerate(file_names):
            target_dir = train_dir if index < train_count else test_dir
            copyfile(os.path.join(source_dir, file_name),
                     os.path.join(target_dir, file_name))

        counts[class_name] = (train_count, len(file_names) - train_count)
        print('Folder ' + str(n) + ' completed! \n')
    return counts