Spaces:
Running
Running
Delete train_val_divide.py
Browse files- train_val_divide.py +0 -18
train_val_divide.py
DELETED
|
@@ -1,18 +0,0 @@
|
|
| 1 |
-
import os
|
| 2 |
-
import numpy as np
|
| 3 |
-
# Randomly divide the lines of a '|'-delimited list file into a training
# file and a validation file written next to the input.
# Each line is assigned independently: it goes to the training file with
# probability `train_split_ratio`, otherwise to the validation file, so the
# resulting sizes only approximate that ratio.
# NOTE(review): the name `filepaths_and_text` suggests each line is
# "audio path|transcript"; the script itself does not depend on that.
filename = 'E:/uma_voice/output.txt'
split = '|'
with open(filename, encoding='utf-8') as f:
    filepaths_and_text = [line.strip().split(split) for line in f]

# splitext removes only the final extension, so dots elsewhere in the path
# (e.g. './data/list.txt' or 'v1.2/list.txt') no longer truncate the name.
base_filename = os.path.splitext(filename)[0]
train_filename = base_filename + '_train' + '.txt'
val_filename = base_filename + '_val' + '.txt'

train_split_ratio = 0.99
# Context managers guarantee both outputs are flushed and closed, even if
# writing fails part-way through.
with open(train_filename, 'w', encoding='utf-8') as train_f, \
        open(val_filename, 'w', encoding='utf-8') as val_f:
    for fields in filepaths_and_text:
        # Exactly one random draw per input line, in input order, so a
        # seeded run assigns lines the same way as before.
        target_f = train_f if np.random.rand() < train_split_ratio else val_f
        target_f.write(split.join(fields) + '\n')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|