class CONFIG:
    """Static, namespace-style project configuration.

    Settings are plain class attributes grouped into nested classes and are
    read by attribute access, e.g. ``CONFIG.TRAIN.lr`` or
    ``CONFIG.DATA.EVAL.packet_size``.  Nothing here needs to be instantiated.

    The code that consumes these values lives outside this file, so the
    per-field notes below that go beyond the literal value are inferred from
    names and are explicitly marked as assumptions to confirm.
    """

    # Comma-separated device ids kept as one string.
    # NOTE(review): presumably GPU indices handed to the trainer — confirm.
    gpus = "0,1"

    class TRAIN:
        """Training-loop hyperparameters."""

        batch_size = 90
        lr = 1e-4  # presumably the initial learning rate — confirm
        epochs = 150
        workers = 12  # presumably data-loader worker count — confirm
        val_split = 0.1  # presumably the fraction held out for validation — confirm
        clipping_val = 1.0  # presumably a gradient-clipping threshold — confirm
        # NOTE(review): `patience` / `factor` look like learning-rate scheduler
        # settings (wait N epochs, then scale lr by `factor`) — confirm.
        patience = 3
        factor = 0.5

    class MODEL:
        """Network size settings.

        NOTE(review): the ``enc_`` / ``pred_`` prefixes suggest an encoder and
        a predictor sub-module; the exact meaning of each dimension is defined
        by the model code — confirm there.
        """

        enc_layers = 4
        enc_in_dim = 384
        enc_dim = 768
        pred_dim = 512
        pred_layers = 1

    class DATA:
        """Dataset selection, file locations and audio framing parameters."""

        # Key into `data_dir` selecting the active dataset (validated below).
        dataset = 'vctk'

        # Dictionary that specifies the paths to the root directory and the
        # train/test text files of each dataset.  'root' is the path to the
        # dataset, and each line of the train.txt/test.txt files should contain
        # the path to an audio file relative to 'root'.
        data_dir = {'vctk': {'root': 'data/vctk/wav48',
                             'train': "data/vctk/train.txt",
                             'test': "data/vctk/test.txt"},
                    }

        # Explicit raise rather than `assert`: assertions are stripped when
        # Python runs with -O, which would let an unknown dataset key through.
        if dataset not in data_dir:
            raise ValueError('Unknown dataset.')

        sr = 48000  # presumably the audio sampling rate in Hz — confirm
        # NOTE(review): presumably the length, in samples, of the excerpt taken
        # from each audio file — confirm against the dataset loader.
        audio_chunk_len = 122880
        window_size = 960  # same value as EVAL.packet_size below
        stride = 480  # exactly half of window_size

        class TRAIN:
            """Packet-loss simulation settings used for training data."""

            # Every size listed here divides `audio_chunk_len` (122880) evenly.
            # NOTE(review): that looks like a requirement rather than a
            # coincidence — confirm before adding new sizes.
            packet_sizes = [256, 512, 768, 960, 1024, 1536]
            # NOTE(review): presumably per-state transition probabilities of
            # the loss simulator; the meaning of each pair is defined by the
            # consumer — confirm.
            transition_probs = ((0.9, 0.1), (0.5, 0.1), (0.5, 0.5))

        class EVAL:
            """Packet-loss settings used for evaluation."""

            packet_size = 960
            transition_probs = [(0.9, 0.1)]

            # Mask source; only 'gen' and 'real' are accepted.
            # NOTE(review): presumably 'gen' = simulated masks and 'real' =
            # masks read from recorded traces — confirm.
            masking = 'gen'
            # Explicit raise rather than `assert` so the check survives -O.
            if masking not in ('gen', 'real'):
                raise ValueError(
                    "Unknown masking mode %r; expected 'gen' or 'real'." % (masking,))

            # Fixed typo: this was 'lossy_singals', which did not match the
            # 'lossy_signals' directory used by CONFIG.TEST.in_dir.
            # NOTE(review): presumably only read when masking == 'real' — confirm.
            trace_path = 'test_samples/blind/lossy_signals'

    class LOG:
        """Output locations for logs and audio samples."""

        log_dir = 'lightning_logs'
        sample_path = 'audio_samples'

    class TEST:
        """Input and output directories for test-time processing."""

        in_dir = 'test_samples/blind/lossy_signals'
        out_dir = 'test_samples/blind/lossy_signals_out'