# Training / data configuration constants.
#
# This module only defines module-level settings; nothing here performs I/O.
# Meanings that are not evident from the values themselves are marked as
# assumptions, because the code that consumes these names is not in this file.

# --- Run environment -------------------------------------------------------
gpu = '0'  # kept as a string; presumably a CUDA device id -- confirm at use site
random_seed = 0

# --- Dataset selection and derived list files ------------------------------
# `data_type` is interpolated into the list-file paths and the weight prefix
# below, so changing it here changes all three derived values.
data_type = 'phonemes'
video_path = 'lip/'
train_list = f'data/{data_type}_train.txt'
val_list = f'data/{data_type}_val.txt'
anno_path = 'GRID_align_txt'

# --- Sequence padding ------------------------------------------------------
# Presumably the padded lengths for video frames and label sequences -- confirm.
vid_padding = 75
txt_padding = 200

# --- Optimisation / training loop ------------------------------------------
batch_size = 16
base_lr = 2e-5
num_workers = 8
max_epoch = 10000
# NOTE(review): `display` and `test_step` look like logging / evaluation
# intervals; the unit (iterations vs. epochs) is not visible from here.
display = 10
test_step = 1000
save_prefix = f'weights/LipNet_{data_type}'
is_optimize = True


# --- Experiment identity and model variants --------------------------------
run_name = 'phonemes-nopre'
# NOTE(review): the variable is spelled `lsr2_dir` while the directory it
# points at is named `LRS2`. The name is kept as-is so existing references to
# it keep working. The path is absolute and machine-specific.
lsr2_dir = '/media/milselarch/47FC4BC577667AAD/LRS2'
pre_gru_repeats = 2
frame_doubling = False


# --- GRID dataset directories ----------------------------------------------
video_dir = 'lip/GRID'
audio_dir = 'lip/GRID_wavs'
alignments_dir = 'lip/GRID_aligns'
crop_images_dir = 'lip/GRID_lips'
# Alias: `images_dir` is bound to the same value as `crop_images_dir`.
images_dir = crop_images_dir
dataset = 'GRID'


# --- Phoneme data and loading behaviour ------------------------------------
phonemes_dir = 'lip/GRID_phonemes'
cache_videos = False
use_lip_crops = True


# --- Character maps --------------------------------------------------------
# Both values are plain string selectors; how they are resolved is decided by
# the consuming code, which is not shown here.
text_char_map = 'letters'
char_map = 'phonemes'