paulcho98 commited on
Commit
95231cc
·
verified ·
1 Parent(s): 30b134e

Backup: DF_LORA_T769_8GPU_BS8

Browse files
Files changed (29) hide show
  1. .gitattributes +11 -0
  2. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/config.yaml +192 -0
  3. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/debug-internal.log +145 -0
  4. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/debug.log +19 -0
  5. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/config.yaml +318 -0
  6. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/output.log +61 -0
  7. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/requirements.txt +417 -0
  8. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/wandb-metadata.json +102 -0
  9. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/wandb-summary.json +1 -0
  10. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/logs/debug-internal.log +24 -0
  11. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/logs/debug.log +21 -0
  12. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/run-w9xbjand.wandb +0 -0
  13. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_122daebb61ef6826b8de.mp4 +3 -0
  14. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_479372da7ed9e768cc22.mp4 +3 -0
  15. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_509f08fac994ab8cebb6.mp4 +3 -0
  16. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_5d1790cb2d9c8554b75b.mp4 +3 -0
  17. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_81b3c24ab2930c8fd6c1.mp4 +3 -0
  18. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_8495e04002c0da67769b.mp4 +3 -0
  19. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_88d3eab6ac986b51e272.mp4 +3 -0
  20. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_8bcc788bab53b0c99f6b.mp4 +3 -0
  21. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_962d9fe735e704d64274.mp4 +3 -0
  22. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_b38481beb241c6eca7c1.mp4 +3 -0
  23. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/output.log +74 -0
  24. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/requirements.txt +417 -0
  25. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/wandb-metadata.json +104 -0
  26. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/logs/debug-internal.log +145 -0
  27. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/logs/debug.log +19 -0
  28. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/run-aogal2qe.wandb +3 -0
  29. DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb_id.txt +1 -0
.gitattributes CHANGED
@@ -1897,3 +1897,14 @@ hyunbin_FastGen-redmd/FASTGEN_OUTPUT_FULL_FT_4STEP_NO_REWARD/OmniAvatar-FastGen/
1897
  hyunbin_FastGen-redmd/FASTGEN_OUTPUT_FULL_FT_4STEP_NO_REWARD/OmniAvatar-FastGen/omniavatar_sf_full_ft/sf_full_ft_4step_no_reward/wandb/run-20260503_124619-71vuvjwo/files/media/videos/val0/reconstructed_600_f5463a4ea6f68a39c5d0.mp4 filter=lfs diff=lfs merge=lfs -text
1898
  hyunbin_FastGen-redmd/FASTGEN_OUTPUT_FULL_FT_4STEP_NO_REWARD/OmniAvatar-FastGen/omniavatar_sf_full_ft/sf_full_ft_4step_no_reward/wandb/run-20260503_124619-71vuvjwo/files/media/videos/val0/reconstructed_600_f7412c9e170ffd299748.mp4 filter=lfs diff=lfs merge=lfs -text
1899
  hyunbin_FastGen-redmd/FASTGEN_OUTPUT_FULL_FT_4STEP_NO_REWARD/OmniAvatar-FastGen/omniavatar_sf_full_ft/sf_full_ft_4step_no_reward/wandb/run-20260503_124619-71vuvjwo/run-71vuvjwo.wandb filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
1897
  hyunbin_FastGen-redmd/FASTGEN_OUTPUT_FULL_FT_4STEP_NO_REWARD/OmniAvatar-FastGen/omniavatar_sf_full_ft/sf_full_ft_4step_no_reward/wandb/run-20260503_124619-71vuvjwo/files/media/videos/val0/reconstructed_600_f5463a4ea6f68a39c5d0.mp4 filter=lfs diff=lfs merge=lfs -text
1898
  hyunbin_FastGen-redmd/FASTGEN_OUTPUT_FULL_FT_4STEP_NO_REWARD/OmniAvatar-FastGen/omniavatar_sf_full_ft/sf_full_ft_4step_no_reward/wandb/run-20260503_124619-71vuvjwo/files/media/videos/val0/reconstructed_600_f7412c9e170ffd299748.mp4 filter=lfs diff=lfs merge=lfs -text
1899
  hyunbin_FastGen-redmd/FASTGEN_OUTPUT_FULL_FT_4STEP_NO_REWARD/OmniAvatar-FastGen/omniavatar_sf_full_ft/sf_full_ft_4step_no_reward/wandb/run-20260503_124619-71vuvjwo/run-71vuvjwo.wandb filter=lfs diff=lfs merge=lfs -text
1900
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_122daebb61ef6826b8de.mp4 filter=lfs diff=lfs merge=lfs -text
1901
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_479372da7ed9e768cc22.mp4 filter=lfs diff=lfs merge=lfs -text
1902
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_509f08fac994ab8cebb6.mp4 filter=lfs diff=lfs merge=lfs -text
1903
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_5d1790cb2d9c8554b75b.mp4 filter=lfs diff=lfs merge=lfs -text
1904
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_81b3c24ab2930c8fd6c1.mp4 filter=lfs diff=lfs merge=lfs -text
1905
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_8495e04002c0da67769b.mp4 filter=lfs diff=lfs merge=lfs -text
1906
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_88d3eab6ac986b51e272.mp4 filter=lfs diff=lfs merge=lfs -text
1907
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_8bcc788bab53b0c99f6b.mp4 filter=lfs diff=lfs merge=lfs -text
1908
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_962d9fe735e704d64274.mp4 filter=lfs diff=lfs merge=lfs -text
1909
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_b38481beb241c6eca7c1.mp4 filter=lfs diff=lfs merge=lfs -text
1910
+ DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/run-aogal2qe.wandb filter=lfs diff=lfs merge=lfs -text
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/config.yaml ADDED
@@ -0,0 +1,192 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dataloader_train:
2
+ _target_: <class 'fastgen.datasets.omniavatar_dataloader.OmniAvatarDataLoader'>
3
+ batch_size: '8'
4
+ data_list_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_path.txt
5
+ latentsync_mask_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/mask.png
6
+ load_ode_path: 'False'
7
+ neg_text_emb_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt
8
+ num_workers: '4'
9
+ use_ref_sequence: 'True'
10
+ dataloader_val:
11
+ _target_: <function create_omniavatar_dataloader at 0x7f9e8dc118a0>
12
+ batch_size: '1'
13
+ data_list_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_val10.txt
14
+ latentsync_mask_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/mask.png
15
+ load_ode_path: 'False'
16
+ neg_text_emb_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt
17
+ num_workers: '2'
18
+ use_ref_sequence: 'True'
19
+ eval:
20
+ max_ckpt: '100000000'
21
+ min_ckpt: '0'
22
+ num_samples: '50000'
23
+ samples_dir: samples
24
+ save_images: 'False'
25
+ log_config:
26
+ group: omniavatar_df_audiofix
27
+ name: df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter
28
+ project: OmniAvatar-FastGen
29
+ wandb_credential: ./credentials/wandb_api.txt
30
+ wandb_entity: paulhcho
31
+ wandb_mode: online
32
+ model:
33
+ add_teacher_to_fsdp_dict: 'True'
34
+ context_noise: '0.0'
35
+ ddp_find_unused_parameters: 'True'
36
+ device: cuda
37
+ enable_preprocessors: 'True'
38
+ fake_score_net: null
39
+ fsdp_meta_init: 'False'
40
+ grad_scaler_enabled: 'False'
41
+ grad_scaler_growth_interval: '2000'
42
+ grad_scaler_init_scale: '65536.0'
43
+ guidance_scale: null
44
+ input_shape:
45
+ - '16'
46
+ - '21'
47
+ - '64'
48
+ - '64'
49
+ load_student_weights: 'True'
50
+ net:
51
+ _target_: <class 'fastgen.networks.OmniAvatar.network_causal.CausalOmniAvatarWan'>
52
+ audio_hidden_size: '32'
53
+ base_model_paths: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/diffusion_pytorch_model.safetensors
54
+ chunk_size: '3'
55
+ in_dim: '65'
56
+ lora_alpha: '64'
57
+ lora_rank: '128'
58
+ merge_lora: 'False'
59
+ mode: v2v
60
+ model_size: 1.3B
61
+ net_pred_type: flow
62
+ omniavatar_ckpt_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data_checkpoints/1.3B-step-1000.pt
63
+ schedule_type: rf
64
+ stochastic_attn_configs:
65
+ - local_attn_size: '7'
66
+ sink_size: '1'
67
+ weight: '0.2'
68
+ - local_attn_size: '10'
69
+ sink_size: '1'
70
+ weight: '0.2'
71
+ - local_attn_size: '13'
72
+ sink_size: '1'
73
+ weight: '0.2'
74
+ - local_attn_size: '9'
75
+ sink_size: '3'
76
+ weight: '0.2'
77
+ - local_attn_size: '12'
78
+ sink_size: '3'
79
+ weight: '0.2'
80
+ total_num_frames: '21'
81
+ unfreeze_modules:
82
+ - _core.audio_proj
83
+ - _core.audio_cond_projs
84
+ - _core.patch_embedding
85
+ use_audio: 'True'
86
+ use_dynamic_rope: 'False'
87
+ net_optimizer:
88
+ _target_: <function get_optimizer at 0x7f9e90111940>
89
+ betas:
90
+ - '0.9'
91
+ - '0.999'
92
+ eps: 1e-08
93
+ fused: 'False'
94
+ lr: 1e-05
95
+ model: null
96
+ optim_type: adamw
97
+ weight_decay: '0.01'
98
+ net_scheduler:
99
+ _target_: <class 'fastgen.utils.lr_scheduler.LambdaLinearScheduler'>
100
+ cycle_lengths:
101
+ - '10000000000'
102
+ f_max:
103
+ - '1.0'
104
+ f_min:
105
+ - '1.0'
106
+ f_start:
107
+ - 1e-06
108
+ warm_up_steps:
109
+ - '0'
110
+ precision: bfloat16
111
+ precision_amp: null
112
+ precision_amp_enc: null
113
+ precision_amp_infer: null
114
+ precision_fsdp: float32
115
+ pretrained_model_path: ''
116
+ pretrained_student_net_path: ''
117
+ sample_t_cfg:
118
+ log_t_df: '0.01'
119
+ max_t: '0.999'
120
+ min_t: '0.001'
121
+ shift: '5.0'
122
+ t_list:
123
+ - '0.999'
124
+ - '0.769'
125
+ - '0.0'
126
+ time_dist_type: shifted
127
+ train_p_mean: '-1.1'
128
+ train_p_std: '2.0'
129
+ skip_layers: null
130
+ student_sample_steps: '2'
131
+ student_sample_type: sde
132
+ teacher: null
133
+ timestep_cfg:
134
+ enabled: 'False'
135
+ t_hi: '1.0'
136
+ t_lo: '0.0'
137
+ use_ema: 'False'
138
+ vae_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/Wan2.1_VAE.pth
139
+ model_class:
140
+ _target_: <class 'fastgen.methods.omniavatar_diffusion_forcing.OmniAvatarDiffusionForcingModel'>
141
+ config: null
142
+ trainer:
143
+ augment_pipe: null
144
+ batch_size_global: null
145
+ callbacks:
146
+ gpu_stats:
147
+ _target_: <class 'fastgen.callbacks.gpu_stats.GPUStatsCallback'>
148
+ every_n: '100'
149
+ grad_clip:
150
+ _target_: <class 'fastgen.callbacks.grad_clip.GradClipCallback'>
151
+ grad_norm: '10.0'
152
+ model_key: net
153
+ param_count:
154
+ _target_: <class 'fastgen.callbacks.param_count.ParamCountCallback'>
155
+ train_profiler:
156
+ _target_: <class 'fastgen.callbacks.train_profiler.TrainProfilerCallback'>
157
+ every_n: '100'
158
+ wandb:
159
+ _target_: <class 'fastgen.callbacks.wandb.WandbCallback'>
160
+ fps: '25'
161
+ sample_logging_iter: '500'
162
+ checkpointer:
163
+ pretrained_ckpt_key_map:
164
+ net: net
165
+ pretrained_ckpt_path: ''
166
+ s3_container: s3://checkpoints/fastgen
167
+ s3_credential: ./credentials/s3.json
168
+ save_dir: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/checkpoints
169
+ use_s3: 'False'
170
+ cudnn:
171
+ benchmark: 'True'
172
+ deterministic: 'False'
173
+ ddp: 'True'
174
+ fsdp: 'False'
175
+ fsdp_cpu_offload: 'False'
176
+ fsdp_min_num_params: '10000000'
177
+ fsdp_sharding_group_size: null
178
+ global_vars: null
179
+ global_vars_val:
180
+ - null
181
+ grad_accum_rounds: '1'
182
+ logging_iter: '1'
183
+ max_iter: '5000'
184
+ offload_module_in_decoding: 'False'
185
+ resume: 'False'
186
+ save_ckpt_iter: '500'
187
+ seed: '0'
188
+ skip_initial_validation: 'True'
189
+ tf32_enabled: 'True'
190
+ val_seed: null
191
+ validation_iter: '500'
192
+ visualize_teacher: 'False'
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/debug-internal.log ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-30T23:05:47.717661886+09:00","level":"INFO","msg":"wandb-core"}
2
+ {"time":"2026-04-30T23:05:47.719875838+09:00","level":"INFO","msg":"stream: starting","core version":"0.25.1"}
3
+ {"time":"2026-04-30T23:05:48.202102105+09:00","level":"INFO","msg":"stream: created new stream","id":"aogal2qe"}
4
+ {"time":"2026-04-30T23:05:48.202176404+09:00","level":"INFO","msg":"handler: started"}
5
+ {"time":"2026-04-30T23:05:48.203751244+09:00","level":"INFO","msg":"stream: started"}
6
+ {"time":"2026-04-30T23:05:48.203784235+09:00","level":"INFO","msg":"sender: started"}
7
+ {"time":"2026-04-30T23:05:48.203780548+09:00","level":"INFO","msg":"writer: started","stream_id":"aogal2qe"}
8
+ {"time":"2026-04-30T23:05:49.289209394+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"console_offset":0,"console_lines":1}
9
+ {"time":"2026-04-30T23:05:49.628819533+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
10
+ {"time":"2026-04-30T23:06:04.28911266+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":0,"events_lines":2,"console_offset":0,"console_lines":19,"uploaded_len":2}
11
+ {"time":"2026-04-30T23:06:04.68488743+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
12
+ {"time":"2026-04-30T23:06:19.28947862+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":2,"events_lines":2}
13
+ {"time":"2026-04-30T23:06:19.593106092+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
14
+ {"time":"2026-04-30T23:06:34.289531575+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":4,"events_lines":2}
15
+ {"time":"2026-04-30T23:06:34.638885012+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
16
+ {"time":"2026-04-30T23:06:49.289408032+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":6,"events_lines":2,"console_offset":19,"console_lines":1}
17
+ {"time":"2026-04-30T23:06:49.55441404+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
18
+ {"time":"2026-04-30T23:07:04.2893822+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":8,"events_lines":2}
19
+ {"time":"2026-04-30T23:07:04.547174503+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
20
+ {"time":"2026-04-30T23:07:19.289556072+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":10,"events_lines":2}
21
+ {"time":"2026-04-30T23:07:19.542062737+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
22
+ {"time":"2026-04-30T23:07:34.289675411+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":12,"events_lines":2,"console_offset":20,"console_lines":29}
23
+ {"time":"2026-04-30T23:07:34.590652485+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
24
+ {"time":"2026-04-30T23:07:49.289694092+09:00","level":"INFO","msg":"filestream: sending request","total_files":3,"events_offset":14,"events_lines":2,"console_offset":49,"console_lines":9,"uploaded_len":10}
25
+ {"time":"2026-04-30T23:07:49.578907428+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
26
+ {"time":"2026-04-30T23:08:04.289321845+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":16,"events_lines":2,"console_offset":58,"console_lines":3}
27
+ {"time":"2026-04-30T23:08:04.654848542+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
28
+ {"time":"2026-04-30T23:08:19.302053487+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":18,"events_lines":2,"console_offset":61,"console_lines":10}
29
+ {"time":"2026-04-30T23:08:19.606327435+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
30
+ {"time":"2026-04-30T23:08:34.288993064+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":20,"events_lines":2}
31
+ {"time":"2026-04-30T23:08:34.57863+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
32
+ {"time":"2026-04-30T23:08:49.289673912+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":22,"events_lines":2}
33
+ {"time":"2026-04-30T23:08:49.597082041+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
34
+ {"time":"2026-04-30T23:09:04.289440794+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":24,"events_lines":2}
35
+ {"time":"2026-04-30T23:09:04.62933334+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
36
+ {"time":"2026-04-30T23:09:19.289512374+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":26,"events_lines":2}
37
+ {"time":"2026-04-30T23:09:19.579604059+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
38
+ {"time":"2026-04-30T23:09:34.288965379+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":28,"events_lines":2}
39
+ {"time":"2026-04-30T23:09:34.594544765+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
40
+ {"time":"2026-04-30T23:09:49.288782859+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":30,"events_lines":2}
41
+ {"time":"2026-04-30T23:09:49.612205294+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
42
+ {"time":"2026-04-30T23:10:04.289135035+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":32,"events_lines":2}
43
+ {"time":"2026-04-30T23:10:04.630551549+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
44
+ {"time":"2026-04-30T23:10:19.288780712+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":34,"events_lines":2}
45
+ {"time":"2026-04-30T23:10:19.682644618+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
46
+ {"time":"2026-04-30T23:10:34.289481389+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":36,"events_lines":2}
47
+ {"time":"2026-04-30T23:10:34.647039103+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
48
+ {"time":"2026-04-30T23:10:49.289265985+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":38,"events_lines":2}
49
+ {"time":"2026-04-30T23:10:49.730743901+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
50
+ {"time":"2026-04-30T23:11:04.289172039+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":40,"events_lines":2}
51
+ {"time":"2026-04-30T23:11:04.731077132+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
52
+ {"time":"2026-04-30T23:11:19.289448884+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":42,"events_lines":2}
53
+ {"time":"2026-04-30T23:11:19.667453476+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
54
+ {"time":"2026-04-30T23:11:34.289592911+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":44,"events_lines":2}
55
+ {"time":"2026-04-30T23:11:34.668128144+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
56
+ {"time":"2026-04-30T23:11:49.288778693+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":46,"events_lines":2}
57
+ {"time":"2026-04-30T23:11:49.644035721+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
58
+ {"time":"2026-04-30T23:12:04.289349786+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":48,"events_lines":2}
59
+ {"time":"2026-04-30T23:12:04.736082536+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
60
+ {"time":"2026-04-30T23:12:19.288945368+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":50,"events_lines":2}
61
+ {"time":"2026-04-30T23:12:19.610329497+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
62
+ {"time":"2026-04-30T23:12:34.289571483+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":52,"events_lines":2}
63
+ {"time":"2026-04-30T23:12:34.587850694+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
64
+ {"time":"2026-04-30T23:12:49.288764613+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":54,"events_lines":2}
65
+ {"time":"2026-04-30T23:12:49.719622981+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
66
+ {"time":"2026-04-30T23:13:04.288637224+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":56,"events_lines":2}
67
+ {"time":"2026-04-30T23:13:04.582812338+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
68
+ {"time":"2026-04-30T23:13:19.289301406+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":58,"events_lines":2}
69
+ {"time":"2026-04-30T23:13:19.553204842+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
70
+ {"time":"2026-04-30T23:13:34.289451588+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":60,"events_lines":2}
71
+ {"time":"2026-04-30T23:13:34.534556354+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
72
+ {"time":"2026-04-30T23:13:49.288622643+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":62,"events_lines":2}
73
+ {"time":"2026-04-30T23:13:49.595316475+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
74
+ {"time":"2026-04-30T23:14:04.289144412+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":64,"events_lines":2}
75
+ {"time":"2026-04-30T23:14:04.543244073+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
76
+ {"time":"2026-04-30T23:14:19.288823516+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":66,"events_lines":2}
77
+ {"time":"2026-04-30T23:14:19.571833716+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
78
+ {"time":"2026-04-30T23:14:34.289509199+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":68,"events_lines":2}
79
+ {"time":"2026-04-30T23:14:34.579585848+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
80
+ {"time":"2026-04-30T23:14:49.288824765+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":70,"events_lines":2}
81
+ {"time":"2026-04-30T23:14:49.612924595+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
82
+ {"time":"2026-04-30T23:15:04.2892304+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":72,"events_lines":2}
83
+ {"time":"2026-04-30T23:15:04.566368977+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
84
+ {"time":"2026-04-30T23:15:19.288719459+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":74,"events_lines":2}
85
+ {"time":"2026-04-30T23:15:19.609636252+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
86
+ {"time":"2026-04-30T23:15:34.289310014+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":76,"events_lines":2}
87
+ {"time":"2026-04-30T23:15:34.584427145+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
88
+ {"time":"2026-04-30T23:15:49.288956977+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":78,"events_lines":2}
89
+ {"time":"2026-04-30T23:15:49.614829139+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
90
+ {"time":"2026-04-30T23:16:04.289218328+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":80,"events_lines":2}
91
+ {"time":"2026-04-30T23:16:04.60993107+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
92
+ {"time":"2026-04-30T23:16:19.289171247+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":82,"events_lines":2,"console_offset":71,"console_lines":3}
93
+ {"time":"2026-04-30T23:16:19.628814484+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
94
+ {"time":"2026-04-30T23:16:34.288676582+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":84,"events_lines":2}
95
+ {"time":"2026-04-30T23:16:34.689081134+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
96
+ {"time":"2026-04-30T23:16:49.288933188+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":86,"events_lines":2}
97
+ {"time":"2026-04-30T23:16:49.62914172+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
98
+ {"time":"2026-04-30T23:17:04.288607448+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":88,"events_lines":2}
99
+ {"time":"2026-04-30T23:17:04.589594346+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
100
+ {"time":"2026-04-30T23:17:19.289321381+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":90,"events_lines":2}
101
+ {"time":"2026-04-30T23:17:19.564264059+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
102
+ {"time":"2026-04-30T23:17:34.288994724+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":92,"events_lines":2}
103
+ {"time":"2026-04-30T23:17:34.552863001+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
104
+ {"time":"2026-04-30T23:17:49.289503425+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":94,"events_lines":2}
105
+ {"time":"2026-04-30T23:17:49.588243139+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
106
+ {"time":"2026-04-30T23:18:04.28878216+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":96,"events_lines":2}
107
+ {"time":"2026-04-30T23:18:04.554107868+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
108
+ {"time":"2026-04-30T23:18:19.289179022+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":98,"events_lines":2}
109
+ {"time":"2026-04-30T23:18:19.612210314+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
110
+ {"time":"2026-04-30T23:18:34.288875601+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":100,"events_lines":2}
111
+ {"time":"2026-04-30T23:18:34.581426522+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
112
+ {"time":"2026-04-30T23:18:49.289382733+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":102,"events_lines":2}
113
+ {"time":"2026-04-30T23:18:49.571645992+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
114
+ {"time":"2026-04-30T23:19:04.28863327+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":104,"events_lines":2}
115
+ {"time":"2026-04-30T23:19:04.567218404+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
116
+ {"time":"2026-04-30T23:19:19.288592986+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":106,"events_lines":2}
117
+ {"time":"2026-04-30T23:19:19.559133381+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
118
+ {"time":"2026-04-30T23:19:34.288571933+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":108,"events_lines":2}
119
+ {"time":"2026-04-30T23:19:34.543783797+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
120
+ {"time":"2026-04-30T23:19:49.289279029+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":110,"events_lines":2}
121
+ {"time":"2026-04-30T23:19:49.634365885+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
122
+ {"time":"2026-04-30T23:20:04.288850186+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":112,"events_lines":2}
123
+ {"time":"2026-04-30T23:20:04.569464453+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
124
+ {"time":"2026-04-30T23:20:19.289155372+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":114,"events_lines":2}
125
+ {"time":"2026-04-30T23:20:19.613994616+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
126
+ {"time":"2026-04-30T23:20:34.289328425+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":116,"events_lines":2}
127
+ {"time":"2026-04-30T23:20:34.620516915+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
128
+ {"time":"2026-04-30T23:20:49.288670175+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":118,"events_lines":2}
129
+ {"time":"2026-04-30T23:20:49.701752992+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
130
+ {"time":"2026-04-30T23:21:04.289448285+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":120,"events_lines":2}
131
+ {"time":"2026-04-30T23:21:04.672086777+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
132
+ {"time":"2026-04-30T23:21:19.288957688+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":122,"events_lines":2}
133
+ {"time":"2026-04-30T23:21:19.808028855+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
134
+ {"time":"2026-04-30T23:21:34.289496467+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":124,"events_lines":2}
135
+ {"time":"2026-04-30T23:21:34.598270838+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
136
+ {"time":"2026-04-30T23:21:49.288582737+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":126,"events_lines":2}
137
+ {"time":"2026-04-30T23:21:49.602869427+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
138
+ {"time":"2026-04-30T23:22:04.289027983+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":128,"events_lines":2}
139
+ {"time":"2026-04-30T23:22:04.602488321+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
140
+ {"time":"2026-04-30T23:22:19.288843665+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":130,"events_lines":2}
141
+ {"time":"2026-04-30T23:22:19.590625944+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
142
+ {"time":"2026-04-30T23:22:34.288973354+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":132,"events_lines":2}
143
+ {"time":"2026-04-30T23:22:34.576595162+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
144
+ {"time":"2026-04-30T23:22:49.28941316+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":134,"events_lines":1}
145
+ {"time":"2026-04-30T23:22:49.617243724+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/debug.log ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_setup.py:_flush():81] Current SDK version is 0.25.1
2
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_setup.py:_flush():81] Configure stats pid to 2767876
3
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_setup.py:_flush():81] Loading settings from environment variables
4
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:setup_run_log_directory():717] Logging user logs to /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/logs/debug.log
5
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:setup_run_log_directory():718] Logging internal logs to /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/logs/debug-internal.log
6
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:init():844] calling init triggers
7
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:init():849] wandb.init called with sweep_config: {}
8
+ config: {'log_config': {'project': 'OmniAvatar-FastGen', 'group': 'omniavatar_df_audiofix', 'name': 'df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter', 'wandb_mode': 'online', 'wandb_entity': 'paulhcho', 'wandb_credential': './credentials/wandb_api.txt'}, 'trainer': {'cudnn': {'deterministic': 'False', 'benchmark': 'True'}, 'checkpointer': {'save_dir': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/checkpoints', 'use_s3': 'False', 's3_container': 's3://checkpoints/fastgen', 's3_credential': './credentials/s3.json', 'pretrained_ckpt_path': '', 'pretrained_ckpt_key_map': {'net': 'net'}}, 'callbacks': {'grad_clip': {'grad_norm': '10.0', 'model_key': 'net', '_target_': "<class 'fastgen.callbacks.grad_clip.GradClipCallback'>"}, 'gpu_stats': {'every_n': '100', '_target_': "<class 'fastgen.callbacks.gpu_stats.GPUStatsCallback'>"}, 'train_profiler': {'every_n': '100', '_target_': "<class 'fastgen.callbacks.train_profiler.TrainProfilerCallback'>"}, 'param_count': {'_target_': "<class 'fastgen.callbacks.param_count.ParamCountCallback'>"}, 'wandb': {'sample_logging_iter': '500', 'fps': '25', '_target_': "<class 'fastgen.callbacks.wandb.WandbCallback'>"}}, 'save_ckpt_iter': '500', 'validation_iter': '500', 'skip_initial_validation': 'True', 'logging_iter': '1', 'max_iter': '5000', 'visualize_teacher': 'False', 'seed': '0', 'val_seed': None, 'resume': 'False', 'ddp': 'True', 'fsdp': 'False', 'tf32_enabled': 'True', 'grad_accum_rounds': '1', 'batch_size_global': None, 'offload_module_in_decoding': 'False', 'fsdp_cpu_offload': 'False', 'fsdp_min_num_params': '10000000', 'fsdp_sharding_group_size': None, 'global_vars': None, 'global_vars_val': [None], 'augment_pipe': None}, 'dataloader_train': {'data_list_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_path.txt', 'latentsync_mask_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/mask.png', 'batch_size': '8', 'num_workers': '4', 'neg_text_emb_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt', 'use_ref_sequence': 'True', 'load_ode_path': 'False', '_target_': "<class 'fastgen.datasets.omniavatar_dataloader.OmniAvatarDataLoader'>"}, 'dataloader_val': {'data_list_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_val10.txt', 'latentsync_mask_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/mask.png', 'batch_size': '1', 'num_workers': '2', 'neg_text_emb_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt', 'use_ref_sequence': 'True', 'load_ode_path': 'False', '_target_': '<function create_omniavatar_dataloader at 0x7fa4931818a0>'}, 'eval': {'num_samples': '50000', 'save_images': 'False', 'min_ckpt': '0', 'max_ckpt': '100000000', 'samples_dir': 'samples'}, 'model': {'net': {'model_size': '1.3B', 'in_dim': '65', 'mode': 'v2v', 'use_audio': 'True', 'audio_hidden_size': '32', 'chunk_size': '3', 'total_num_frames': '21', 'base_model_paths': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/diffusion_pytorch_model.safetensors', 'omniavatar_ckpt_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data_checkpoints/1.3B-step-1000.pt', 'net_pred_type': 'flow', 'schedule_type': 'rf', 'use_dynamic_rope': 'False', 'stochastic_attn_configs': [{'local_attn_size': '7', 'sink_size': '1', 'weight': '0.2'}, {'local_attn_size': '10', 'sink_size': '1', 'weight': '0.2'}, {'local_attn_size': '13', 'sink_size': '1', 'weight': '0.2'}, {'local_attn_size': '9', 'sink_size': '3', 'weight': '0.2'}, {'local_attn_size': '12', 'sink_size': '3', 'weight': '0.2'}], '_target_': "<class 'fastgen.networks.OmniAvatar.network_causal.CausalOmniAvatarWan'>", 'merge_lora': 'False', 'unfreeze_modules': ['_core.audio_proj', '_core.audio_cond_projs', '_core.patch_embedding'], 'lora_rank': '128', 'lora_alpha': '64'}, 'teacher': None, 'fake_score_net': None, 'guidance_scale': None, 'timestep_cfg': {'enabled': 'False', 't_lo': '0.0', 't_hi': '1.0'}, 'skip_layers': None, 'net_optimizer': {'model': None, 'optim_type': 'adamw', 'lr': '1e-05', 'weight_decay': '0.01', 'betas': ['0.9', '0.999'], 'eps': '1e-08', 'fused': 'False', '_target_': '<function get_optimizer at 0x7fa499799940>'}, 'net_scheduler': {'warm_up_steps': ['0'], 'cycle_lengths': ['10000000000'], 'f_start': ['1e-06'], 'f_max': ['1.0'], 'f_min': ['1.0'], '_target_': "<class 'fastgen.utils.lr_scheduler.LambdaLinearScheduler'>"}, 'sample_t_cfg': {'time_dist_type': 'shifted', 'train_p_mean': '-1.1', 'train_p_std': '2.0', 'shift': '5.0', 'min_t': '0.001', 'max_t': '0.999', 't_list': ['0.999', '0.769', '0.0'], 'log_t_df': '0.01'}, 'input_shape': ['16', '21', '64', '64'], 'device': 'cuda', 'grad_scaler_enabled': 'False', 'grad_scaler_init_scale': '65536.0', 'grad_scaler_growth_interval': '2000', 'pretrained_model_path': '', 'pretrained_student_net_path': '', 'load_student_weights': 'True', 'enable_preprocessors': 'True', 'use_ema': 'False', 'student_sample_steps': '2', 'student_sample_type': 'sde', 'fsdp_meta_init': 'False', 'add_teacher_to_fsdp_dict': 'True', 'ddp_find_unused_parameters': 'True', 'precision': 'bfloat16', 'precision_amp': None, 'precision_amp_infer': None, 'precision_amp_enc': None, 'precision_fsdp': 'float32', 'context_noise': '0.0', 'vae_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/Wan2.1_VAE.pth'}, 'model_class': {'config': None, '_target_': "<class 'fastgen.methods.omniavatar_diffusion_forcing.OmniAvatarDiffusionForcingModel'>"}, '_wandb': {}}
9
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:init():892] starting backend
10
+ 2026-04-30 23:05:47,705 INFO MainThread:2767876 [wandb_init.py:init():895] sending inform_init request
11
+ 2026-04-30 23:05:47,714 INFO MainThread:2767876 [wandb_init.py:init():903] backend started and connected
12
+ 2026-04-30 23:05:47,716 INFO MainThread:2767876 [wandb_init.py:init():973] updated telemetry
13
+ 2026-04-30 23:05:47,743 INFO MainThread:2767876 [wandb_init.py:init():997] communicating run to backend with 90.0 second timeout
14
+ 2026-04-30 23:05:48,972 INFO MainThread:2767876 [wandb_init.py:init():1042] starting run threads in backend
15
+ 2026-04-30 23:05:49,282 INFO MainThread:2767876 [wandb_run.py:_console_start():2524] atexit reg
16
+ 2026-04-30 23:05:49,283 INFO MainThread:2767876 [wandb_run.py:_redirect():2373] redirect: wrap_raw
17
+ 2026-04-30 23:05:49,283 INFO MainThread:2767876 [wandb_run.py:_redirect():2442] Wrapping output streams.
18
+ 2026-04-30 23:05:49,283 INFO MainThread:2767876 [wandb_run.py:_redirect():2465] Redirects installed.
19
+ 2026-04-30 23:05:49,286 INFO MainThread:2767876 [wandb_init.py:init():1082] run started, returning control to user process
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/config.yaml ADDED
@@ -0,0 +1,318 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.25.1
4
+ e:
5
+ 7agpz9rvil27ulbaooy9tu3j71z6whib:
6
+ args:
7
+ - --config=fastgen/configs/experiments/OmniAvatar/config_df_shift_5_lora_t769.py
8
+ - '-'
9
+ - dataloader_train.batch_size=8
10
+ - trainer.ddp=True
11
+ - trainer.max_iter=5000
12
+ - trainer.save_ckpt_iter=500
13
+ - trainer.resume=False
14
+ - log_config.group=omniavatar_df_audiofix
15
+ - log_config.name=df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter
16
+ - log_config.project=OmniAvatar-FastGen
17
+ - log_config.wandb_entity=paulhcho
18
+ codePath: train.py
19
+ codePathLocal: train.py
20
+ cpu_count: 64
21
+ cpu_count_logical: 128
22
+ cudaVersion: "12.9"
23
+ disk:
24
+ /:
25
+ total: "1599530123264"
26
+ used: "753074597888"
27
+ email: paul.hyunbin@gmail.com
28
+ executable: /usr/bin/python
29
+ git:
30
+ commit: f5897815a4bdcc8f11212b24f367a6839a5409ca
31
+ remote: https://github.com/paulcho98/FastGen.git
32
+ gpu: NVIDIA A100-SXM4-80GB
33
+ gpu_count: 8
34
+ gpu_nvidia:
35
+ - architecture: Ampere
36
+ cudaCores: 6912
37
+ memoryTotal: "85899345920"
38
+ name: NVIDIA A100-SXM4-80GB
39
+ uuid: GPU-c1619da3-e2c1-15b0-cb55-50e24b1f8e99
40
+ - architecture: Ampere
41
+ cudaCores: 6912
42
+ memoryTotal: "85899345920"
43
+ name: NVIDIA A100-SXM4-80GB
44
+ uuid: GPU-29f274f2-7065-4653-dcd1-055518ba099c
45
+ - architecture: Ampere
46
+ cudaCores: 6912
47
+ memoryTotal: "85899345920"
48
+ name: NVIDIA A100-SXM4-80GB
49
+ uuid: GPU-47a2dd51-a5dc-1d24-4713-ea97b7049d18
50
+ - architecture: Ampere
51
+ cudaCores: 6912
52
+ memoryTotal: "85899345920"
53
+ name: NVIDIA A100-SXM4-80GB
54
+ uuid: GPU-ad40d9cb-0070-8a6c-f0a3-d8d40d8233a7
55
+ - architecture: Ampere
56
+ cudaCores: 6912
57
+ memoryTotal: "85899345920"
58
+ name: NVIDIA A100-SXM4-80GB
59
+ uuid: GPU-97413b12-6c45-b8cd-a06a-886dd3bc94d6
60
+ - architecture: Ampere
61
+ cudaCores: 6912
62
+ memoryTotal: "85899345920"
63
+ name: NVIDIA A100-SXM4-80GB
64
+ uuid: GPU-060cf5c3-ba18-6ff1-9d4d-9e9c71bf6c67
65
+ - architecture: Ampere
66
+ cudaCores: 6912
67
+ memoryTotal: "85899345920"
68
+ name: NVIDIA A100-SXM4-80GB
69
+ uuid: GPU-6562d339-d2bb-95e2-3881-199a64c50ba7
70
+ - architecture: Ampere
71
+ cudaCores: 6912
72
+ memoryTotal: "85899345920"
73
+ name: NVIDIA A100-SXM4-80GB
74
+ uuid: GPU-a6834410-f241-7270-f5e3-129ecdc2e8f3
75
+ host: instance-35250
76
+ memory:
77
+ total: "1081693446144"
78
+ os: Linux-5.15.0-142-generic-x86_64-with-glibc2.39
79
+ program: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/train.py
80
+ python: CPython 3.12.3
81
+ root: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter
82
+ startedAt: "2026-04-30T13:59:26.861268Z"
83
+ writerId: 7agpz9rvil27ulbaooy9tu3j71z6whib
84
+ m: []
85
+ python_version: 3.12.3
86
+ t:
87
+ "1":
88
+ - 1
89
+ - 5
90
+ - 11
91
+ - 41
92
+ - 49
93
+ - 50
94
+ - 53
95
+ - 63
96
+ - 71
97
+ - 83
98
+ - 98
99
+ "2":
100
+ - 1
101
+ - 5
102
+ - 11
103
+ - 41
104
+ - 49
105
+ - 50
106
+ - 53
107
+ - 63
108
+ - 71
109
+ - 83
110
+ - 98
111
+ "3":
112
+ - 13
113
+ - 14
114
+ - 16
115
+ "4": 3.12.3
116
+ "5": 0.25.1
117
+ "6": 5.3.0
118
+ "12": 0.25.1
119
+ "13": linux-x86_64
120
+ dataloader_train:
121
+ value:
122
+ _target_: <class 'fastgen.datasets.omniavatar_dataloader.OmniAvatarDataLoader'>
123
+ batch_size: "8"
124
+ data_list_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_path.txt
125
+ latentsync_mask_path: /home/work/.local/Self-Forcing_LipSync_StableAvatar/diffsynth/utils/mask.png
126
+ load_ode_path: "False"
127
+ neg_text_emb_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt
128
+ num_workers: "4"
129
+ use_ref_sequence: "True"
130
+ dataloader_val:
131
+ value:
132
+ _target_: <function create_omniavatar_dataloader at 0x7f7b29e018a0>
133
+ batch_size: "1"
134
+ data_list_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_val10.txt
135
+ latentsync_mask_path: /home/work/.local/Self-Forcing_LipSync_StableAvatar/diffsynth/utils/mask.png
136
+ load_ode_path: "False"
137
+ neg_text_emb_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt
138
+ num_workers: "2"
139
+ use_ref_sequence: "True"
140
+ eval:
141
+ value:
142
+ max_ckpt: "100000000"
143
+ min_ckpt: "0"
144
+ num_samples: "50000"
145
+ samples_dir: samples
146
+ save_images: "False"
147
+ log_config:
148
+ value:
149
+ group: omniavatar_df_audiofix
150
+ name: df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter
151
+ project: OmniAvatar-FastGen
152
+ wandb_credential: ./credentials/wandb_api.txt
153
+ wandb_entity: paulhcho
154
+ wandb_mode: online
155
+ model:
156
+ value:
157
+ add_teacher_to_fsdp_dict: "True"
158
+ context_noise: "0.0"
159
+ ddp_find_unused_parameters: "True"
160
+ device: cuda
161
+ enable_preprocessors: "True"
162
+ fake_score_net: null
163
+ fsdp_meta_init: "False"
164
+ grad_scaler_enabled: "False"
165
+ grad_scaler_growth_interval: "2000"
166
+ grad_scaler_init_scale: "65536.0"
167
+ guidance_scale: null
168
+ input_shape:
169
+ - "16"
170
+ - "21"
171
+ - "64"
172
+ - "64"
173
+ load_student_weights: "True"
174
+ net:
175
+ _target_: <class 'fastgen.networks.OmniAvatar.network_causal.CausalOmniAvatarWan'>
176
+ audio_hidden_size: "32"
177
+ base_model_paths: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/diffusion_pytorch_model.safetensors
178
+ chunk_size: "3"
179
+ in_dim: "65"
180
+ lora_alpha: "64"
181
+ lora_rank: "128"
182
+ merge_lora: "False"
183
+ mode: v2v
184
+ model_size: 1.3B
185
+ net_pred_type: flow
186
+ omniavatar_ckpt_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data_checkpoints/1.3B-step-1000.pt
187
+ schedule_type: rf
188
+ stochastic_attn_configs:
189
+ - local_attn_size: "7"
190
+ sink_size: "1"
191
+ weight: "0.2"
192
+ - local_attn_size: "10"
193
+ sink_size: "1"
194
+ weight: "0.2"
195
+ - local_attn_size: "13"
196
+ sink_size: "1"
197
+ weight: "0.2"
198
+ - local_attn_size: "9"
199
+ sink_size: "3"
200
+ weight: "0.2"
201
+ - local_attn_size: "12"
202
+ sink_size: "3"
203
+ weight: "0.2"
204
+ total_num_frames: "21"
205
+ unfreeze_modules:
206
+ - _core.audio_proj
207
+ - _core.audio_cond_projs
208
+ - _core.patch_embedding
209
+ use_audio: "True"
210
+ use_dynamic_rope: "False"
211
+ net_optimizer:
212
+ _target_: <function get_optimizer at 0x7f7b2c301940>
213
+ betas:
214
+ - "0.9"
215
+ - "0.999"
216
+ eps: "1e-08"
217
+ fused: "False"
218
+ lr: "1e-05"
219
+ model: null
220
+ optim_type: adamw
221
+ weight_decay: "0.01"
222
+ net_scheduler:
223
+ _target_: <class 'fastgen.utils.lr_scheduler.LambdaLinearScheduler'>
224
+ cycle_lengths:
225
+ - "10000000000"
226
+ f_max:
227
+ - "1.0"
228
+ f_min:
229
+ - "1.0"
230
+ f_start:
231
+ - "1e-06"
232
+ warm_up_steps:
233
+ - "0"
234
+ precision: bfloat16
235
+ precision_amp: null
236
+ precision_amp_enc: null
237
+ precision_amp_infer: null
238
+ precision_fsdp: float32
239
+ pretrained_model_path: ""
240
+ pretrained_student_net_path: ""
241
+ sample_t_cfg:
242
+ log_t_df: "0.01"
243
+ max_t: "0.999"
244
+ min_t: "0.001"
245
+ shift: "5.0"
246
+ t_list:
247
+ - "0.999"
248
+ - "0.769"
249
+ - "0.0"
250
+ time_dist_type: shifted
251
+ train_p_mean: "-1.1"
252
+ train_p_std: "2.0"
253
+ skip_layers: null
254
+ student_sample_steps: "2"
255
+ student_sample_type: sde
256
+ teacher: null
257
+ timestep_cfg:
258
+ enabled: "False"
259
+ t_hi: "1.0"
260
+ t_lo: "0.0"
261
+ use_ema: "False"
262
+ vae_path: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/Wan2.1_VAE.pth
263
+ model_class:
264
+ value:
265
+ _target_: <class 'fastgen.methods.omniavatar_diffusion_forcing.OmniAvatarDiffusionForcingModel'>
266
+ config: null
267
+ trainer:
268
+ value:
269
+ augment_pipe: null
270
+ batch_size_global: null
271
+ callbacks:
272
+ gpu_stats:
273
+ _target_: <class 'fastgen.callbacks.gpu_stats.GPUStatsCallback'>
274
+ every_n: "100"
275
+ grad_clip:
276
+ _target_: <class 'fastgen.callbacks.grad_clip.GradClipCallback'>
277
+ grad_norm: "10.0"
278
+ model_key: net
279
+ param_count:
280
+ _target_: <class 'fastgen.callbacks.param_count.ParamCountCallback'>
281
+ train_profiler:
282
+ _target_: <class 'fastgen.callbacks.train_profiler.TrainProfilerCallback'>
283
+ every_n: "100"
284
+ wandb:
285
+ _target_: <class 'fastgen.callbacks.wandb.WandbCallback'>
286
+ fps: "25"
287
+ sample_logging_iter: "500"
288
+ checkpointer:
289
+ pretrained_ckpt_key_map:
290
+ net: net
291
+ pretrained_ckpt_path: ""
292
+ s3_container: s3://checkpoints/fastgen
293
+ s3_credential: ./credentials/s3.json
294
+ save_dir: /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/checkpoints
295
+ use_s3: "False"
296
+ cudnn:
297
+ benchmark: "True"
298
+ deterministic: "False"
299
+ ddp: "True"
300
+ fsdp: "False"
301
+ fsdp_cpu_offload: "False"
302
+ fsdp_min_num_params: "10000000"
303
+ fsdp_sharding_group_size: null
304
+ global_vars: null
305
+ global_vars_val:
306
+ - null
307
+ grad_accum_rounds: "1"
308
+ logging_iter: "1"
309
+ max_iter: "5000"
310
+ offload_module_in_decoding: "False"
311
+ resume: "False"
312
+ save_ckpt_iter: "500"
313
+ seed: "0"
314
+ skip_initial_validation: "True"
315
+ tf32_enabled: "True"
316
+ val_seed: null
317
+ validation_iter: "500"
318
+ visualize_teacher: "False"
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/output.log ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [Apr 30, 2026 - 22:59:28 | INFO | fastgen.callbacks.wandb:init_wandb:290 ] Wandb code upload disabled (set WANDB_UPLOAD_CODE=true to enable)
2
+ [Apr 30, 2026 - 22:59:28 | SUCCESS | fastgen.trainer:__init__:53 ] Callbacks initialized successfully
3
+ [Apr 30, 2026 - 22:59:28 | INFO | fastgen.trainer:__init__:57 ] Callback synchronization complete
4
+ [Apr 30, 2026 - 22:59:28 | INFO | fastgen.trainer:__init__:60 ] Initializing checkpointer...
5
+ [Apr 30, 2026 - 22:59:28 | SUCCESS | fastgen.trainer:__init__:65 ] Checkpointer initialized successfully
6
+ [Apr 30, 2026 - 22:59:28 | SUCCESS | __main__:main:33 ] Trainer initialized successfully
7
+ [Apr 30, 2026 - 22:59:28 | INFO | fastgen.trainer:run:77 ] Starting training
8
+ [Apr 30, 2026 - 22:59:28 | INFO | fastgen.trainer:run:80 ] Initializing callbacks and model ...
9
+ [Apr 30, 2026 - 22:59:28 | INFO | fastgen.trainer:run:95 ] Starting model.on_train_begin ...
10
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.trainer:run:99 ] model.on_train_begin completed
11
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.trainer:run:106 ] Wrapping model into ddp ..
12
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.trainer:run:108 ] DDP wrapping completed
13
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.networks.OmniAvatar.network_causal:_apply_unfreeze:1231 ] [CausalOmniAvatarWan] unfreeze: re-enabled requires_grad on 1.38M params in '_core.audio_proj'
14
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.networks.OmniAvatar.network_causal:_apply_unfreeze:1231 ] [CausalOmniAvatarWan] unfreeze: re-enabled requires_grad on 0.71M params in '_core.audio_cond_projs'
15
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.networks.OmniAvatar.network_causal:_apply_unfreeze:1231 ] [CausalOmniAvatarWan] unfreeze: re-enabled requires_grad on 0.40M params in '_core.patch_embedding'
16
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.networks.OmniAvatar.network_causal:apply_lora_freeze:1193 ] [CausalOmniAvatarWan] apply_lora_freeze: LoRA 174.98M trainable, base 1421.38M frozen, then unfreeze_modules re-enabled on top
17
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.trainer:run:133 ] Auto-Resume Details: None
18
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.utils.basic_utils:set_random_seed:144 ] Using random seed 0.
19
+ [Apr 30, 2026 - 22:59:30 | INFO | fastgen.trainer:run:165 ] Instantiating dataloader...
20
+ Traceback (most recent call last):
21
+ File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/train.py", line 46, in <module>
22
+ main(config)
23
+ File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/train.py", line 37, in main
24
+ fastgen_trainer.run(model)
25
+ File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/fastgen/trainer.py", line 166, in run
26
+ dataloader_train = instantiate(self.config.dataloader_train)
27
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
28
+ File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/fastgen/utils/__init__.py", line 94, in instantiate
29
+ return cls(*args, **additional_kwargs)
30
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
31
+ File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/fastgen/datasets/omniavatar_dataloader.py", line 276, in __init__
32
+ self.dataset = OmniAvatarDataset(
33
+ ^^^^^^^^^^^^^^^^^^
34
+ File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/fastgen/datasets/omniavatar_dataloader.py", line 135, in __init__
35
+ mask_img = Image.open(latentsync_mask_path)
36
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
37
+ File "/usr/local/lib/python3.12/dist-packages/PIL/Image.py", line 3505, in open
38
+ fp = builtins.open(filename, "rb")
39
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
40
+ FileNotFoundError: [Errno 2] No such file or directory: '/home/work/.local/Self-Forcing_LipSync_StableAvatar/diffsynth/utils/mask.png'
41
+ [rank0]: Traceback (most recent call last):
42
+ [rank0]: File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/train.py", line 46, in <module>
43
+ [rank0]: main(config)
44
+ [rank0]: File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/train.py", line 37, in main
45
+ [rank0]: fastgen_trainer.run(model)
46
+ [rank0]: File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/fastgen/trainer.py", line 166, in run
47
+ [rank0]: dataloader_train = instantiate(self.config.dataloader_train)
48
+ [rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
49
+ [rank0]: File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/fastgen/utils/__init__.py", line 94, in instantiate
50
+ [rank0]: return cls(*args, **additional_kwargs)
51
+ [rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
52
+ [rank0]: File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/fastgen/datasets/omniavatar_dataloader.py", line 276, in __init__
53
+ [rank0]: self.dataset = OmniAvatarDataset(
54
+ [rank0]: ^^^^^^^^^^^^^^^^^^
55
+ [rank0]: File "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/fastgen/datasets/omniavatar_dataloader.py", line 135, in __init__
56
+ [rank0]: mask_img = Image.open(latentsync_mask_path)
57
+ [rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
58
+ [rank0]: File "/usr/local/lib/python3.12/dist-packages/PIL/Image.py", line 3505, in open
59
+ [rank0]: fp = builtins.open(filename, "rb")
60
+ [rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
61
+ [rank0]: FileNotFoundError: [Errno 2] No such file or directory: '/home/work/.local/Self-Forcing_LipSync_StableAvatar/diffsynth/utils/mask.png'
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/requirements.txt ADDED
@@ -0,0 +1,417 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ DistVAE==0.0.0b5
2
+ PySocks==1.7.1
3
+ absl-py==2.4.0
4
+ accelerate==1.13.0
5
+ albucore==0.0.24
6
+ albumentations==2.0.8
7
+ antlr4-python3-runtime==4.9.3
8
+ av==17.0.0
9
+ blessed==1.33.0
10
+ boto3==1.42.74
11
+ botocore==1.42.74
12
+ braceexpand==0.1.7
13
+ cuda-bindings==13.2.0
14
+ cuda-pathfinder==1.4.4
15
+ cuda-toolkit==13.0.2
16
+ decord==0.6.0
17
+ diffusers==0.37.0
18
+ dlib==20.0.0
19
+ easydict==1.13
20
+ flatbuffers==25.12.19
21
+ ftfy==6.3.1
22
+ gdown==5.2.1
23
+ gitdb==4.0.12
24
+ GitPython==3.1.46
25
+ gpustat==1.1.1
26
+ hf-xet==1.4.2
27
+ huggingface_hub==1.7.2
28
+ hydra-core==1.3.2
29
+ ImageIO==2.37.3
30
+ imageio-ffmpeg==0.6.0
31
+ insightface==0.7.3
32
+ jmespath==1.1.0
33
+ kornia==0.8.2
34
+ kornia_rs==0.1.10
35
+ lmdb==2.2.0
36
+ loguru==0.7.3
37
+ mediapipe==0.10.18
38
+ moviepy==2.2.1
39
+ nvidia-cublas==13.1.0.3
40
+ nvidia-cuda-cupti==13.0.85
41
+ nvidia-cuda-nvrtc==13.0.88
42
+ nvidia-cuda-runtime==13.0.96
43
+ nvidia-cudnn-cu13==9.19.0.56
44
+ nvidia-cufft==12.0.0.61
45
+ nvidia-cufile==1.15.1.6
46
+ nvidia-curand==10.4.0.35
47
+ nvidia-cusolver==12.0.4.66
48
+ nvidia-cusparse==12.6.3.3
49
+ nvidia-cusparselt-cu13==0.8.0
50
+ nvidia-nccl-cu13==2.28.9
51
+ nvidia-nvjitlink==13.0.88
52
+ nvidia-nvshmem-cu13==3.4.5
53
+ nvidia-nvtx==13.0.85
54
+ nvitop==1.6.2
55
+ omegaconf==2.3.0
56
+ onnxruntime==1.24.4
57
+ onnxruntime-gpu==1.24.4
58
+ open_clip_torch==3.3.0
59
+ opencv-python-headless==4.11.0.86
60
+ optimum-quanto==0.2.7
61
+ peft==0.18.1
62
+ prettytable==3.17.0
63
+ proglog==0.1.12
64
+ pyloudnorm==0.2.0
65
+ python-dotenv==1.2.2
66
+ python_speech_features==0.6
67
+ pytorch-fid==0.3.0
68
+ s3transfer==0.16.0
69
+ scenedetect==0.6.7.1
70
+ scikit-image==0.26.0
71
+ sentencepiece==0.2.1
72
+ sentry-sdk==2.55.0
73
+ simsimd==6.5.16
74
+ smmap==5.0.3
75
+ sounddevice==0.5.5
76
+ stringzilla==4.6.0
77
+ tifffile==2026.3.3
78
+ timm==1.0.26
79
+ tokenizers==0.22.2
80
+ transformers==5.3.0
81
+ triton==3.2.0
82
+ wandb==0.25.1
83
+ wcwidth==0.6.0
84
+ webdataset==1.0.2
85
+ xfuser==0.4.5
86
+ yunchang==0.6.4
87
+ jupyterlab==4.5.0a1
88
+ nvdlfw_inspect==0.1.0
89
+ transformer_engine==2.3.0+5de3e14
90
+ einops==0.8.1
91
+ flash_attn==2.7.3
92
+ torch_tensorrt==2.8.0a0
93
+ apex==0.1
94
+ nvidia-modelopt==0.27.1
95
+ nvidia-modelopt-core==0.27.1
96
+ nvidia-resiliency-ext==0.3.0
97
+ polygraphy==0.49.20
98
+ PuLP==3.1.1
99
+ safetensors==0.5.3
100
+ torchprofile==0.0.4
101
+ tensorrt==10.10.0.31
102
+ Cython==3.0.12
103
+ aiohappyeyeballs==2.6.1
104
+ aiohttp==3.11.16
105
+ aiosignal==1.3.2
106
+ asciitree==0.3.3
107
+ cachetools==5.5.2
108
+ charset-normalizer==3.4.1
109
+ cloudpickle==3.1.1
110
+ cuda-bindings==12.8.0
111
+ cuda-python==12.8.0
112
+ cudf==25.4.0
113
+ cudf-polars==25.4.0
114
+ cugraph==25.4.0
115
+ cugraph-service-client==25.4.0
116
+ cugraph-service-server==25.4.0
117
+ cuml==25.4.0
118
+ cupy-cuda12x==13.3.0
119
+ cuvs==25.4.0
120
+ dask==2025.2.0
121
+ dask-cuda==25.4.0
122
+ dask-cudf==25.4.0
123
+ distributed==2025.2.0
124
+ distributed-ucxx==0.43.0
125
+ fasteners==0.19
126
+ fastrlock==0.8.3
127
+ frozenlist==1.5.0
128
+ fsspec==2025.3.2
129
+ grpcio==1.62.1
130
+ joblib==1.4.2
131
+ kvikio==25.4.0
132
+ libcudf==25.4.0
133
+ libcugraph==25.4.0
134
+ libcuml==25.4.0
135
+ libcuvs==25.4.0
136
+ libkvikio==25.4.0
137
+ libraft==25.4.0
138
+ librmm==25.4.0
139
+ librmm-cu12==25.4.0
140
+ libucxx==0.43.0
141
+ llvmlite==0.42.0
142
+ locket==1.0.0
143
+ multidict==6.4.3
144
+ numba==0.59.1
145
+ numba-cuda==0.4.0
146
+ numcodecs==0.13.1
147
+ nvidia-ml-py==12.570.86
148
+ nvtx==0.2.11
149
+ nx-cugraph==25.4.0
150
+ packaging==23.2
151
+ pandas==2.2.3
152
+ partd==1.4.2
153
+ ply==3.11
154
+ polars==1.25.2
155
+ propcache==0.3.1
156
+ pyarrow==19.0.1
157
+ pylibcudf==25.4.0
158
+ pylibcugraph==25.4.0
159
+ pylibraft==25.4.0
160
+ pylibwholegraph==25.4.0
161
+ pynvjitlink==0.3.0
162
+ pynvml==12.0.0
163
+ pytz==2023.4
164
+ raft-dask==25.4.0
165
+ rapids-dask-dependency==25.4.0a0
166
+ rapids-logger==0.1.11
167
+ rmm==25.4.0
168
+ scipy==1.15.2
169
+ tblib==3.1.0
170
+ thriftpy2==0.5.2
171
+ toolz==1.0.0
172
+ treelite==4.4.1
173
+ tzdata==2025.2
174
+ ucx-py==0.43.0
175
+ ucxx==0.43.0
176
+ urllib3==2.0.7
177
+ xgboost==2.1.3
178
+ yarl==1.19.0
179
+ zarr==2.18.7
180
+ zict==3.0.0
181
+ tabulate==0.9.0
182
+ nvidia-cudnn-frontend==1.11.0
183
+ onnx==1.17.0
184
+ pybind11_global==2.13.6
185
+ contourpy==1.3.2
186
+ cycler==0.12.1
187
+ fonttools==4.58.0
188
+ kiwisolver==1.4.8
189
+ matplotlib==3.10.3
190
+ pycocotools==2.0+nv0.8.1
191
+ pyparsing==3.2.3
192
+ dm-tree==0.1.9
193
+ gast==0.6.0
194
+ nvidia-dali-cuda120==1.49.0
195
+ nvidia-nvcomp-cu12==4.2.0.14
196
+ nvidia-nvimgcodec-cu12==0.5.0.13
197
+ nvidia-nvjpeg2k-cu12==0.8.1.40
198
+ nvidia-nvjpeg-cu12==12.4.0.16
199
+ nvidia-nvtiff-cu12==0.5.0.67
200
+ pytorch-triton==3.3.0+git96316ce52.nvinternal
201
+ lintrunner==0.12.7
202
+ ninja==1.11.1.4
203
+ optree==0.15.0
204
+ setuptools==78.1.1
205
+ types-dataclasses==0.6.6
206
+ filelock==3.18.0
207
+ mpmath==1.3.0
208
+ networkx==3.4.2
209
+ pillow==11.2.1
210
+ sympy==1.14.0
211
+ torch==2.8.0a0+5228986c39.nv25.5
212
+ torchvision==0.22.0a0
213
+ opencv==4.10.0
214
+ black==25.1.0
215
+ isort==6.0.1
216
+ jupyterlab_tensorboard_pro==4.0.0
217
+ jupytext==1.17.1
218
+ mdit-py-plugins==0.4.2
219
+ mypy_extensions==1.1.0
220
+ pathspec==0.12.1
221
+ Send2Trash==1.8.3
222
+ absl-py==2.2.2
223
+ anyio==4.9.0
224
+ argon2-cffi==23.1.0
225
+ argon2-cffi-bindings==21.2.0
226
+ arrow==1.3.0
227
+ asttokens==3.0.0
228
+ async-lru==2.0.5
229
+ babel==2.17.0
230
+ beautifulsoup4==4.13.4
231
+ bleach==6.2.0
232
+ comm==0.2.2
233
+ debugpy==1.8.14
234
+ defusedxml==0.7.1
235
+ executing==2.2.0
236
+ fastjsonschema==2.21.1
237
+ fqdn==1.5.1
238
+ h11==0.16.0
239
+ httpcore==1.0.9
240
+ httpx==0.28.1
241
+ ipykernel==6.29.5
242
+ ipython==9.2.0
243
+ ipython_pygments_lexers==1.1.1
244
+ isoduration==20.11.0
245
+ jedi==0.19.2
246
+ json5==0.12.0
247
+ jsonpointer==3.0.0
248
+ jsonschema==4.23.0
249
+ jsonschema-specifications==2025.4.1
250
+ jupyter_client==8.6.3
251
+ jupyter_core==5.7.2
252
+ jupyter-events==0.12.0
253
+ jupyter-lsp==2.2.5
254
+ jupyter_server==2.16.0
255
+ jupyter_server_terminals==0.5.3
256
+ jupyterlab_code_formatter==3.0.2
257
+ jupyterlab_pygments==0.3.0
258
+ jupyterlab_server==2.27.3
259
+ Markdown==3.8
260
+ matplotlib-inline==0.1.7
261
+ mistune==3.1.3
262
+ nbclient==0.10.2
263
+ nbconvert==7.16.6
264
+ nbformat==5.10.4
265
+ nest-asyncio==1.6.0
266
+ notebook==7.4.2
267
+ notebook_shim==0.2.4
268
+ overrides==7.7.0
269
+ pandocfilters==1.5.1
270
+ parso==0.8.4
271
+ pexpect==4.9.0
272
+ prometheus_client==0.22.0
273
+ prompt_toolkit==3.0.51
274
+ psutil==7.0.0
275
+ ptyprocess==0.7.0
276
+ pure_eval==0.2.3
277
+ python-dateutil==2.9.0.post0
278
+ python-hostlist==2.2.1
279
+ python-json-logger==3.3.0
280
+ pyzmq==26.4.0
281
+ referencing==0.36.2
282
+ rfc3339-validator==0.1.4
283
+ rfc3986-validator==0.1.1
284
+ rpds-py==0.25.1
285
+ sniffio==1.3.1
286
+ soupsieve==2.7
287
+ stack-data==0.6.3
288
+ tensorboard==2.16.2
289
+ tensorboard-data-server==0.7.2
290
+ terminado==0.18.1
291
+ tinycss2==1.4.0
292
+ tornado==6.5
293
+ traitlets==5.14.3
294
+ types-python-dateutil==2.9.0.20250516
295
+ uri-template==1.3.0
296
+ wcwidth==0.2.13
297
+ webcolors==24.11.1
298
+ webencodings==0.5.1
299
+ websocket-client==1.8.0
300
+ Werkzeug==3.1.3
301
+ MarkupSafe==3.0.2
302
+ PyYAML==6.0.2
303
+ annotated-types==0.7.0
304
+ astunparse==1.6.3
305
+ attrs==25.3.0
306
+ audioread==3.0.1
307
+ blis==0.7.11
308
+ catalogue==2.0.10
309
+ certifi==2025.4.26
310
+ cffi==1.17.1
311
+ click==8.1.8
312
+ cloudpathlib==0.21.1
313
+ confection==0.1.5
314
+ cymem==2.0.11
315
+ decorator==5.2.1
316
+ execnet==2.1.1
317
+ expecttest==0.3.0
318
+ hypothesis==6.130.8
319
+ idna==3.10
320
+ iniconfig==2.1.0
321
+ intel-openmp==2021.4.0
322
+ Jinja2==3.1.6
323
+ langcodes==3.5.0
324
+ language_data==1.3.0
325
+ lazy_loader==0.4
326
+ librosa==0.11.0
327
+ marisa-trie==1.2.1
328
+ markdown-it-py==3.0.0
329
+ mdurl==0.1.2
330
+ mkl==2021.1.1
331
+ mkl-devel==2021.1.1
332
+ mkl-include==2021.1.1
333
+ mock==5.2.0
334
+ msgpack==1.1.0
335
+ murmurhash==1.0.12
336
+ numpy==1.26.4
337
+ platformdirs==4.3.8
338
+ pluggy==1.6.0
339
+ pooch==1.8.2
340
+ preshed==3.0.9
341
+ protobuf==4.24.4
342
+ pybind11==2.13.6
343
+ pycparser==2.22
344
+ pydantic==2.11.4
345
+ pydantic_core==2.33.2
346
+ Pygments==2.19.1
347
+ pytest==8.1.1
348
+ pytest-flakefinder==1.1.0
349
+ pytest-rerunfailures==15.1
350
+ pytest-shard==0.1.2
351
+ pytest-xdist==3.6.1
352
+ regex==2024.11.6
353
+ requests==2.32.3
354
+ rich==14.0.0
355
+ scikit-learn==1.6.1
356
+ shellingham==1.5.4
357
+ six==1.16.0
358
+ smart-open==7.1.0
359
+ sortedcontainers==2.4.0
360
+ soundfile==0.13.1
361
+ soxr==0.5.0.post1
362
+ spacy==3.7.5
363
+ spacy-legacy==3.0.12
364
+ spacy-loggers==1.0.5
365
+ srsly==2.5.1
366
+ tbb==2021.13.1
367
+ thinc==8.2.5
368
+ threadpoolctl==3.6.0
369
+ tqdm==4.67.1
370
+ typer==0.15.4
371
+ typing_extensions==4.13.2
372
+ typing-inspection==0.4.1
373
+ wasabi==1.1.3
374
+ weasel==0.4.1
375
+ wheel==0.45.1
376
+ wrapt==1.17.2
377
+ xdoctest==1.0.2
378
+ cmake==3.31.6
379
+ pip==25.1.1
380
+ nvfuser==0.2.27a0+9bf5aca
381
+ lightning-thunder==0.2.3.dev0
382
+ dill==0.4.0
383
+ opt_einsum==3.4.0
384
+ lightning-utilities==0.14.3
385
+ looseversion==1.3.0
386
+ autocommand==2.2.2
387
+ backports.tarfile==1.2.0
388
+ importlib_metadata==8.0.0
389
+ inflect==7.3.1
390
+ jaraco.collections==5.1.0
391
+ jaraco.context==5.3.0
392
+ jaraco.functools==4.0.1
393
+ jaraco.text==3.12.1
394
+ more-itertools==10.3.0
395
+ packaging==24.2
396
+ platformdirs==4.2.2
397
+ tomli==2.0.1
398
+ typeguard==4.3.0
399
+ typing_extensions==4.12.2
400
+ wheel==0.45.1
401
+ zipp==3.19.2
402
+ PyGObject==3.48.2
403
+ PyJWT==2.7.0
404
+ blinker==1.7.0
405
+ cryptography==41.0.7
406
+ cryptography==41.0.7
407
+ dbus-python==1.3.2
408
+ distro==1.9.0
409
+ httplib2==0.20.4
410
+ launchpadlib==1.11.0
411
+ lazr.restfulclient==0.14.6
412
+ lazr.uri==1.0.6
413
+ oauthlib==3.2.2
414
+ pyparsing==3.1.1
415
+ six==1.16.0
416
+ ssh-import-id==5.11
417
+ wadllib==1.3.6
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/wandb-metadata.json ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-142-generic-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.12.3",
4
+ "startedAt": "2026-04-30T13:59:26.861268Z",
5
+ "args": [
6
+ "--config=fastgen/configs/experiments/OmniAvatar/config_df_shift_5_lora_t769.py",
7
+ "-",
8
+ "dataloader_train.batch_size=8",
9
+ "trainer.ddp=True",
10
+ "trainer.max_iter=5000",
11
+ "trainer.save_ckpt_iter=500",
12
+ "trainer.resume=False",
13
+ "log_config.group=omniavatar_df_audiofix",
14
+ "log_config.name=df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter",
15
+ "log_config.project=OmniAvatar-FastGen",
16
+ "log_config.wandb_entity=paulhcho"
17
+ ],
18
+ "program": "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/train.py",
19
+ "codePath": "train.py",
20
+ "codePathLocal": "train.py",
21
+ "git": {
22
+ "remote": "https://github.com/paulcho98/FastGen.git",
23
+ "commit": "f5897815a4bdcc8f11212b24f367a6839a5409ca"
24
+ },
25
+ "email": "paul.hyunbin@gmail.com",
26
+ "root": "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter",
27
+ "host": "instance-35250",
28
+ "executable": "/usr/bin/python",
29
+ "cpu_count": 64,
30
+ "cpu_count_logical": 128,
31
+ "gpu": "NVIDIA A100-SXM4-80GB",
32
+ "gpu_count": 8,
33
+ "disk": {
34
+ "/": {
35
+ "total": "1599530123264",
36
+ "used": "753074597888"
37
+ }
38
+ },
39
+ "memory": {
40
+ "total": "1081693446144"
41
+ },
42
+ "gpu_nvidia": [
43
+ {
44
+ "name": "NVIDIA A100-SXM4-80GB",
45
+ "memoryTotal": "85899345920",
46
+ "cudaCores": 6912,
47
+ "architecture": "Ampere",
48
+ "uuid": "GPU-c1619da3-e2c1-15b0-cb55-50e24b1f8e99"
49
+ },
50
+ {
51
+ "name": "NVIDIA A100-SXM4-80GB",
52
+ "memoryTotal": "85899345920",
53
+ "cudaCores": 6912,
54
+ "architecture": "Ampere",
55
+ "uuid": "GPU-29f274f2-7065-4653-dcd1-055518ba099c"
56
+ },
57
+ {
58
+ "name": "NVIDIA A100-SXM4-80GB",
59
+ "memoryTotal": "85899345920",
60
+ "cudaCores": 6912,
61
+ "architecture": "Ampere",
62
+ "uuid": "GPU-47a2dd51-a5dc-1d24-4713-ea97b7049d18"
63
+ },
64
+ {
65
+ "name": "NVIDIA A100-SXM4-80GB",
66
+ "memoryTotal": "85899345920",
67
+ "cudaCores": 6912,
68
+ "architecture": "Ampere",
69
+ "uuid": "GPU-ad40d9cb-0070-8a6c-f0a3-d8d40d8233a7"
70
+ },
71
+ {
72
+ "name": "NVIDIA A100-SXM4-80GB",
73
+ "memoryTotal": "85899345920",
74
+ "cudaCores": 6912,
75
+ "architecture": "Ampere",
76
+ "uuid": "GPU-97413b12-6c45-b8cd-a06a-886dd3bc94d6"
77
+ },
78
+ {
79
+ "name": "NVIDIA A100-SXM4-80GB",
80
+ "memoryTotal": "85899345920",
81
+ "cudaCores": 6912,
82
+ "architecture": "Ampere",
83
+ "uuid": "GPU-060cf5c3-ba18-6ff1-9d4d-9e9c71bf6c67"
84
+ },
85
+ {
86
+ "name": "NVIDIA A100-SXM4-80GB",
87
+ "memoryTotal": "85899345920",
88
+ "cudaCores": 6912,
89
+ "architecture": "Ampere",
90
+ "uuid": "GPU-6562d339-d2bb-95e2-3881-199a64c50ba7"
91
+ },
92
+ {
93
+ "name": "NVIDIA A100-SXM4-80GB",
94
+ "memoryTotal": "85899345920",
95
+ "cudaCores": 6912,
96
+ "architecture": "Ampere",
97
+ "uuid": "GPU-a6834410-f241-7270-f5e3-129ecdc2e8f3"
98
+ }
99
+ ],
100
+ "cudaVersion": "12.9",
101
+ "writerId": "7agpz9rvil27ulbaooy9tu3j71z6whib"
102
+ }
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_wandb":{"runtime":59},"_runtime":59}
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/logs/debug-internal.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-30T22:59:27.121240873+09:00","level":"INFO","msg":"wandb-core"}
2
+ {"time":"2026-04-30T22:59:27.127725168+09:00","level":"INFO","msg":"stream: starting","core version":"0.25.1"}
3
+ {"time":"2026-04-30T22:59:27.628090861+09:00","level":"INFO","msg":"stream: created new stream","id":"w9xbjand"}
4
+ {"time":"2026-04-30T22:59:27.628168306+09:00","level":"INFO","msg":"handler: started"}
5
+ {"time":"2026-04-30T22:59:27.629745961+09:00","level":"INFO","msg":"stream: started"}
6
+ {"time":"2026-04-30T22:59:27.629773572+09:00","level":"INFO","msg":"sender: started"}
7
+ {"time":"2026-04-30T22:59:27.629761079+09:00","level":"INFO","msg":"writer: started","stream_id":"w9xbjand"}
8
+ {"time":"2026-04-30T22:59:28.861499272+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"console_offset":0,"console_lines":1}
9
+ {"time":"2026-04-30T22:59:29.336054055+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
10
+ {"time":"2026-04-30T22:59:43.861655852+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":0,"events_lines":2,"console_offset":0,"console_lines":19,"uploaded_len":2}
11
+ {"time":"2026-04-30T22:59:44.215635379+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
12
+ {"time":"2026-04-30T22:59:58.861320253+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":2,"events_lines":2}
13
+ {"time":"2026-04-30T22:59:59.140835619+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
14
+ {"time":"2026-04-30T23:00:13.861239149+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":4,"events_lines":2}
15
+ {"time":"2026-04-30T23:00:14.149003233+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
16
+ {"time":"2026-04-30T23:00:28.273108243+09:00","level":"INFO","msg":"stream: closing"}
17
+ {"time":"2026-04-30T23:00:28.8610536+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"console_offset":19,"console_lines":42,"uploaded_len":2}
18
+ {"time":"2026-04-30T23:00:28.8835215+09:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
19
+ {"time":"2026-04-30T23:00:29.203002489+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
20
+ {"time":"2026-04-30T23:00:29.203184098+09:00","level":"INFO","msg":"filestream: sending request","total_files":0,"uploaded_len":1,"complete":true,"exit_code":1}
21
+ {"time":"2026-04-30T23:00:29.48012593+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
22
+ {"time":"2026-04-30T23:00:29.480401805+09:00","level":"INFO","msg":"handler: closed"}
23
+ {"time":"2026-04-30T23:00:29.482558051+09:00","level":"INFO","msg":"sender: closed"}
24
+ {"time":"2026-04-30T23:00:29.482571335+09:00","level":"INFO","msg":"stream: closed"}
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/logs/debug.log ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-04-30 22:59:26,882 INFO MainThread:2764132 [wandb_setup.py:_flush():81] Current SDK version is 0.25.1
2
+ 2026-04-30 22:59:26,882 INFO MainThread:2764132 [wandb_setup.py:_flush():81] Configure stats pid to 2764132
3
+ 2026-04-30 22:59:26,882 INFO MainThread:2764132 [wandb_setup.py:_flush():81] Loading settings from environment variables
4
+ 2026-04-30 22:59:26,882 INFO MainThread:2764132 [wandb_init.py:setup_run_log_directory():717] Logging user logs to /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/logs/debug.log
5
+ 2026-04-30 22:59:26,882 INFO MainThread:2764132 [wandb_init.py:setup_run_log_directory():718] Logging internal logs to /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/logs/debug-internal.log
6
+ 2026-04-30 22:59:26,882 INFO MainThread:2764132 [wandb_init.py:init():844] calling init triggers
7
+ 2026-04-30 22:59:26,882 INFO MainThread:2764132 [wandb_init.py:init():849] wandb.init called with sweep_config: {}
8
+ config: {'log_config': {'project': 'OmniAvatar-FastGen', 'group': 'omniavatar_df_audiofix', 'name': 'df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter', 'wandb_mode': 'online', 'wandb_entity': 'paulhcho', 'wandb_credential': './credentials/wandb_api.txt'}, 'trainer': {'cudnn': {'deterministic': 'False', 'benchmark': 'True'}, 'checkpointer': {'save_dir': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/checkpoints', 'use_s3': 'False', 's3_container': 's3://checkpoints/fastgen', 's3_credential': './credentials/s3.json', 'pretrained_ckpt_path': '', 'pretrained_ckpt_key_map': {'net': 'net'}}, 'callbacks': {'grad_clip': {'grad_norm': '10.0', 'model_key': 'net', '_target_': "<class 'fastgen.callbacks.grad_clip.GradClipCallback'>"}, 'gpu_stats': {'every_n': '100', '_target_': "<class 'fastgen.callbacks.gpu_stats.GPUStatsCallback'>"}, 'train_profiler': {'every_n': '100', '_target_': "<class 'fastgen.callbacks.train_profiler.TrainProfilerCallback'>"}, 'param_count': {'_target_': "<class 'fastgen.callbacks.param_count.ParamCountCallback'>"}, 'wandb': {'sample_logging_iter': '500', 'fps': '25', '_target_': "<class 'fastgen.callbacks.wandb.WandbCallback'>"}}, 'save_ckpt_iter': '500', 'validation_iter': '500', 'skip_initial_validation': 'True', 'logging_iter': '1', 'max_iter': '5000', 'visualize_teacher': 'False', 'seed': '0', 'val_seed': None, 'resume': 'False', 'ddp': 'True', 'fsdp': 'False', 'tf32_enabled': 'True', 'grad_accum_rounds': '1', 'batch_size_global': None, 'offload_module_in_decoding': 'False', 'fsdp_cpu_offload': 'False', 'fsdp_min_num_params': '10000000', 'fsdp_sharding_group_size': None, 'global_vars': None, 'global_vars_val': [None], 'augment_pipe': None}, 'dataloader_train': {'data_list_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_path.txt', 'latentsync_mask_path': '/home/work/.local/Self-Forcing_LipSync_StableAvatar/diffsynth/utils/mask.png', 'batch_size': '8', 'num_workers': '4', 'neg_text_emb_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt', 'use_ref_sequence': 'True', 'load_ode_path': 'False', '_target_': "<class 'fastgen.datasets.omniavatar_dataloader.OmniAvatarDataLoader'>"}, 'dataloader_val': {'data_list_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_val10.txt', 'latentsync_mask_path': '/home/work/.local/Self-Forcing_LipSync_StableAvatar/diffsynth/utils/mask.png', 'batch_size': '1', 'num_workers': '2', 'neg_text_emb_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt', 'use_ref_sequence': 'True', 'load_ode_path': 'False', '_target_': '<function create_omniavatar_dataloader at 0x7f7b29e018a0>'}, 'eval': {'num_samples': '50000', 'save_images': 'False', 'min_ckpt': '0', 'max_ckpt': '100000000', 'samples_dir': 'samples'}, 'model': {'net': {'model_size': '1.3B', 'in_dim': '65', 'mode': 'v2v', 'use_audio': 'True', 'audio_hidden_size': '32', 'chunk_size': '3', 'total_num_frames': '21', 'base_model_paths': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/diffusion_pytorch_model.safetensors', 'omniavatar_ckpt_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data_checkpoints/1.3B-step-1000.pt', 'net_pred_type': 'flow', 'schedule_type': 'rf', 'use_dynamic_rope': 'False', 'stochastic_attn_configs': [{'local_attn_size': '7', 'sink_size': '1', 'weight': '0.2'}, {'local_attn_size': '10', 'sink_size': '1', 'weight': '0.2'}, {'local_attn_size': '13', 'sink_size': '1', 'weight': '0.2'}, {'local_attn_size': '9', 'sink_size': '3', 'weight': '0.2'}, {'local_attn_size': '12', 'sink_size': '3', 'weight': '0.2'}], '_target_': "<class 'fastgen.networks.OmniAvatar.network_causal.CausalOmniAvatarWan'>", 'merge_lora': 'False', 'unfreeze_modules': ['_core.audio_proj', '_core.audio_cond_projs', '_core.patch_embedding'], 'lora_rank': '128', 'lora_alpha': '64'}, 'teacher': None, 'fake_score_net': None, 'guidance_scale': None, 'timestep_cfg': {'enabled': 'False', 't_lo': '0.0', 't_hi': '1.0'}, 'skip_layers': None, 'net_optimizer': {'model': None, 'optim_type': 'adamw', 'lr': '1e-05', 'weight_decay': '0.01', 'betas': ['0.9', '0.999'], 'eps': '1e-08', 'fused': 'False', '_target_': '<function get_optimizer at 0x7f7b2c301940>'}, 'net_scheduler': {'warm_up_steps': ['0'], 'cycle_lengths': ['10000000000'], 'f_start': ['1e-06'], 'f_max': ['1.0'], 'f_min': ['1.0'], '_target_': "<class 'fastgen.utils.lr_scheduler.LambdaLinearScheduler'>"}, 'sample_t_cfg': {'time_dist_type': 'shifted', 'train_p_mean': '-1.1', 'train_p_std': '2.0', 'shift': '5.0', 'min_t': '0.001', 'max_t': '0.999', 't_list': ['0.999', '0.769', '0.0'], 'log_t_df': '0.01'}, 'input_shape': ['16', '21', '64', '64'], 'device': 'cuda', 'grad_scaler_enabled': 'False', 'grad_scaler_init_scale': '65536.0', 'grad_scaler_growth_interval': '2000', 'pretrained_model_path': '', 'pretrained_student_net_path': '', 'load_student_weights': 'True', 'enable_preprocessors': 'True', 'use_ema': 'False', 'student_sample_steps': '2', 'student_sample_type': 'sde', 'fsdp_meta_init': 'False', 'add_teacher_to_fsdp_dict': 'True', 'ddp_find_unused_parameters': 'True', 'precision': 'bfloat16', 'precision_amp': None, 'precision_amp_infer': None, 'precision_amp_enc': None, 'precision_fsdp': 'float32', 'context_noise': '0.0', 'vae_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/Wan2.1_VAE.pth'}, 'model_class': {'config': None, '_target_': "<class 'fastgen.methods.omniavatar_diffusion_forcing.OmniAvatarDiffusionForcingModel'>"}, '_wandb': {}}
9
+ 2026-04-30 22:59:26,882 INFO MainThread:2764132 [wandb_init.py:init():892] starting backend
10
+ 2026-04-30 22:59:27,107 INFO MainThread:2764132 [wandb_init.py:init():895] sending inform_init request
11
+ 2026-04-30 22:59:27,118 INFO MainThread:2764132 [wandb_init.py:init():903] backend started and connected
12
+ 2026-04-30 22:59:27,121 INFO MainThread:2764132 [wandb_init.py:init():973] updated telemetry
13
+ 2026-04-30 22:59:27,162 INFO MainThread:2764132 [wandb_init.py:init():997] communicating run to backend with 90.0 second timeout
14
+ 2026-04-30 22:59:28,542 INFO MainThread:2764132 [wandb_init.py:init():1042] starting run threads in backend
15
+ 2026-04-30 22:59:28,855 INFO MainThread:2764132 [wandb_run.py:_console_start():2524] atexit reg
16
+ 2026-04-30 22:59:28,855 INFO MainThread:2764132 [wandb_run.py:_redirect():2373] redirect: wrap_raw
17
+ 2026-04-30 22:59:28,855 INFO MainThread:2764132 [wandb_run.py:_redirect():2442] Wrapping output streams.
18
+ 2026-04-30 22:59:28,855 INFO MainThread:2764132 [wandb_run.py:_redirect():2465] Redirects installed.
19
+ 2026-04-30 22:59:28,859 INFO MainThread:2764132 [wandb_init.py:init():1082] run started, returning control to user process
20
+ 2026-04-30 23:00:28,271 INFO wandb-AsyncioManager-main:2764132 [service_client.py:_forward_responses():134] Reached EOF.
21
+ 2026-04-30 23:00:28,272 INFO wandb-AsyncioManager-main:2764132 [mailbox.py:close():155] Closing mailbox, abandoning 1 handles.
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_225926-w9xbjand/run-w9xbjand.wandb ADDED
Binary file (28.5 kB). View file
 
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_122daebb61ef6826b8de.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:122daebb61ef6826b8dee51f1938139a654d163927b7a901fab656eca1d70d4c
3
+ size 173173
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_479372da7ed9e768cc22.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:479372da7ed9e768cc22ca68b676f84dc5bc2d17ad4a1b69d9e0603d07062ff0
3
+ size 190184
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_509f08fac994ab8cebb6.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:509f08fac994ab8cebb6e804de594b7eb9f9167ea4c76921bb5f72028356b14f
3
+ size 165124
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_5d1790cb2d9c8554b75b.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d1790cb2d9c8554b75bd606662be361f36a874249939a0be5a170c7592b69cf
3
+ size 249191
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_81b3c24ab2930c8fd6c1.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81b3c24ab2930c8fd6c11e679d51bcdeadef1e799803868d89e8723f2a66ae92
3
+ size 218665
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_8495e04002c0da67769b.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8495e04002c0da67769bc1c07b49ad88f9f86bb3f1569495ee69e5d26c2b032b
3
+ size 223672
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_88d3eab6ac986b51e272.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88d3eab6ac986b51e27203bcd7c70a572b2166615c1abb27f2cc57fc335c0d04
3
+ size 181968
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_8bcc788bab53b0c99f6b.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bcc788bab53b0c99f6b149c63c3b5c459461b6817a0082b55d46850c8937959
3
+ size 171165
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_962d9fe735e704d64274.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:962d9fe735e704d642747fbde8da16feffd849351360204fefacb55f79107665
3
+ size 227679
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/media/videos/val_gt/videos_0_b38481beb241c6eca7c1.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b38481beb241c6eca7c12d0e9e51785568d594ad93e71cc2d900d4a9e0a52a8e
3
+ size 165222
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/output.log ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [Apr 30, 2026 - 23:05:49 | INFO | fastgen.callbacks.wandb:init_wandb:290 ] Wandb code upload disabled (set WANDB_UPLOAD_CODE=true to enable)
2
+ [Apr 30, 2026 - 23:05:49 | SUCCESS | fastgen.trainer:__init__:53 ] Callbacks initialized successfully
3
+ [Apr 30, 2026 - 23:05:49 | INFO | fastgen.trainer:__init__:57 ] Callback synchronization complete
4
+ [Apr 30, 2026 - 23:05:49 | INFO | fastgen.trainer:__init__:60 ] Initializing checkpointer...
5
+ [Apr 30, 2026 - 23:05:49 | SUCCESS | fastgen.trainer:__init__:65 ] Checkpointer initialized successfully
6
+ [Apr 30, 2026 - 23:05:49 | SUCCESS | __main__:main:33 ] Trainer initialized successfully
7
+ [Apr 30, 2026 - 23:05:49 | INFO | fastgen.trainer:run:77 ] Starting training
8
+ [Apr 30, 2026 - 23:05:49 | INFO | fastgen.trainer:run:80 ] Initializing callbacks and model ...
9
+ [Apr 30, 2026 - 23:05:49 | INFO | fastgen.trainer:run:95 ] Starting model.on_train_begin ...
10
+ [Apr 30, 2026 - 23:05:50 | INFO | fastgen.trainer:run:99 ] model.on_train_begin completed
11
+ [Apr 30, 2026 - 23:05:50 | INFO | fastgen.trainer:run:106 ] Wrapping model into ddp ..
12
+ [Apr 30, 2026 - 23:05:51 | INFO | fastgen.trainer:run:108 ] DDP wrapping completed
13
+ [Apr 30, 2026 - 23:05:51 | INFO | fastgen.networks.OmniAvatar.network_causal:_apply_unfreeze:1231 ] [CausalOmniAvatarWan] unfreeze: re-enabled requires_grad on 1.38M params in '_core.audio_proj'
14
+ [Apr 30, 2026 - 23:05:51 | INFO | fastgen.networks.OmniAvatar.network_causal:_apply_unfreeze:1231 ] [CausalOmniAvatarWan] unfreeze: re-enabled requires_grad on 0.71M params in '_core.audio_cond_projs'
15
+ [Apr 30, 2026 - 23:05:51 | INFO | fastgen.networks.OmniAvatar.network_causal:_apply_unfreeze:1231 ] [CausalOmniAvatarWan] unfreeze: re-enabled requires_grad on 0.40M params in '_core.patch_embedding'
16
+ [Apr 30, 2026 - 23:05:51 | INFO | fastgen.networks.OmniAvatar.network_causal:apply_lora_freeze:1193 ] [CausalOmniAvatarWan] apply_lora_freeze: LoRA 174.98M trainable, base 1421.38M frozen, then unfreeze_modules re-enabled on top
17
+ [Apr 30, 2026 - 23:05:51 | INFO | fastgen.trainer:run:133 ] Auto-Resume Details: None
18
+ [Apr 30, 2026 - 23:05:51 | INFO | fastgen.utils.basic_utils:set_random_seed:144 ] Using random seed 0.
19
+ [Apr 30, 2026 - 23:05:51 | INFO | fastgen.trainer:run:165 ] Instantiating dataloader...
20
+ [Apr 30, 2026 - 23:06:47 | INFO | fastgen.callbacks.wandb:on_dataloader_init_end:438 ] Uploading GT validation videos to wandb...
21
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
22
+ warnings.warn(
23
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
24
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
25
+ warnings.warn(
26
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
27
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
28
+ warnings.warn(
29
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
30
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
31
+ warnings.warn(
32
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
33
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
34
+ warnings.warn(
35
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
36
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
37
+ warnings.warn(
38
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
39
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
40
+ warnings.warn(
41
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
42
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
43
+ warnings.warn(
44
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
45
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
46
+ warnings.warn(
47
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
48
+ /usr/local/lib/python3.12/dist-packages/torchvision/io/_video_deprecation_warning.py:5: UserWarning: The video decoding and encoding capabilities of torchvision are deprecated from version 0.22 and will be removed in version 0.24. We recommend that you migrate to TorchCodec, where we'll consolidate the future decoding/encoding capabilities of PyTorch: https://github.com/pytorch/torchcodec
49
+ warnings.warn(
50
+ wandb: WARNING `fps` argument does not affect the frame rate of the video when providing a file path or raw bytes.
51
+ [Apr 30, 2026 - 23:07:34 | INFO | fastgen.callbacks.wandb:on_dataloader_init_end:463 ] Uploaded 10 GT validation videos to wandb
52
+ [Apr 30, 2026 - 23:07:35 | INFO | fastgen.callbacks.gpu_stats:on_train_begin:57 ] every_n to measure gpus stats: 1
53
+ [Apr 30, 2026 - 23:07:35 | INFO | fastgen.callbacks.train_profiler:on_train_begin:54 ] every_n to profile trainer: 1
54
+ [Apr 30, 2026 - 23:07:35 | INFO | fastgen.callbacks.param_count:on_train_begin:79 ] model (OmniAvatarDiffusionForcingModel) has 177.47 M trainable and 1596.36 M total params (logical).
55
+ [Apr 30, 2026 - 23:07:35 | INFO | fastgen.callbacks.param_count:on_train_begin:96 ] model (OmniAvatarDiffusionForcingModel) is NOT sharded (local == logical params).
56
+ [Apr 30, 2026 - 23:07:35 | INFO | fastgen.callbacks.param_count:on_train_begin:79 ] net (CausalOmniAvatarWan) has 177.47 M trainable and 1596.36 M total params (logical).
57
+ [Apr 30, 2026 - 23:07:35 | INFO | fastgen.callbacks.param_count:on_train_begin:96 ] net (CausalOmniAvatarWan) is NOT sharded (local == logical params).
58
+ [Apr 30, 2026 - 23:07:35 | INFO | fastgen.trainer:run:174 ] iter_start: 0
59
+ [rank0]:E0430 23:07:57.183000 2767876 torch/_inductor/select_algorithm.py:2133] [0/0] Runtime error during autotuning:
60
+ [rank0]:E0430 23:07:57.183000 2767876 torch/_inductor/select_algorithm.py:2133] [0/0] No valid triton configs. OutOfResources: out of resource: shared memory, Required: 167968, Hardware limit: 166912. Reducing block sizes or `num_stages` may help..
61
+ [rank0]:E0430 23:07:57.183000 2767876 torch/_inductor/select_algorithm.py:2133] [0/0] Ignoring this choice.
62
+ AUTOTUNE flex_attention(8x12x21504x128, 8x12x21504x128, 8x12x21504x128, 8x12x21504, 1x1x168, 1x1x168x168, 1x1x168, 1x1x168x168, 21504, 21504)
63
+ strides: [33030144, 128, 1536, 1], [33030144, 128, 1536, 1], [33030144, 128, 1536, 1], [258048, 21504, 1], [168, 168, 1], [28224, 28224, 168, 1], [168, 168, 1], [28224, 28224, 168, 1], [1], [1]
64
+ dtypes: torch.bfloat16, torch.bfloat16, torch.bfloat16, torch.float32, torch.int32, torch.int32, torch.int32, torch.int32, torch.int64, torch.int64
65
+ triton_flex_attention_0 313.7815 ms 100.0% BLOCKS_ARE_CONTIGUOUS=False, BLOCK_M=128, BLOCK_N=64, FLOAT32_PRECISION="'tf32'", GQA_SHARED_HEADS=1, HAS_FULL_BLOCKS=True, IS_DIVISIBLE=True, OUTPUT_LOGSUMEXP=True, PRESCALE_QK=False, QK_HEAD_DIM=128, QK_HEAD_DIM_ROUNDED=128, ROWS_GUARANTEED_SAFE=False, SAFE_HEAD_DIM=True, SM_SCALE=0.08838834764831843, SPARSE_KV_BLOCK_SIZE=128, SPARSE_Q_BLOCK_SIZE=128, V_HEAD_DIM=128, V_HEAD_DIM_ROUNDED=128, WRITE_DQ=True, num_stages=3, num_warps=8
66
+ triton_flex_attention_3 317.5469 ms 98.8% BLOCKS_ARE_CONTIGUOUS=False, BLOCK_M=128, BLOCK_N=128, FLOAT32_PRECISION="'tf32'", GQA_SHARED_HEADS=1, HAS_FULL_BLOCKS=True, IS_DIVISIBLE=True, OUTPUT_LOGSUMEXP=True, PRESCALE_QK=False, QK_HEAD_DIM=128, QK_HEAD_DIM_ROUNDED=128, ROWS_GUARANTEED_SAFE=False, SAFE_HEAD_DIM=True, SM_SCALE=0.08838834764831843, SPARSE_KV_BLOCK_SIZE=128, SPARSE_Q_BLOCK_SIZE=128, V_HEAD_DIM=128, V_HEAD_DIM_ROUNDED=128, WRITE_DQ=True, num_stages=2, num_warps=8
67
+ triton_flex_attention_4 423.0356 ms 74.2% BLOCKS_ARE_CONTIGUOUS=False, BLOCK_M=64, BLOCK_N=128, FLOAT32_PRECISION="'tf32'", GQA_SHARED_HEADS=1, HAS_FULL_BLOCKS=True, IS_DIVISIBLE=True, OUTPUT_LOGSUMEXP=True, PRESCALE_QK=False, QK_HEAD_DIM=128, QK_HEAD_DIM_ROUNDED=128, ROWS_GUARANTEED_SAFE=False, SAFE_HEAD_DIM=True, SM_SCALE=0.08838834764831843, SPARSE_KV_BLOCK_SIZE=128, SPARSE_Q_BLOCK_SIZE=128, V_HEAD_DIM=128, V_HEAD_DIM_ROUNDED=128, WRITE_DQ=True, num_stages=3, num_warps=4
68
+ triton_flex_attention_5 500.5695 ms 62.7% BLOCKS_ARE_CONTIGUOUS=False, BLOCK_M=64, BLOCK_N=64, FLOAT32_PRECISION="'tf32'", GQA_SHARED_HEADS=1, HAS_FULL_BLOCKS=True, IS_DIVISIBLE=True, OUTPUT_LOGSUMEXP=True, PRESCALE_QK=False, QK_HEAD_DIM=128, QK_HEAD_DIM_ROUNDED=128, ROWS_GUARANTEED_SAFE=False, SAFE_HEAD_DIM=True, SM_SCALE=0.08838834764831843, SPARSE_KV_BLOCK_SIZE=128, SPARSE_Q_BLOCK_SIZE=128, V_HEAD_DIM=128, V_HEAD_DIM_ROUNDED=128, WRITE_DQ=True, num_stages=3, num_warps=4
69
+ triton_flex_attention_1 713.1403 ms 44.0% BLOCKS_ARE_CONTIGUOUS=False, BLOCK_M=128, BLOCK_N=64, FLOAT32_PRECISION="'tf32'", GQA_SHARED_HEADS=1, HAS_FULL_BLOCKS=True, IS_DIVISIBLE=True, OUTPUT_LOGSUMEXP=True, PRESCALE_QK=False, QK_HEAD_DIM=128, QK_HEAD_DIM_ROUNDED=128, ROWS_GUARANTEED_SAFE=False, SAFE_HEAD_DIM=True, SM_SCALE=0.08838834764831843, SPARSE_KV_BLOCK_SIZE=128, SPARSE_Q_BLOCK_SIZE=128, V_HEAD_DIM=128, V_HEAD_DIM_ROUNDED=128, WRITE_DQ=True, num_stages=3, num_warps=4
70
+ triton_flex_attention_2 inf ms 0.0% BLOCKS_ARE_CONTIGUOUS=False, BLOCK_M=128, BLOCK_N=128, FLOAT32_PRECISION="'tf32'", GQA_SHARED_HEADS=1, HAS_FULL_BLOCKS=True, IS_DIVISIBLE=True, OUTPUT_LOGSUMEXP=True, PRESCALE_QK=False, QK_HEAD_DIM=128, QK_HEAD_DIM_ROUNDED=128, ROWS_GUARANTEED_SAFE=False, SAFE_HEAD_DIM=True, SM_SCALE=0.08838834764831843, SPARSE_KV_BLOCK_SIZE=128, SPARSE_Q_BLOCK_SIZE=128, V_HEAD_DIM=128, V_HEAD_DIM_ROUNDED=128, WRITE_DQ=True, num_stages=3, num_warps=4
71
+ SingleProcess AUTOTUNE benchmarking takes 16.4067 seconds and 6.2248 seconds precompiling for 6 choices
72
+ [rank0]:E0430 23:16:11.647000 2767876 torch/_inductor/select_algorithm.py:2133] [0/0] Runtime error during autotuning:
73
+ [rank0]:E0430 23:16:11.647000 2767876 torch/_inductor/select_algorithm.py:2133] [0/0] No valid triton configs. OutOfResources: out of resource: shared memory, Required: 172032, Hardware limit: 166912. Reducing block sizes or `num_stages` may help..
74
+ [rank0]:E0430 23:16:11.647000 2767876 torch/_inductor/select_algorithm.py:2133] [0/0] Ignoring this choice.
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/requirements.txt ADDED
@@ -0,0 +1,417 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ DistVAE==0.0.0b5
2
+ PySocks==1.7.1
3
+ absl-py==2.4.0
4
+ accelerate==1.13.0
5
+ albucore==0.0.24
6
+ albumentations==2.0.8
7
+ antlr4-python3-runtime==4.9.3
8
+ av==17.0.0
9
+ blessed==1.33.0
10
+ boto3==1.42.74
11
+ botocore==1.42.74
12
+ braceexpand==0.1.7
13
+ cuda-bindings==13.2.0
14
+ cuda-pathfinder==1.4.4
15
+ cuda-toolkit==13.0.2
16
+ decord==0.6.0
17
+ diffusers==0.37.0
18
+ dlib==20.0.0
19
+ easydict==1.13
20
+ flatbuffers==25.12.19
21
+ ftfy==6.3.1
22
+ gdown==5.2.1
23
+ gitdb==4.0.12
24
+ GitPython==3.1.46
25
+ gpustat==1.1.1
26
+ hf-xet==1.4.2
27
+ huggingface_hub==1.7.2
28
+ hydra-core==1.3.2
29
+ ImageIO==2.37.3
30
+ imageio-ffmpeg==0.6.0
31
+ insightface==0.7.3
32
+ jmespath==1.1.0
33
+ kornia==0.8.2
34
+ kornia_rs==0.1.10
35
+ lmdb==2.2.0
36
+ loguru==0.7.3
37
+ mediapipe==0.10.18
38
+ moviepy==2.2.1
39
+ nvidia-cublas==13.1.0.3
40
+ nvidia-cuda-cupti==13.0.85
41
+ nvidia-cuda-nvrtc==13.0.88
42
+ nvidia-cuda-runtime==13.0.96
43
+ nvidia-cudnn-cu13==9.19.0.56
44
+ nvidia-cufft==12.0.0.61
45
+ nvidia-cufile==1.15.1.6
46
+ nvidia-curand==10.4.0.35
47
+ nvidia-cusolver==12.0.4.66
48
+ nvidia-cusparse==12.6.3.3
49
+ nvidia-cusparselt-cu13==0.8.0
50
+ nvidia-nccl-cu13==2.28.9
51
+ nvidia-nvjitlink==13.0.88
52
+ nvidia-nvshmem-cu13==3.4.5
53
+ nvidia-nvtx==13.0.85
54
+ nvitop==1.6.2
55
+ omegaconf==2.3.0
56
+ onnxruntime==1.24.4
57
+ onnxruntime-gpu==1.24.4
58
+ open_clip_torch==3.3.0
59
+ opencv-python-headless==4.11.0.86
60
+ optimum-quanto==0.2.7
61
+ peft==0.18.1
62
+ prettytable==3.17.0
63
+ proglog==0.1.12
64
+ pyloudnorm==0.2.0
65
+ python-dotenv==1.2.2
66
+ python_speech_features==0.6
67
+ pytorch-fid==0.3.0
68
+ s3transfer==0.16.0
69
+ scenedetect==0.6.7.1
70
+ scikit-image==0.26.0
71
+ sentencepiece==0.2.1
72
+ sentry-sdk==2.55.0
73
+ simsimd==6.5.16
74
+ smmap==5.0.3
75
+ sounddevice==0.5.5
76
+ stringzilla==4.6.0
77
+ tifffile==2026.3.3
78
+ timm==1.0.26
79
+ tokenizers==0.22.2
80
+ transformers==5.3.0
81
+ triton==3.2.0
82
+ wandb==0.25.1
83
+ wcwidth==0.6.0
84
+ webdataset==1.0.2
85
+ xfuser==0.4.5
86
+ yunchang==0.6.4
87
+ jupyterlab==4.5.0a1
88
+ nvdlfw_inspect==0.1.0
89
+ transformer_engine==2.3.0+5de3e14
90
+ einops==0.8.1
91
+ flash_attn==2.7.3
92
+ torch_tensorrt==2.8.0a0
93
+ apex==0.1
94
+ nvidia-modelopt==0.27.1
95
+ nvidia-modelopt-core==0.27.1
96
+ nvidia-resiliency-ext==0.3.0
97
+ polygraphy==0.49.20
98
+ PuLP==3.1.1
99
+ safetensors==0.5.3
100
+ torchprofile==0.0.4
101
+ tensorrt==10.10.0.31
102
+ Cython==3.0.12
103
+ aiohappyeyeballs==2.6.1
104
+ aiohttp==3.11.16
105
+ aiosignal==1.3.2
106
+ asciitree==0.3.3
107
+ cachetools==5.5.2
108
+ charset-normalizer==3.4.1
109
+ cloudpickle==3.1.1
110
+ cuda-bindings==12.8.0
111
+ cuda-python==12.8.0
112
+ cudf==25.4.0
113
+ cudf-polars==25.4.0
114
+ cugraph==25.4.0
115
+ cugraph-service-client==25.4.0
116
+ cugraph-service-server==25.4.0
117
+ cuml==25.4.0
118
+ cupy-cuda12x==13.3.0
119
+ cuvs==25.4.0
120
+ dask==2025.2.0
121
+ dask-cuda==25.4.0
122
+ dask-cudf==25.4.0
123
+ distributed==2025.2.0
124
+ distributed-ucxx==0.43.0
125
+ fasteners==0.19
126
+ fastrlock==0.8.3
127
+ frozenlist==1.5.0
128
+ fsspec==2025.3.2
129
+ grpcio==1.62.1
130
+ joblib==1.4.2
131
+ kvikio==25.4.0
132
+ libcudf==25.4.0
133
+ libcugraph==25.4.0
134
+ libcuml==25.4.0
135
+ libcuvs==25.4.0
136
+ libkvikio==25.4.0
137
+ libraft==25.4.0
138
+ librmm==25.4.0
139
+ librmm-cu12==25.4.0
140
+ libucxx==0.43.0
141
+ llvmlite==0.42.0
142
+ locket==1.0.0
143
+ multidict==6.4.3
144
+ numba==0.59.1
145
+ numba-cuda==0.4.0
146
+ numcodecs==0.13.1
147
+ nvidia-ml-py==12.570.86
148
+ nvtx==0.2.11
149
+ nx-cugraph==25.4.0
150
+ packaging==23.2
151
+ pandas==2.2.3
152
+ partd==1.4.2
153
+ ply==3.11
154
+ polars==1.25.2
155
+ propcache==0.3.1
156
+ pyarrow==19.0.1
157
+ pylibcudf==25.4.0
158
+ pylibcugraph==25.4.0
159
+ pylibraft==25.4.0
160
+ pylibwholegraph==25.4.0
161
+ pynvjitlink==0.3.0
162
+ pynvml==12.0.0
163
+ pytz==2023.4
164
+ raft-dask==25.4.0
165
+ rapids-dask-dependency==25.4.0a0
166
+ rapids-logger==0.1.11
167
+ rmm==25.4.0
168
+ scipy==1.15.2
169
+ tblib==3.1.0
170
+ thriftpy2==0.5.2
171
+ toolz==1.0.0
172
+ treelite==4.4.1
173
+ tzdata==2025.2
174
+ ucx-py==0.43.0
175
+ ucxx==0.43.0
176
+ urllib3==2.0.7
177
+ xgboost==2.1.3
178
+ yarl==1.19.0
179
+ zarr==2.18.7
180
+ zict==3.0.0
181
+ tabulate==0.9.0
182
+ nvidia-cudnn-frontend==1.11.0
183
+ onnx==1.17.0
184
+ pybind11_global==2.13.6
185
+ contourpy==1.3.2
186
+ cycler==0.12.1
187
+ fonttools==4.58.0
188
+ kiwisolver==1.4.8
189
+ matplotlib==3.10.3
190
+ pycocotools==2.0+nv0.8.1
191
+ pyparsing==3.2.3
192
+ dm-tree==0.1.9
193
+ gast==0.6.0
194
+ nvidia-dali-cuda120==1.49.0
195
+ nvidia-nvcomp-cu12==4.2.0.14
196
+ nvidia-nvimgcodec-cu12==0.5.0.13
197
+ nvidia-nvjpeg2k-cu12==0.8.1.40
198
+ nvidia-nvjpeg-cu12==12.4.0.16
199
+ nvidia-nvtiff-cu12==0.5.0.67
200
+ pytorch-triton==3.3.0+git96316ce52.nvinternal
201
+ lintrunner==0.12.7
202
+ ninja==1.11.1.4
203
+ optree==0.15.0
204
+ setuptools==78.1.1
205
+ types-dataclasses==0.6.6
206
+ filelock==3.18.0
207
+ mpmath==1.3.0
208
+ networkx==3.4.2
209
+ pillow==11.2.1
210
+ sympy==1.14.0
211
+ torch==2.8.0a0+5228986c39.nv25.5
212
+ torchvision==0.22.0a0
213
+ opencv==4.10.0
214
+ black==25.1.0
215
+ isort==6.0.1
216
+ jupyterlab_tensorboard_pro==4.0.0
217
+ jupytext==1.17.1
218
+ mdit-py-plugins==0.4.2
219
+ mypy_extensions==1.1.0
220
+ pathspec==0.12.1
221
+ Send2Trash==1.8.3
222
+ absl-py==2.2.2
223
+ anyio==4.9.0
224
+ argon2-cffi==23.1.0
225
+ argon2-cffi-bindings==21.2.0
226
+ arrow==1.3.0
227
+ asttokens==3.0.0
228
+ async-lru==2.0.5
229
+ babel==2.17.0
230
+ beautifulsoup4==4.13.4
231
+ bleach==6.2.0
232
+ comm==0.2.2
233
+ debugpy==1.8.14
234
+ defusedxml==0.7.1
235
+ executing==2.2.0
236
+ fastjsonschema==2.21.1
237
+ fqdn==1.5.1
238
+ h11==0.16.0
239
+ httpcore==1.0.9
240
+ httpx==0.28.1
241
+ ipykernel==6.29.5
242
+ ipython==9.2.0
243
+ ipython_pygments_lexers==1.1.1
244
+ isoduration==20.11.0
245
+ jedi==0.19.2
246
+ json5==0.12.0
247
+ jsonpointer==3.0.0
248
+ jsonschema==4.23.0
249
+ jsonschema-specifications==2025.4.1
250
+ jupyter_client==8.6.3
251
+ jupyter_core==5.7.2
252
+ jupyter-events==0.12.0
253
+ jupyter-lsp==2.2.5
254
+ jupyter_server==2.16.0
255
+ jupyter_server_terminals==0.5.3
256
+ jupyterlab_code_formatter==3.0.2
257
+ jupyterlab_pygments==0.3.0
258
+ jupyterlab_server==2.27.3
259
+ Markdown==3.8
260
+ matplotlib-inline==0.1.7
261
+ mistune==3.1.3
262
+ nbclient==0.10.2
263
+ nbconvert==7.16.6
264
+ nbformat==5.10.4
265
+ nest-asyncio==1.6.0
266
+ notebook==7.4.2
267
+ notebook_shim==0.2.4
268
+ overrides==7.7.0
269
+ pandocfilters==1.5.1
270
+ parso==0.8.4
271
+ pexpect==4.9.0
272
+ prometheus_client==0.22.0
273
+ prompt_toolkit==3.0.51
274
+ psutil==7.0.0
275
+ ptyprocess==0.7.0
276
+ pure_eval==0.2.3
277
+ python-dateutil==2.9.0.post0
278
+ python-hostlist==2.2.1
279
+ python-json-logger==3.3.0
280
+ pyzmq==26.4.0
281
+ referencing==0.36.2
282
+ rfc3339-validator==0.1.4
283
+ rfc3986-validator==0.1.1
284
+ rpds-py==0.25.1
285
+ sniffio==1.3.1
286
+ soupsieve==2.7
287
+ stack-data==0.6.3
288
+ tensorboard==2.16.2
289
+ tensorboard-data-server==0.7.2
290
+ terminado==0.18.1
291
+ tinycss2==1.4.0
292
+ tornado==6.5
293
+ traitlets==5.14.3
294
+ types-python-dateutil==2.9.0.20250516
295
+ uri-template==1.3.0
296
+ wcwidth==0.2.13
297
+ webcolors==24.11.1
298
+ webencodings==0.5.1
299
+ websocket-client==1.8.0
300
+ Werkzeug==3.1.3
301
+ MarkupSafe==3.0.2
302
+ PyYAML==6.0.2
303
+ annotated-types==0.7.0
304
+ astunparse==1.6.3
305
+ attrs==25.3.0
306
+ audioread==3.0.1
307
+ blis==0.7.11
308
+ catalogue==2.0.10
309
+ certifi==2025.4.26
310
+ cffi==1.17.1
311
+ click==8.1.8
312
+ cloudpathlib==0.21.1
313
+ confection==0.1.5
314
+ cymem==2.0.11
315
+ decorator==5.2.1
316
+ execnet==2.1.1
317
+ expecttest==0.3.0
318
+ hypothesis==6.130.8
319
+ idna==3.10
320
+ iniconfig==2.1.0
321
+ intel-openmp==2021.4.0
322
+ Jinja2==3.1.6
323
+ langcodes==3.5.0
324
+ language_data==1.3.0
325
+ lazy_loader==0.4
326
+ librosa==0.11.0
327
+ marisa-trie==1.2.1
328
+ markdown-it-py==3.0.0
329
+ mdurl==0.1.2
330
+ mkl==2021.1.1
331
+ mkl-devel==2021.1.1
332
+ mkl-include==2021.1.1
333
+ mock==5.2.0
334
+ msgpack==1.1.0
335
+ murmurhash==1.0.12
336
+ numpy==1.26.4
337
+ platformdirs==4.3.8
338
+ pluggy==1.6.0
339
+ pooch==1.8.2
340
+ preshed==3.0.9
341
+ protobuf==4.24.4
342
+ pybind11==2.13.6
343
+ pycparser==2.22
344
+ pydantic==2.11.4
345
+ pydantic_core==2.33.2
346
+ Pygments==2.19.1
347
+ pytest==8.1.1
348
+ pytest-flakefinder==1.1.0
349
+ pytest-rerunfailures==15.1
350
+ pytest-shard==0.1.2
351
+ pytest-xdist==3.6.1
352
+ regex==2024.11.6
353
+ requests==2.32.3
354
+ rich==14.0.0
355
+ scikit-learn==1.6.1
356
+ shellingham==1.5.4
357
+ six==1.16.0
358
+ smart-open==7.1.0
359
+ sortedcontainers==2.4.0
360
+ soundfile==0.13.1
361
+ soxr==0.5.0.post1
362
+ spacy==3.7.5
363
+ spacy-legacy==3.0.12
364
+ spacy-loggers==1.0.5
365
+ srsly==2.5.1
366
+ tbb==2021.13.1
367
+ thinc==8.2.5
368
+ threadpoolctl==3.6.0
369
+ tqdm==4.67.1
370
+ typer==0.15.4
371
+ typing_extensions==4.13.2
372
+ typing-inspection==0.4.1
373
+ wasabi==1.1.3
374
+ weasel==0.4.1
375
+ wheel==0.45.1
376
+ wrapt==1.17.2
377
+ xdoctest==1.0.2
378
+ cmake==3.31.6
379
+ pip==25.1.1
380
+ nvfuser==0.2.27a0+9bf5aca
381
+ lightning-thunder==0.2.3.dev0
382
+ dill==0.4.0
383
+ opt_einsum==3.4.0
384
+ lightning-utilities==0.14.3
385
+ looseversion==1.3.0
386
+ autocommand==2.2.2
387
+ backports.tarfile==1.2.0
388
+ importlib_metadata==8.0.0
389
+ inflect==7.3.1
390
+ jaraco.collections==5.1.0
391
+ jaraco.context==5.3.0
392
+ jaraco.functools==4.0.1
393
+ jaraco.text==3.12.1
394
+ more-itertools==10.3.0
395
+ packaging==24.2
396
+ platformdirs==4.2.2
397
+ tomli==2.0.1
398
+ typeguard==4.3.0
399
+ typing_extensions==4.12.2
400
+ wheel==0.45.1
401
+ zipp==3.19.2
402
+ PyGObject==3.48.2
403
+ PyJWT==2.7.0
404
+ blinker==1.7.0
405
+ cryptography==41.0.7
406
+ cryptography==41.0.7
407
+ dbus-python==1.3.2
408
+ distro==1.9.0
409
+ httplib2==0.20.4
410
+ launchpadlib==1.11.0
411
+ lazr.restfulclient==0.14.6
412
+ lazr.uri==1.0.6
413
+ oauthlib==3.2.2
414
+ pyparsing==3.1.1
415
+ six==1.16.0
416
+ ssh-import-id==5.11
417
+ wadllib==1.3.6
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/files/wandb-metadata.json ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-142-generic-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.12.3",
4
+ "startedAt": "2026-04-30T14:05:47.459514Z",
5
+ "args": [
6
+ "--config=fastgen/configs/experiments/OmniAvatar/config_df_shift_5_lora_t769.py",
7
+ "-",
8
+ "dataloader_train.batch_size=8",
9
+ "dataloader_train.latentsync_mask_path=/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/mask.png",
10
+ "dataloader_val.latentsync_mask_path=/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/mask.png",
11
+ "trainer.ddp=True",
12
+ "trainer.max_iter=5000",
13
+ "trainer.save_ckpt_iter=500",
14
+ "trainer.resume=False",
15
+ "log_config.group=omniavatar_df_audiofix",
16
+ "log_config.name=df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter",
17
+ "log_config.project=OmniAvatar-FastGen",
18
+ "log_config.wandb_entity=paulhcho"
19
+ ],
20
+ "program": "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/train.py",
21
+ "codePath": "train.py",
22
+ "codePathLocal": "train.py",
23
+ "git": {
24
+ "remote": "https://github.com/paulcho98/FastGen.git",
25
+ "commit": "f5897815a4bdcc8f11212b24f367a6839a5409ca"
26
+ },
27
+ "email": "paul.hyunbin@gmail.com",
28
+ "root": "/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter",
29
+ "host": "instance-35250",
30
+ "executable": "/usr/bin/python",
31
+ "cpu_count": 64,
32
+ "cpu_count_logical": 128,
33
+ "gpu": "NVIDIA A100-SXM4-80GB",
34
+ "gpu_count": 8,
35
+ "disk": {
36
+ "/": {
37
+ "total": "1599530123264",
38
+ "used": "753074790400"
39
+ }
40
+ },
41
+ "memory": {
42
+ "total": "1081693446144"
43
+ },
44
+ "gpu_nvidia": [
45
+ {
46
+ "name": "NVIDIA A100-SXM4-80GB",
47
+ "memoryTotal": "85899345920",
48
+ "cudaCores": 6912,
49
+ "architecture": "Ampere",
50
+ "uuid": "GPU-c1619da3-e2c1-15b0-cb55-50e24b1f8e99"
51
+ },
52
+ {
53
+ "name": "NVIDIA A100-SXM4-80GB",
54
+ "memoryTotal": "85899345920",
55
+ "cudaCores": 6912,
56
+ "architecture": "Ampere",
57
+ "uuid": "GPU-29f274f2-7065-4653-dcd1-055518ba099c"
58
+ },
59
+ {
60
+ "name": "NVIDIA A100-SXM4-80GB",
61
+ "memoryTotal": "85899345920",
62
+ "cudaCores": 6912,
63
+ "architecture": "Ampere",
64
+ "uuid": "GPU-47a2dd51-a5dc-1d24-4713-ea97b7049d18"
65
+ },
66
+ {
67
+ "name": "NVIDIA A100-SXM4-80GB",
68
+ "memoryTotal": "85899345920",
69
+ "cudaCores": 6912,
70
+ "architecture": "Ampere",
71
+ "uuid": "GPU-ad40d9cb-0070-8a6c-f0a3-d8d40d8233a7"
72
+ },
73
+ {
74
+ "name": "NVIDIA A100-SXM4-80GB",
75
+ "memoryTotal": "85899345920",
76
+ "cudaCores": 6912,
77
+ "architecture": "Ampere",
78
+ "uuid": "GPU-97413b12-6c45-b8cd-a06a-886dd3bc94d6"
79
+ },
80
+ {
81
+ "name": "NVIDIA A100-SXM4-80GB",
82
+ "memoryTotal": "85899345920",
83
+ "cudaCores": 6912,
84
+ "architecture": "Ampere",
85
+ "uuid": "GPU-060cf5c3-ba18-6ff1-9d4d-9e9c71bf6c67"
86
+ },
87
+ {
88
+ "name": "NVIDIA A100-SXM4-80GB",
89
+ "memoryTotal": "85899345920",
90
+ "cudaCores": 6912,
91
+ "architecture": "Ampere",
92
+ "uuid": "GPU-6562d339-d2bb-95e2-3881-199a64c50ba7"
93
+ },
94
+ {
95
+ "name": "NVIDIA A100-SXM4-80GB",
96
+ "memoryTotal": "85899345920",
97
+ "cudaCores": 6912,
98
+ "architecture": "Ampere",
99
+ "uuid": "GPU-a6834410-f241-7270-f5e3-129ecdc2e8f3"
100
+ }
101
+ ],
102
+ "cudaVersion": "12.9",
103
+ "writerId": "d5096jhay1ocyc5oe5r6t4060xhmxcoy"
104
+ }
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/logs/debug-internal.log ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-30T23:05:47.717661886+09:00","level":"INFO","msg":"wandb-core"}
2
+ {"time":"2026-04-30T23:05:47.719875838+09:00","level":"INFO","msg":"stream: starting","core version":"0.25.1"}
3
+ {"time":"2026-04-30T23:05:48.202102105+09:00","level":"INFO","msg":"stream: created new stream","id":"aogal2qe"}
4
+ {"time":"2026-04-30T23:05:48.202176404+09:00","level":"INFO","msg":"handler: started"}
5
+ {"time":"2026-04-30T23:05:48.203751244+09:00","level":"INFO","msg":"stream: started"}
6
+ {"time":"2026-04-30T23:05:48.203784235+09:00","level":"INFO","msg":"sender: started"}
7
+ {"time":"2026-04-30T23:05:48.203780548+09:00","level":"INFO","msg":"writer: started","stream_id":"aogal2qe"}
8
+ {"time":"2026-04-30T23:05:49.289209394+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"console_offset":0,"console_lines":1}
9
+ {"time":"2026-04-30T23:05:49.628819533+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
10
+ {"time":"2026-04-30T23:06:04.28911266+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":0,"events_lines":2,"console_offset":0,"console_lines":19,"uploaded_len":2}
11
+ {"time":"2026-04-30T23:06:04.68488743+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
12
+ {"time":"2026-04-30T23:06:19.28947862+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":2,"events_lines":2}
13
+ {"time":"2026-04-30T23:06:19.593106092+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
14
+ {"time":"2026-04-30T23:06:34.289531575+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":4,"events_lines":2}
15
+ {"time":"2026-04-30T23:06:34.638885012+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
16
+ {"time":"2026-04-30T23:06:49.289408032+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":6,"events_lines":2,"console_offset":19,"console_lines":1}
17
+ {"time":"2026-04-30T23:06:49.55441404+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
18
+ {"time":"2026-04-30T23:07:04.2893822+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":8,"events_lines":2}
19
+ {"time":"2026-04-30T23:07:04.547174503+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
20
+ {"time":"2026-04-30T23:07:19.289556072+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":10,"events_lines":2}
21
+ {"time":"2026-04-30T23:07:19.542062737+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
22
+ {"time":"2026-04-30T23:07:34.289675411+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":12,"events_lines":2,"console_offset":20,"console_lines":29}
23
+ {"time":"2026-04-30T23:07:34.590652485+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
24
+ {"time":"2026-04-30T23:07:49.289694092+09:00","level":"INFO","msg":"filestream: sending request","total_files":3,"events_offset":14,"events_lines":2,"console_offset":49,"console_lines":9,"uploaded_len":10}
25
+ {"time":"2026-04-30T23:07:49.578907428+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
26
+ {"time":"2026-04-30T23:08:04.289321845+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":16,"events_lines":2,"console_offset":58,"console_lines":3}
27
+ {"time":"2026-04-30T23:08:04.654848542+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
28
+ {"time":"2026-04-30T23:08:19.302053487+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":18,"events_lines":2,"console_offset":61,"console_lines":10}
29
+ {"time":"2026-04-30T23:08:19.606327435+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
30
+ {"time":"2026-04-30T23:08:34.288993064+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":20,"events_lines":2}
31
+ {"time":"2026-04-30T23:08:34.57863+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
32
+ {"time":"2026-04-30T23:08:49.289673912+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":22,"events_lines":2}
33
+ {"time":"2026-04-30T23:08:49.597082041+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
34
+ {"time":"2026-04-30T23:09:04.289440794+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":24,"events_lines":2}
35
+ {"time":"2026-04-30T23:09:04.62933334+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
36
+ {"time":"2026-04-30T23:09:19.289512374+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":26,"events_lines":2}
37
+ {"time":"2026-04-30T23:09:19.579604059+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
38
+ {"time":"2026-04-30T23:09:34.288965379+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":28,"events_lines":2}
39
+ {"time":"2026-04-30T23:09:34.594544765+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
40
+ {"time":"2026-04-30T23:09:49.288782859+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":30,"events_lines":2}
41
+ {"time":"2026-04-30T23:09:49.612205294+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
42
+ {"time":"2026-04-30T23:10:04.289135035+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":32,"events_lines":2}
43
+ {"time":"2026-04-30T23:10:04.630551549+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
44
+ {"time":"2026-04-30T23:10:19.288780712+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":34,"events_lines":2}
45
+ {"time":"2026-04-30T23:10:19.682644618+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
46
+ {"time":"2026-04-30T23:10:34.289481389+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":36,"events_lines":2}
47
+ {"time":"2026-04-30T23:10:34.647039103+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
48
+ {"time":"2026-04-30T23:10:49.289265985+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":38,"events_lines":2}
49
+ {"time":"2026-04-30T23:10:49.730743901+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
50
+ {"time":"2026-04-30T23:11:04.289172039+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":40,"events_lines":2}
51
+ {"time":"2026-04-30T23:11:04.731077132+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
52
+ {"time":"2026-04-30T23:11:19.289448884+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":42,"events_lines":2}
53
+ {"time":"2026-04-30T23:11:19.667453476+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
54
+ {"time":"2026-04-30T23:11:34.289592911+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":44,"events_lines":2}
55
+ {"time":"2026-04-30T23:11:34.668128144+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
56
+ {"time":"2026-04-30T23:11:49.288778693+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":46,"events_lines":2}
57
+ {"time":"2026-04-30T23:11:49.644035721+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
58
+ {"time":"2026-04-30T23:12:04.289349786+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":48,"events_lines":2}
59
+ {"time":"2026-04-30T23:12:04.736082536+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
60
+ {"time":"2026-04-30T23:12:19.288945368+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":50,"events_lines":2}
61
+ {"time":"2026-04-30T23:12:19.610329497+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
62
+ {"time":"2026-04-30T23:12:34.289571483+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":52,"events_lines":2}
63
+ {"time":"2026-04-30T23:12:34.587850694+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
64
+ {"time":"2026-04-30T23:12:49.288764613+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":54,"events_lines":2}
65
+ {"time":"2026-04-30T23:12:49.719622981+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
66
+ {"time":"2026-04-30T23:13:04.288637224+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":56,"events_lines":2}
67
+ {"time":"2026-04-30T23:13:04.582812338+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
68
+ {"time":"2026-04-30T23:13:19.289301406+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":58,"events_lines":2}
69
+ {"time":"2026-04-30T23:13:19.553204842+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
70
+ {"time":"2026-04-30T23:13:34.289451588+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":60,"events_lines":2}
71
+ {"time":"2026-04-30T23:13:34.534556354+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
72
+ {"time":"2026-04-30T23:13:49.288622643+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":62,"events_lines":2}
73
+ {"time":"2026-04-30T23:13:49.595316475+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
74
+ {"time":"2026-04-30T23:14:04.289144412+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":64,"events_lines":2}
75
+ {"time":"2026-04-30T23:14:04.543244073+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
76
+ {"time":"2026-04-30T23:14:19.288823516+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":66,"events_lines":2}
77
+ {"time":"2026-04-30T23:14:19.571833716+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
78
+ {"time":"2026-04-30T23:14:34.289509199+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":68,"events_lines":2}
79
+ {"time":"2026-04-30T23:14:34.579585848+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
80
+ {"time":"2026-04-30T23:14:49.288824765+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":70,"events_lines":2}
81
+ {"time":"2026-04-30T23:14:49.612924595+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
82
+ {"time":"2026-04-30T23:15:04.2892304+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":72,"events_lines":2}
83
+ {"time":"2026-04-30T23:15:04.566368977+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
84
+ {"time":"2026-04-30T23:15:19.288719459+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":74,"events_lines":2}
85
+ {"time":"2026-04-30T23:15:19.609636252+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
86
+ {"time":"2026-04-30T23:15:34.289310014+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":76,"events_lines":2}
87
+ {"time":"2026-04-30T23:15:34.584427145+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
88
+ {"time":"2026-04-30T23:15:49.288956977+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":78,"events_lines":2}
89
+ {"time":"2026-04-30T23:15:49.614829139+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
90
+ {"time":"2026-04-30T23:16:04.289218328+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":80,"events_lines":2}
91
+ {"time":"2026-04-30T23:16:04.60993107+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
92
+ {"time":"2026-04-30T23:16:19.289171247+09:00","level":"INFO","msg":"filestream: sending request","total_files":2,"events_offset":82,"events_lines":2,"console_offset":71,"console_lines":3}
93
+ {"time":"2026-04-30T23:16:19.628814484+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
94
+ {"time":"2026-04-30T23:16:34.288676582+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":84,"events_lines":2}
95
+ {"time":"2026-04-30T23:16:34.689081134+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
96
+ {"time":"2026-04-30T23:16:49.288933188+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":86,"events_lines":2}
97
+ {"time":"2026-04-30T23:16:49.62914172+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
98
+ {"time":"2026-04-30T23:17:04.288607448+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":88,"events_lines":2}
99
+ {"time":"2026-04-30T23:17:04.589594346+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
100
+ {"time":"2026-04-30T23:17:19.289321381+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":90,"events_lines":2}
101
+ {"time":"2026-04-30T23:17:19.564264059+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
102
+ {"time":"2026-04-30T23:17:34.288994724+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":92,"events_lines":2}
103
+ {"time":"2026-04-30T23:17:34.552863001+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
104
+ {"time":"2026-04-30T23:17:49.289503425+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":94,"events_lines":2}
105
+ {"time":"2026-04-30T23:17:49.588243139+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
106
+ {"time":"2026-04-30T23:18:04.28878216+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":96,"events_lines":2}
107
+ {"time":"2026-04-30T23:18:04.554107868+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
108
+ {"time":"2026-04-30T23:18:19.289179022+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":98,"events_lines":2}
109
+ {"time":"2026-04-30T23:18:19.612210314+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
110
+ {"time":"2026-04-30T23:18:34.288875601+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":100,"events_lines":2}
111
+ {"time":"2026-04-30T23:18:34.581426522+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
112
+ {"time":"2026-04-30T23:18:49.289382733+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":102,"events_lines":2}
113
+ {"time":"2026-04-30T23:18:49.571645992+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
114
+ {"time":"2026-04-30T23:19:04.28863327+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":104,"events_lines":2}
115
+ {"time":"2026-04-30T23:19:04.567218404+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
116
+ {"time":"2026-04-30T23:19:19.288592986+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":106,"events_lines":2}
117
+ {"time":"2026-04-30T23:19:19.559133381+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
118
+ {"time":"2026-04-30T23:19:34.288571933+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":108,"events_lines":2}
119
+ {"time":"2026-04-30T23:19:34.543783797+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
120
+ {"time":"2026-04-30T23:19:49.289279029+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":110,"events_lines":2}
121
+ {"time":"2026-04-30T23:19:49.634365885+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
122
+ {"time":"2026-04-30T23:20:04.288850186+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":112,"events_lines":2}
123
+ {"time":"2026-04-30T23:20:04.569464453+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
124
+ {"time":"2026-04-30T23:20:19.289155372+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":114,"events_lines":2}
125
+ {"time":"2026-04-30T23:20:19.613994616+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
126
+ {"time":"2026-04-30T23:20:34.289328425+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":116,"events_lines":2}
127
+ {"time":"2026-04-30T23:20:34.620516915+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
128
+ {"time":"2026-04-30T23:20:49.288670175+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":118,"events_lines":2}
129
+ {"time":"2026-04-30T23:20:49.701752992+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
130
+ {"time":"2026-04-30T23:21:04.289448285+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":120,"events_lines":2}
131
+ {"time":"2026-04-30T23:21:04.672086777+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
132
+ {"time":"2026-04-30T23:21:19.288957688+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":122,"events_lines":2}
133
+ {"time":"2026-04-30T23:21:19.808028855+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
134
+ {"time":"2026-04-30T23:21:34.289496467+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":124,"events_lines":2}
135
+ {"time":"2026-04-30T23:21:34.598270838+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
136
+ {"time":"2026-04-30T23:21:49.288582737+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":126,"events_lines":2}
137
+ {"time":"2026-04-30T23:21:49.602869427+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
138
+ {"time":"2026-04-30T23:22:04.289027983+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":128,"events_lines":2}
139
+ {"time":"2026-04-30T23:22:04.602488321+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
140
+ {"time":"2026-04-30T23:22:19.288843665+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":130,"events_lines":2}
141
+ {"time":"2026-04-30T23:22:19.590625944+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
142
+ {"time":"2026-04-30T23:22:34.288973354+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":132,"events_lines":2}
143
+ {"time":"2026-04-30T23:22:34.576595162+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
144
+ {"time":"2026-04-30T23:22:49.28941316+09:00","level":"INFO","msg":"filestream: sending request","total_files":1,"events_offset":134,"events_lines":1}
145
+ {"time":"2026-04-30T23:22:49.617243724+09:00","level":"INFO","msg":"filestream: request sent","status":"200 OK"}
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/logs/debug.log ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_setup.py:_flush():81] Current SDK version is 0.25.1
2
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_setup.py:_flush():81] Configure stats pid to 2767876
3
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_setup.py:_flush():81] Loading settings from environment variables
4
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:setup_run_log_directory():717] Logging user logs to /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/logs/debug.log
5
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:setup_run_log_directory():718] Logging internal logs to /data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/logs/debug-internal.log
6
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:init():844] calling init triggers
7
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:init():849] wandb.init called with sweep_config: {}
8
+ config: {'log_config': {'project': 'OmniAvatar-FastGen', 'group': 'omniavatar_df_audiofix', 'name': 'df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter', 'wandb_mode': 'online', 'wandb_entity': 'paulhcho', 'wandb_credential': './credentials/wandb_api.txt'}, 'trainer': {'cudnn': {'deterministic': 'False', 'benchmark': 'True'}, 'checkpointer': {'save_dir': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/FastGen/output/DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/checkpoints', 'use_s3': 'False', 's3_container': 's3://checkpoints/fastgen', 's3_credential': './credentials/s3.json', 'pretrained_ckpt_path': '', 'pretrained_ckpt_key_map': {'net': 'net'}}, 'callbacks': {'grad_clip': {'grad_norm': '10.0', 'model_key': 'net', '_target_': "<class 'fastgen.callbacks.grad_clip.GradClipCallback'>"}, 'gpu_stats': {'every_n': '100', '_target_': "<class 'fastgen.callbacks.gpu_stats.GPUStatsCallback'>"}, 'train_profiler': {'every_n': '100', '_target_': "<class 'fastgen.callbacks.train_profiler.TrainProfilerCallback'>"}, 'param_count': {'_target_': "<class 'fastgen.callbacks.param_count.ParamCountCallback'>"}, 'wandb': {'sample_logging_iter': '500', 'fps': '25', '_target_': "<class 'fastgen.callbacks.wandb.WandbCallback'>"}}, 'save_ckpt_iter': '500', 'validation_iter': '500', 'skip_initial_validation': 'True', 'logging_iter': '1', 'max_iter': '5000', 'visualize_teacher': 'False', 'seed': '0', 'val_seed': None, 'resume': 'False', 'ddp': 'True', 'fsdp': 'False', 'tf32_enabled': 'True', 'grad_accum_rounds': '1', 'batch_size_global': None, 'offload_module_in_decoding': 'False', 'fsdp_cpu_offload': 'False', 'fsdp_min_num_params': '10000000', 'fsdp_sharding_group_size': None, 'global_vars': None, 'global_vars_val': [None], 'augment_pipe': None}, 'dataloader_train': {'data_list_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_path.txt', 'latentsync_mask_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/mask.png', 'batch_size': '8', 'num_workers': '4', 'neg_text_emb_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt', 'use_ref_sequence': 'True', 'load_ode_path': 'False', '_target_': "<class 'fastgen.datasets.omniavatar_dataloader.OmniAvatarDataLoader'>"}, 'dataloader_val': {'data_list_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/v2v_training_data/video_square_val10.txt', 'latentsync_mask_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/mask.png', 'batch_size': '1', 'num_workers': '2', 'neg_text_emb_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data/text_emb/neg_text_emb.pt', 'use_ref_sequence': 'True', 'load_ode_path': 'False', '_target_': '<function create_omniavatar_dataloader at 0x7fa4931818a0>'}, 'eval': {'num_samples': '50000', 'save_images': 'False', 'min_ckpt': '0', 'max_ckpt': '100000000', 'samples_dir': 'samples'}, 'model': {'net': {'model_size': '1.3B', 'in_dim': '65', 'mode': 'v2v', 'use_audio': 'True', 'audio_hidden_size': '32', 'chunk_size': '3', 'total_num_frames': '21', 'base_model_paths': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/diffusion_pytorch_model.safetensors', 'omniavatar_ckpt_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/data_checkpoints/1.3B-step-1000.pt', 'net_pred_type': 'flow', 'schedule_type': 'rf', 'use_dynamic_rope': 'False', 'stochastic_attn_configs': [{'local_attn_size': '7', 'sink_size': '1', 'weight': '0.2'}, {'local_attn_size': '10', 'sink_size': '1', 'weight': '0.2'}, {'local_attn_size': '13', 'sink_size': '1', 'weight': '0.2'}, {'local_attn_size': '9', 'sink_size': '3', 'weight': '0.2'}, {'local_attn_size': '12', 'sink_size': '3', 'weight': '0.2'}], '_target_': "<class 'fastgen.networks.OmniAvatar.network_causal.CausalOmniAvatarWan'>", 'merge_lora': 'False', 'unfreeze_modules': ['_core.audio_proj', '_core.audio_cond_projs', '_core.patch_embedding'], 'lora_rank': '128', 'lora_alpha': '64'}, 'teacher': None, 'fake_score_net': None, 'guidance_scale': None, 'timestep_cfg': {'enabled': 'False', 't_lo': '0.0', 't_hi': '1.0'}, 'skip_layers': None, 'net_optimizer': {'model': None, 'optim_type': 'adamw', 'lr': '1e-05', 'weight_decay': '0.01', 'betas': ['0.9', '0.999'], 'eps': '1e-08', 'fused': 'False', '_target_': '<function get_optimizer at 0x7fa499799940>'}, 'net_scheduler': {'warm_up_steps': ['0'], 'cycle_lengths': ['10000000000'], 'f_start': ['1e-06'], 'f_max': ['1.0'], 'f_min': ['1.0'], '_target_': "<class 'fastgen.utils.lr_scheduler.LambdaLinearScheduler'>"}, 'sample_t_cfg': {'time_dist_type': 'shifted', 'train_p_mean': '-1.1', 'train_p_std': '2.0', 'shift': '5.0', 'min_t': '0.001', 'max_t': '0.999', 't_list': ['0.999', '0.769', '0.0'], 'log_t_df': '0.01'}, 'input_shape': ['16', '21', '64', '64'], 'device': 'cuda', 'grad_scaler_enabled': 'False', 'grad_scaler_init_scale': '65536.0', 'grad_scaler_growth_interval': '2000', 'pretrained_model_path': '', 'pretrained_student_net_path': '', 'load_student_weights': 'True', 'enable_preprocessors': 'True', 'use_ema': 'False', 'student_sample_steps': '2', 'student_sample_type': 'sde', 'fsdp_meta_init': 'False', 'add_teacher_to_fsdp_dict': 'True', 'ddp_find_unused_parameters': 'True', 'precision': 'bfloat16', 'precision_amp': None, 'precision_amp_infer': None, 'precision_amp_enc': None, 'precision_fsdp': 'float32', 'context_noise': '0.0', 'vae_path': '/data/karlo-research_715/workspace/kinemaar/paul/AR_diffusion/reference_FastGen_OmniAvatar/OmniAvatar-Train/pretrained_models/Wan2.1-T2V-1.3B/Wan2.1_VAE.pth'}, 'model_class': {'config': None, '_target_': "<class 'fastgen.methods.omniavatar_diffusion_forcing.OmniAvatarDiffusionForcingModel'>"}, '_wandb': {}}
9
+ 2026-04-30 23:05:47,480 INFO MainThread:2767876 [wandb_init.py:init():892] starting backend
10
+ 2026-04-30 23:05:47,705 INFO MainThread:2767876 [wandb_init.py:init():895] sending inform_init request
11
+ 2026-04-30 23:05:47,714 INFO MainThread:2767876 [wandb_init.py:init():903] backend started and connected
12
+ 2026-04-30 23:05:47,716 INFO MainThread:2767876 [wandb_init.py:init():973] updated telemetry
13
+ 2026-04-30 23:05:47,743 INFO MainThread:2767876 [wandb_init.py:init():997] communicating run to backend with 90.0 second timeout
14
+ 2026-04-30 23:05:48,972 INFO MainThread:2767876 [wandb_init.py:init():1042] starting run threads in backend
15
+ 2026-04-30 23:05:49,282 INFO MainThread:2767876 [wandb_run.py:_console_start():2524] atexit reg
16
+ 2026-04-30 23:05:49,283 INFO MainThread:2767876 [wandb_run.py:_redirect():2373] redirect: wrap_raw
17
+ 2026-04-30 23:05:49,283 INFO MainThread:2767876 [wandb_run.py:_redirect():2442] Wrapping output streams.
18
+ 2026-04-30 23:05:49,283 INFO MainThread:2767876 [wandb_run.py:_redirect():2465] Redirects installed.
19
+ 2026-04-30 23:05:49,286 INFO MainThread:2767876 [wandb_init.py:init():1082] run started, returning control to user process
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb/run-20260430_230547-aogal2qe/run-aogal2qe.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bd2a461c2164750645fcc7c85f423fce261f402d412a2e90a30baa22cd7d8ea
3
+ size 262144
DF_LORA_T769_8GPU_BS8/OmniAvatar-FastGen/omniavatar_df_audiofix/df_audiofix_syncnet_trained_shift_5_lora_t769_8gpu_bs8_lr1e5_5000iter/wandb_id.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ aogal2qe