yuegao committed on May 15, 2025

Commit

4bd2d52

verified ·

1 Parent(s): ff014ac

Upload folder using huggingface_hub

Browse files

Files changed (19) hide show

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/10000-ema/mp_rank_00_model_states.pt +3 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/10000/mp_rank_00_model_states.pt +3 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/latest +1 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/model_config.json +4 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/training_config.yaml +219 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/.DS_Store +0 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/10000-ema/mp_rank_00_model_states.pt +3 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/10000/mp_rank_00_model_states.pt +3 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/latest +1 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/model_config.json +4 -0
cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/training_config.yaml +219 -0
cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/10000-ema/mp_rank_00_model_states.pt +3 -0
cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/10000/mp_rank_00_model_states.pt +3 -0
cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/latest +1 -0
cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/model_config.json +4 -0
cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/training_config.yaml +219 -0
zero123_finetune_logs/2024-04-24T14-04-16_scalar_flow/checkpoints/step=000015499.ckpt +3 -0
zero123_finetune_logs/2024-10-28T18-26-21_fluid_nexus_ball/checkpoints/step=000079999.ckpt +3 -0
zero123_finetune_logs/2024-10-30T06-31-08_fluid_nexus_smoke/checkpoints/step=000051999.ckpt +3 -0

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/10000-ema/mp_rank_00_model_states.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c7076e10568d7aceb600582ed7e537d7ea921b404f97a95e769b832dfdec7e7f
+size 42463648157

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/10000/mp_rank_00_model_states.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0f5c3a9db5de4978b30c1d53ea7cd0847a67dbf4b87071d29eb11720133acb9c
+size 42463648157

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/latest ADDED Viewed

	@@ -0,0 +1 @@


1	+ 10000

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/model_config.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+    "model_class": "SATVideoDiffusionEngine",
+    "model_parallel_size": 1
+}

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_ball_i2v_fix3samples-10-28-17-06/training_config.yaml ADDED Viewed

	@@ -0,0 +1,219 @@

+model:
+  scale_factor: 0.7
+  disable_first_stage_autocast: true
+  not_trainable_prefixes:
+  - all
+  log_keys:
+  - txt
+  denoiser_config:
+    target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    params:
+      num_idx: 1000
+      quantize_c_noise: false
+      weighting_config:
+        target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      scaling_config:
+        target: sgm.modules.diffusionmodules.denoiser_scaling.VideoScaling
+      discretization_config:
+        target: sgm.modules.diffusionmodules.discretizer.ZeroSNRDDPMDiscretization
+        params:
+          shift_scale: 1.0
+  network_config:
+    target: dit_video_concat.DiffusionTransformer
+    params:
+      time_embed_dim: 512
+      elementwise_affine: true
+      num_frames: 49
+      time_compressed_rate: 4
+      latent_width: 90
+      latent_height: 60
+      num_layers: 42
+      patch_size: 2
+      in_channels: 16
+      out_channels: 16
+      hidden_size: 3072
+      adm_in_channels: 256
+      num_attention_heads: 48
+      transformer_args:
+        checkpoint_activations: true
+        vocab_size: 1
+        max_sequence_length: 64
+        layernorm_order: pre
+        skip_init: false
+        model_parallel_size: 1
+        is_decoder: false
+      modules:
+        pos_embed_config:
+          target: dit_video_concat.Rotary3DPositionEmbeddingMixin
+          params:
+            hidden_size_head: 64
+            text_length: 226
+        lora_config:
+          target: sat.model.finetune.lora2.LoraMixin
+          params:
+            r: 128
+        patch_embed_config:
+          target: dit_video_concat.ImagePatchEmbeddingMixin
+          params:
+            text_hidden_size: 4096
+        adaln_layer_config:
+          target: dit_video_concat.AdaLNMixin
+          params:
+            qk_ln: true
+        final_layer_config:
+          target: dit_video_concat.FinalLayerMixin
+  conditioner_config:
+    target: sgm.modules.GeneralConditioner
+    params:
+      emb_models:
+      - is_trainable: false
+        input_key: txt
+        ucg_rate: 0.1
+        target: sgm.modules.encoders.modules.FrozenT5Embedder
+        params:
+          model_dir: /path/to/FluidNexusRoot/cogvideox-sat/2b/t5-v1_1-xxl
+          max_length: 226
+  first_stage_config:
+    target: vae_modules.autoencoder.VideoAutoencoderInferenceWrapper
+    params:
+      cp_size: 1
+      ckpt_path: /path/to/FluidNexusRoot/cogvideox-sat/5b/vae/3d-vae.pt
+      ignore_keys:
+      - loss
+      loss_config:
+        target: torch.nn.Identity
+      regularizer_config:
+        target: vae_modules.regularizers.DiagonalGaussianRegularizer
+      encoder_config:
+        target: vae_modules.cp_enc_dec.ContextParallelEncoder3D
+        params:
+          double_z: true
+          z_channels: 16
+          resolution: 256
+          in_channels: 3
+          out_ch: 3
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 2
+          - 4
+          attn_resolutions: []
+          num_res_blocks: 3
+          dropout: 0.0
+          gather_norm: true
+      decoder_config:
+        target: vae_modules.cp_enc_dec.ContextParallelDecoder3D
+        params:
+          double_z: true
+          z_channels: 16
+          resolution: 256
+          in_channels: 3
+          out_ch: 3
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 2
+          - 4
+          attn_resolutions: []
+          num_res_blocks: 3
+          dropout: 0.0
+          gather_norm: false
+  loss_fn_config:
+    target: sgm.modules.diffusionmodules.loss.VideoDiffusionLoss
+    params:
+      fixed_frames: 3
+      offset_noise_level: 0
+      sigma_sampler_config:
+        target: sgm.modules.diffusionmodules.sigma_sampling.DiscreteSampling
+        params:
+          uniform_sampling: true
+          num_idx: 1000
+          discretization_config:
+            target: sgm.modules.diffusionmodules.discretizer.ZeroSNRDDPMDiscretization
+            params:
+              shift_scale: 1.0
+  sampler_config:
+    target: sgm.modules.diffusionmodules.sampling.VPSDEDPMPP2MSampler
+    params:
+      num_steps: 50
+      verbose: true
+      discretization_config:
+        target: sgm.modules.diffusionmodules.discretizer.ZeroSNRDDPMDiscretization
+        params:
+          shift_scale: 1.0
+      guider_config:
+        target: sgm.modules.diffusionmodules.guiders.DynamicCFG
+        params:
+          scale: 6
+          exp: 5
+          num_steps: 50
+args:
+  checkpoint_activations: true
+  model_parallel_size: 1
+  experiment_name: lora_cogvidx5b_realcapture_blackbluecloudredball_i2v_fix3samples
+  mode: finetune
+  load: /path/to/FluidNexusRoot/cogvideox-sat/5b/transformer
+  no_load_rng: true
+  train_iters: 10000
+  eval_iters: 1
+  eval_interval: 1000
+  eval_batch_size: 1
+  save: /path/to/FluidNexusRoot/cogvideox_lora_ckpts
+  summary_dir: /path/to/FluidNexusRoot/cogvideox_lora_runs
+  save_interval: 500
+  log_interval: 100
+  train_data:
+  - /dev/shm/RealCaptureBlackBlueCloudRedBallSetData_cogvideox_dataset
+  valid_data:
+  - /dev/shm/RealCaptureBlackBlueCloudRedBallSetData_cogvideox_dataset_sub_235
+  split: 1,0,0
+  num_workers: 8
+  force_train: true
+  only_log_video_latents: false
+data:
+  target: data_video.SFTDataset
+  params:
+    video_size:
+    - 480
+    - 720
+    fps: 8
+    max_num_frames: 49
+    skip_frms_num: 0
+deepspeed:
+  train_micro_batch_size_per_gpu: 2
+  gradient_accumulation_steps: 1
+  steps_per_print: 50
+  gradient_clipping: 0.1
+  zero_optimization:
+    stage: 2
+    cpu_offload: false
+    contiguous_gradients: false
+    overlap_comm: true
+    reduce_scatter: true
+    reduce_bucket_size: 1000000000
+    allgather_bucket_size: 1000000000
+    load_from_fp32_weights: false
+  zero_allow_untested_optimizer: true
+  bf16:
+    enabled: true
+  fp16:
+    enabled: false
+  loss_scale: 0
+  loss_scale_window: 400
+  hysteresis: 2
+  min_loss_scale: 1
+  optimizer:
+    type: sat.ops.FusedEmaAdam
+    params:
+      lr: 0.001
+      betas:
+      - 0.9
+      - 0.95
+      eps: 1.0e-08
+      weight_decay: 0.0001
+  activation_checkpointing:
+    partition_activations: false
+    contiguous_memory_optimization: false
+  wall_clock_breakdown: false

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/10000-ema/mp_rank_00_model_states.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:576a198a53cb3b73b2549e1da890071c23ecd3ae8f7394f5c96e789351e54e60
+size 42463648157

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/10000/mp_rank_00_model_states.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:13c8790a90eb62fbb115438a141d87695f452f2d4f8edf518c3621d46c3344e6
+size 42463648157

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/latest ADDED Viewed

	@@ -0,0 +1 @@


1	+ 10000

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/model_config.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+    "model_class": "SATVideoDiffusionEngine",
+    "model_parallel_size": 1
+}

cogvideox_lora_ckpts/lora_cogvidx5b_fluid_nexus_smoke_i2v_fix3samples-10-28-17-06/training_config.yaml ADDED Viewed

	@@ -0,0 +1,219 @@

+model:
+  scale_factor: 0.7
+  disable_first_stage_autocast: true
+  not_trainable_prefixes:
+  - all
+  log_keys:
+  - txt
+  denoiser_config:
+    target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    params:
+      num_idx: 1000
+      quantize_c_noise: false
+      weighting_config:
+        target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      scaling_config:
+        target: sgm.modules.diffusionmodules.denoiser_scaling.VideoScaling
+      discretization_config:
+        target: sgm.modules.diffusionmodules.discretizer.ZeroSNRDDPMDiscretization
+        params:
+          shift_scale: 1.0
+  network_config:
+    target: dit_video_concat.DiffusionTransformer
+    params:
+      time_embed_dim: 512
+      elementwise_affine: true
+      num_frames: 49
+      time_compressed_rate: 4
+      latent_width: 90
+      latent_height: 60
+      num_layers: 42
+      patch_size: 2
+      in_channels: 16
+      out_channels: 16
+      hidden_size: 3072
+      adm_in_channels: 256
+      num_attention_heads: 48
+      transformer_args:
+        checkpoint_activations: true
+        vocab_size: 1
+        max_sequence_length: 64
+        layernorm_order: pre
+        skip_init: false
+        model_parallel_size: 1
+        is_decoder: false
+      modules:
+        pos_embed_config:
+          target: dit_video_concat.Rotary3DPositionEmbeddingMixin
+          params:
+            hidden_size_head: 64
+            text_length: 226
+        lora_config:
+          target: sat.model.finetune.lora2.LoraMixin
+          params:
+            r: 128
+        patch_embed_config:
+          target: dit_video_concat.ImagePatchEmbeddingMixin
+          params:
+            text_hidden_size: 4096
+        adaln_layer_config:
+          target: dit_video_concat.AdaLNMixin
+          params:
+            qk_ln: true
+        final_layer_config:
+          target: dit_video_concat.FinalLayerMixin
+  conditioner_config:
+    target: sgm.modules.GeneralConditioner
+    params:
+      emb_models:
+      - is_trainable: false
+        input_key: txt
+        ucg_rate: 0.1
+        target: sgm.modules.encoders.modules.FrozenT5Embedder
+        params:
+          model_dir: /path/to/FluidNexusRoot/cogvideox-sat/2b/t5-v1_1-xxl
+          max_length: 226
+  first_stage_config:
+    target: vae_modules.autoencoder.VideoAutoencoderInferenceWrapper
+    params:
+      cp_size: 1
+      ckpt_path: /path/to/FluidNexusRoot/cogvideox-sat/5b/vae/3d-vae.pt
+      ignore_keys:
+      - loss
+      loss_config:
+        target: torch.nn.Identity
+      regularizer_config:
+        target: vae_modules.regularizers.DiagonalGaussianRegularizer
+      encoder_config:
+        target: vae_modules.cp_enc_dec.ContextParallelEncoder3D
+        params:
+          double_z: true
+          z_channels: 16
+          resolution: 256
+          in_channels: 3
+          out_ch: 3
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 2
+          - 4
+          attn_resolutions: []
+          num_res_blocks: 3
+          dropout: 0.0
+          gather_norm: true
+      decoder_config:
+        target: vae_modules.cp_enc_dec.ContextParallelDecoder3D
+        params:
+          double_z: true
+          z_channels: 16
+          resolution: 256
+          in_channels: 3
+          out_ch: 3
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 2
+          - 4
+          attn_resolutions: []
+          num_res_blocks: 3
+          dropout: 0.0
+          gather_norm: false
+  loss_fn_config:
+    target: sgm.modules.diffusionmodules.loss.VideoDiffusionLoss
+    params:
+      fixed_frames: 3
+      offset_noise_level: 0
+      sigma_sampler_config:
+        target: sgm.modules.diffusionmodules.sigma_sampling.DiscreteSampling
+        params:
+          uniform_sampling: true
+          num_idx: 1000
+          discretization_config:
+            target: sgm.modules.diffusionmodules.discretizer.ZeroSNRDDPMDiscretization
+            params:
+              shift_scale: 1.0
+  sampler_config:
+    target: sgm.modules.diffusionmodules.sampling.VPSDEDPMPP2MSampler
+    params:
+      num_steps: 50
+      verbose: true
+      discretization_config:
+        target: sgm.modules.diffusionmodules.discretizer.ZeroSNRDDPMDiscretization
+        params:
+          shift_scale: 1.0
+      guider_config:
+        target: sgm.modules.diffusionmodules.guiders.DynamicCFG
+        params:
+          scale: 6
+          exp: 5
+          num_steps: 50
+args:
+  checkpoint_activations: true
+  model_parallel_size: 1
+  experiment_name: lora_cogvidx5b_realcapture_blackbluecloud_i2v_fix3samples
+  mode: finetune
+  load: /path/to/FluidNexusRoot/cogvideox-sat/5b/transformer
+  no_load_rng: true
+  train_iters: 10000
+  eval_iters: 1
+  eval_interval: 1000
+  eval_batch_size: 1
+  save: /path/to/FluidNexusRoot/cogvideox_lora_ckpts
+  summary_dir: /path/to/FluidNexusRoot/cogvideox_lora_runs
+  save_interval: 500
+  log_interval: 100
+  train_data:
+  - /dev/shm/RealCaptureBlackBlueCloudSetData_cogvideox_dataset
+  valid_data:
+  - /dev/shm/RealCaptureBlackBlueCloudSetData_cogvideox_dataset_sub_235
+  split: 1,0,0
+  num_workers: 8
+  force_train: true
+  only_log_video_latents: false
+data:
+  target: data_video.SFTDataset
+  params:
+    video_size:
+    - 480
+    - 720
+    fps: 8
+    max_num_frames: 49
+    skip_frms_num: 0
+deepspeed:
+  train_micro_batch_size_per_gpu: 2
+  gradient_accumulation_steps: 1
+  steps_per_print: 50
+  gradient_clipping: 0.1
+  zero_optimization:
+    stage: 2
+    cpu_offload: false
+    contiguous_gradients: false
+    overlap_comm: true
+    reduce_scatter: true
+    reduce_bucket_size: 1000000000
+    allgather_bucket_size: 1000000000
+    load_from_fp32_weights: false
+  zero_allow_untested_optimizer: true
+  bf16:
+    enabled: true
+  fp16:
+    enabled: false
+  loss_scale: 0
+  loss_scale_window: 400
+  hysteresis: 2
+  min_loss_scale: 1
+  optimizer:
+    type: sat.ops.FusedEmaAdam
+    params:
+      lr: 0.001
+      betas:
+      - 0.9
+      - 0.95
+      eps: 1.0e-08
+      weight_decay: 0.0001
+  activation_checkpointing:
+    partition_activations: false
+    contiguous_memory_optimization: false
+  wall_clock_breakdown: false

cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/10000-ema/mp_rank_00_model_states.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ca32a23c842129b42bbbd15021e6487c342fa22dddd7d9af9a58bceb3e1df378
+size 42463648157

cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/10000/mp_rank_00_model_states.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a484a53f48e0ea059a7ab4e5df3ca5330fcf6f1adcdf3111593e3d55aea0416c
+size 42463648157

cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/latest ADDED Viewed

	@@ -0,0 +1 @@


1	+ 10000

cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/model_config.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+    "model_class": "SATVideoDiffusionEngine",
+    "model_parallel_size": 1
+}

cogvideox_lora_ckpts/lora_cogvidx5b_scalar_flow_i2v_fix3samples-09-09-05-39/training_config.yaml ADDED Viewed

	@@ -0,0 +1,219 @@

+model:
+  scale_factor: 0.7
+  disable_first_stage_autocast: true
+  not_trainable_prefixes:
+  - all
+  log_keys:
+  - txt
+  denoiser_config:
+    target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    params:
+      num_idx: 1000
+      quantize_c_noise: false
+      weighting_config:
+        target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      scaling_config:
+        target: sgm.modules.diffusionmodules.denoiser_scaling.VideoScaling
+      discretization_config:
+        target: sgm.modules.diffusionmodules.discretizer.ZeroSNRDDPMDiscretization
+        params:
+          shift_scale: 1.0
+  network_config:
+    target: dit_video_concat.DiffusionTransformer
+    params:
+      time_embed_dim: 512
+      elementwise_affine: true
+      num_frames: 49
+      time_compressed_rate: 4
+      latent_width: 90
+      latent_height: 60
+      num_layers: 42
+      patch_size: 2
+      in_channels: 16
+      out_channels: 16
+      hidden_size: 3072
+      adm_in_channels: 256
+      num_attention_heads: 48
+      transformer_args:
+        checkpoint_activations: true
+        vocab_size: 1
+        max_sequence_length: 64
+        layernorm_order: pre
+        skip_init: false
+        model_parallel_size: 1
+        is_decoder: false
+      modules:
+        pos_embed_config:
+          target: dit_video_concat.Rotary3DPositionEmbeddingMixin
+          params:
+            hidden_size_head: 64
+            text_length: 226
+        lora_config:
+          target: sat.model.finetune.lora2.LoraMixin
+          params:
+            r: 128
+        patch_embed_config:
+          target: dit_video_concat.ImagePatchEmbeddingMixin
+          params:
+            text_hidden_size: 4096
+        adaln_layer_config:
+          target: dit_video_concat.AdaLNMixin
+          params:
+            qk_ln: true
+        final_layer_config:
+          target: dit_video_concat.FinalLayerMixin
+  conditioner_config:
+    target: sgm.modules.GeneralConditioner
+    params:
+      emb_models:
+      - is_trainable: false
+        input_key: txt
+        ucg_rate: 0.1
+        target: sgm.modules.encoders.modules.FrozenT5Embedder
+        params:
+          model_dir: /path/to/FluidNexusRoot/cogvideox-sat/2b/t5-v1_1-xxl
+          max_length: 226
+  first_stage_config:
+    target: vae_modules.autoencoder.VideoAutoencoderInferenceWrapper
+    params:
+      cp_size: 1
+      ckpt_path: /path/to/FluidNexusRoot/cogvideox-sat/5b/vae/3d-vae.pt
+      ignore_keys:
+      - loss
+      loss_config:
+        target: torch.nn.Identity
+      regularizer_config:
+        target: vae_modules.regularizers.DiagonalGaussianRegularizer
+      encoder_config:
+        target: vae_modules.cp_enc_dec.ContextParallelEncoder3D
+        params:
+          double_z: true
+          z_channels: 16
+          resolution: 256
+          in_channels: 3
+          out_ch: 3
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 2
+          - 4
+          attn_resolutions: []
+          num_res_blocks: 3
+          dropout: 0.0
+          gather_norm: true
+      decoder_config:
+        target: vae_modules.cp_enc_dec.ContextParallelDecoder3D
+        params:
+          double_z: true
+          z_channels: 16
+          resolution: 256
+          in_channels: 3
+          out_ch: 3
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 2
+          - 4
+          attn_resolutions: []
+          num_res_blocks: 3
+          dropout: 0.0
+          gather_norm: false
+  loss_fn_config:
+    target: sgm.modules.diffusionmodules.loss.VideoDiffusionLoss
+    params:
+      fixed_frames: 3
+      offset_noise_level: 0
+      sigma_sampler_config:
+        target: sgm.modules.diffusionmodules.sigma_sampling.DiscreteSampling
+        params:
+          uniform_sampling: true
+          num_idx: 1000
+          discretization_config:
+            target: sgm.modules.diffusionmodules.discretizer.ZeroSNRDDPMDiscretization
+            params:
+              shift_scale: 1.0
+  sampler_config:
+    target: sgm.modules.diffusionmodules.sampling.VPSDEDPMPP2MSampler
+    params:
+      num_steps: 50
+      verbose: true
+      discretization_config:
+        target: sgm.modules.diffusionmodules.discretizer.ZeroSNRDDPMDiscretization
+        params:
+          shift_scale: 1.0
+      guider_config:
+        target: sgm.modules.diffusionmodules.guiders.DynamicCFG
+        params:
+          scale: 6
+          exp: 5
+          num_steps: 50
+args:
+  checkpoint_activations: true
+  model_parallel_size: 1
+  experiment_name: lora_cogvidx5b_scalarflow_all_i2v_fix3samples
+  mode: finetune
+  load: /path/to/FluidNexusRoot/cogvideox-sat/5b/transformer
+  no_load_rng: true
+  train_iters: 10000
+  eval_iters: 1
+  eval_interval: 1000
+  eval_batch_size: 1
+  save: /path/to/FluidNexusRoot/cogvideox_lora_ckpts
+  summary_dir: /path/to/FluidNexusRoot/cogvideox_lora_runs
+  save_interval: 500
+  log_interval: 100
+  train_data:
+  - /dev/shm/ScalarFlow_cogvideox_dataset
+  valid_data:
+  - /dev/shm/ScalarFlow_cogvideox_dataset_sub_90
+  split: 1,0,0
+  num_workers: 8
+  force_train: true
+  only_log_video_latents: false
+data:
+  target: data_video.SFTDataset
+  params:
+    video_size:
+    - 480
+    - 720
+    fps: 8
+    max_num_frames: 49
+    skip_frms_num: 0
+deepspeed:
+  train_micro_batch_size_per_gpu: 2
+  gradient_accumulation_steps: 1
+  steps_per_print: 50
+  gradient_clipping: 0.1
+  zero_optimization:
+    stage: 2
+    cpu_offload: false
+    contiguous_gradients: false
+    overlap_comm: true
+    reduce_scatter: true
+    reduce_bucket_size: 1000000000
+    allgather_bucket_size: 1000000000
+    load_from_fp32_weights: false
+  zero_allow_untested_optimizer: true
+  bf16:
+    enabled: true
+  fp16:
+    enabled: false
+  loss_scale: 0
+  loss_scale_window: 400
+  hysteresis: 2
+  min_loss_scale: 1
+  optimizer:
+    type: sat.ops.FusedEmaAdam
+    params:
+      lr: 0.001
+      betas:
+      - 0.9
+      - 0.95
+      eps: 1.0e-08
+      weight_decay: 0.0001
+  activation_checkpointing:
+    partition_activations: false
+    contiguous_memory_optimization: false
+  wall_clock_breakdown: false

zero123_finetune_logs/2024-04-24T14-04-16_scalar_flow/checkpoints/step=000015499.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:79155ecf6818fa9c813d3eaf12d91a13a5d57b6c8845ca1ec3b1e0a72c828a49
+size 15465966043

zero123_finetune_logs/2024-10-28T18-26-21_fluid_nexus_ball/checkpoints/step=000079999.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:54b7685a157f2b602312cf438106f8d1269bb3e8cfcfe8b5b11c45230c14818d
+size 15465966616

zero123_finetune_logs/2024-10-30T06-31-08_fluid_nexus_smoke/checkpoints/step=000051999.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:774267ba698138e2208fcb6b047797e51d6159a003131c9e07c67ec9de0710d3
+size 15465974168