Add checkpoint(s) [via HfApi]

Browse files

Files changed (5) hide show

jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/config-fit-2602082333.yaml +219 -0
jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/config-fit-2602120157.yaml +219 -0
jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/config-fit-2602120215.yaml +219 -0
jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/epoch=2555-step=800000.ckpt +3 -0
jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/uploaded_by.txt +1 -0

jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/config-fit-2602082333.yaml ADDED Viewed

	@@ -0,0 +1,219 @@

+# lightning.pytorch==2.6.1
+seed_everything: 1234
+torch_hub_dir: null
+huggingface_cache_dir: null
+trainer:
+  accelerator: auto
+  strategy: auto
+  devices: auto
+  num_nodes: 1
+  precision: bf16-mixed
+  logger:
+    class_path: lightning.pytorch.loggers.WandbLogger
+    init_args:
+      name: jit_b_pixel_bs64_repa_4_lpips_pdino_adamw
+      save_dir: .
+      version: null
+      offline: false
+      dir: null
+      id: null
+      anonymous: null
+      project: jit_b_pixel_ablation
+      log_model: false
+      experiment: null
+      prefix: ''
+      checkpoint_name: null
+      add_file_policy: mutable
+      entity: null
+      notes: null
+      tags: null
+      config: null
+      config_exclude_keys: null
+      config_include_keys: null
+      allow_val_change: null
+      group: null
+      job_type: null
+      mode: null
+      force: null
+      reinit: null
+      resume: null
+      resume_from: null
+      fork_from: null
+      save_code: null
+      tensorboard: null
+      sync_tensorboard: null
+      monitor_gym: null
+      settings: null
+  callbacks:
+  - class_path: src.callbacks.model_checkpoint.CheckpointHook
+    init_args:
+      dirpath: null
+      filename: null
+      monitor: null
+      verbose: false
+      save_last: true
+      save_top_k: -1
+      save_on_exception: false
+      save_weights_only: false
+      mode: min
+      auto_insert_metric_name: true
+      every_n_train_steps: 50000
+      train_time_interval: null
+      every_n_epochs: null
+      save_on_train_epoch_end: null
+      enable_version_counter: true
+  - class_path: src.callbacks.save_images.SaveImagesHook
+    init_args:
+      save_dir: val_ode50_cfg2.0
+      save_compressed: true
+  fast_dev_run: false
+  max_epochs: null
+  min_epochs: null
+  max_steps: 1000000
+  min_steps: null
+  max_time: null
+  limit_train_batches: null
+  limit_val_batches: null
+  limit_test_batches: null
+  limit_predict_batches: null
+  overfit_batches: 0.0
+  val_check_interval: null
+  check_val_every_n_epoch: 1000000
+  num_sanity_val_steps: 0
+  log_every_n_steps: 50
+  enable_checkpointing: null
+  enable_progress_bar: null
+  enable_model_summary: null
+  accumulate_grad_batches: 1
+  gradient_clip_val: null
+  gradient_clip_algorithm: null
+  deterministic: null
+  benchmark: null
+  inference_mode: true
+  use_distributed_sampler: false
+  profiler: null
+  detect_anomaly: false
+  barebones: false
+  plugins:
+  - class_path: src.plugins.bd_env.BDEnvironment
+  sync_batchnorm: false
+  reload_dataloaders_every_n_epochs: 0
+  default_root_dir: ./universal_pix_workdirs
+  enable_autolog_hparams: true
+  model_registry: null
+model:
+  vae:
+    class_path: src.models.autoencoder.pixel.PixelAE
+    init_args:
+      scale: 1.0
+      shift: 0.0
+  conditioner:
+    class_path: src.models.conditioner.class_label.LabelConditioner
+    init_args:
+      num_classes: 20
+  denoiser:
+    class_path: src.models.transformer.JiT.JiT
+    init_args:
+      input_size: 256
+      patch_size: 16
+      in_channels: 3
+      hidden_size: 768
+      depth: 12
+      num_heads: 12
+      mlp_ratio: 4.0
+      attn_drop: 0.0
+      proj_drop: 0.0
+      num_classes: 20
+      bottleneck_dim: 128
+      use_bottleneck: true
+      in_context_len: 32
+      in_context_start: 4
+  diffusion_trainer:
+    class_path: src.diffusion.flow_matching.training_repa_JiT_LPIPS_DINO_NoiseGating.REPATrainer
+    init_args:
+      scheduler:
+        class_path: src.diffusion.flow_matching.scheduling.LinearScheduler
+      loss_weight_fn: src.diffusion.flow_matching.training_repa_JiT_LPIPS_DINO_NoiseGating.constant
+      feat_loss_weight: 0.5
+      lognorm_t: true
+      timeshift: 1.0
+      encoder:
+        class_path: src.models.encoder.DINOv2
+        init_args:
+          weight_path: ~/.cache/torch/hub/checkpoints/dinov2_vitb14_pretrain.pth
+          base_patch_size: 16
+      align_layer: 4
+      proj_denoiser_dim: 768
+      proj_hidden_dim: 768
+      proj_encoder_dim: 768
+      P_mean: -0.8
+      P_std: 0.8
+      t_eps: 0.05
+      num_classes: 1000
+      lpips_weight: 0.1
+      dino_weight: 0.01
+      percept_t_threshold: 0.3
+      noise_scale: 1.0
+      patch_size: 16
+      percept_ratio: 1.0
+      null_condition_p: 0.1
+  diffusion_sampler:
+    class_path: src.diffusion.flow_matching.sampling.HeunSamplerJiT
+    init_args:
+      scheduler:
+        class_path: src.diffusion.flow_matching.scheduling.LinearScheduler
+      w_scheduler:
+        class_path: src.diffusion.flow_matching.scheduling.LinearScheduler
+      exact_henu: true
+      guidance_interval_min: 0.1
+      guidance_interval_max: 0.9
+      timeshift: 1.0
+      step_fn: src.diffusion.flow_matching.sampling.ode_step_fn
+      last_step: null
+      last_step_fn: src.diffusion.flow_matching.sampling.ode_step_fn
+      guidance_fn: src.diffusion.base.guidance.simple_guidance_fn
+      num_steps: 50
+      guidance: 2.0
+  ema_tracker:
+    class_path: src.callbacks.simple_ema.SimpleEMA
+    init_args:
+      decay: 0.9999
+      every_n_steps: 1
+  optimizer:
+    class_path: torch.optim.AdamW
+    init_args:
+      lr: 0.0001
+      betas:
+      - 0.9
+      - 0.999
+      eps: 1.0e-08
+      weight_decay: 0.0
+      amsgrad: false
+      maximize: false
+      foreach: null
+      capturable: false
+      differentiable: false
+      fused: null
+  lr_scheduler: null
+  eval_original_model: false
+data:
+  train_dataset:
+    class_path: src.data.dataset.imagenet.PixImageNet
+    init_args:
+      root: /data/batik-256/images/
+      resolution: 256
+      random_crop: false
+      random_flip: false
+  eval_dataset: null
+  pred_dataset: null
+  train_batch_size: 64
+  train_num_workers: 8
+  train_prefetch_factor: 8
+  eval_batch_size: 32
+  eval_num_workers: 4
+  pred_batch_size: 32
+  pred_num_workers: 1
+tags:
+  exp: jit_b_pixel_bs64_repa_4_lpips_pdino_adamw
+ckpt_path: null
+weights_only: null

jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/config-fit-2602120157.yaml ADDED Viewed

	@@ -0,0 +1,219 @@

+# lightning.pytorch==2.6.1
+seed_everything: 1234
+torch_hub_dir: null
+huggingface_cache_dir: null
+trainer:
+  accelerator: auto
+  strategy: auto
+  devices: auto
+  num_nodes: 1
+  precision: bf16-mixed
+  logger:
+    class_path: lightning.pytorch.loggers.WandbLogger
+    init_args:
+      name: jit_b_pixel_bs64_repa_4_lpips_pdino_adamw
+      save_dir: .
+      version: null
+      offline: false
+      dir: null
+      id: null
+      anonymous: null
+      project: jit_b_pixel_ablation
+      log_model: false
+      experiment: null
+      prefix: ''
+      checkpoint_name: null
+      add_file_policy: mutable
+      entity: null
+      notes: null
+      tags: null
+      config: null
+      config_exclude_keys: null
+      config_include_keys: null
+      allow_val_change: null
+      group: null
+      job_type: null
+      mode: null
+      force: null
+      reinit: null
+      resume: null
+      resume_from: null
+      fork_from: null
+      save_code: null
+      tensorboard: null
+      sync_tensorboard: null
+      monitor_gym: null
+      settings: null
+  callbacks:
+  - class_path: src.callbacks.model_checkpoint.CheckpointHook
+    init_args:
+      dirpath: null
+      filename: null
+      monitor: null
+      verbose: false
+      save_last: true
+      save_top_k: -1
+      save_on_exception: false
+      save_weights_only: false
+      mode: min
+      auto_insert_metric_name: true
+      every_n_train_steps: 50000
+      train_time_interval: null
+      every_n_epochs: null
+      save_on_train_epoch_end: null
+      enable_version_counter: true
+  - class_path: src.callbacks.save_images.SaveImagesHook
+    init_args:
+      save_dir: val_ode50_cfg2.0
+      save_compressed: true
+  fast_dev_run: false
+  max_epochs: null
+  min_epochs: null
+  max_steps: 1000000
+  min_steps: null
+  max_time: null
+  limit_train_batches: null
+  limit_val_batches: null
+  limit_test_batches: null
+  limit_predict_batches: null
+  overfit_batches: 0.0
+  val_check_interval: null
+  check_val_every_n_epoch: 1000000
+  num_sanity_val_steps: 0
+  log_every_n_steps: 50
+  enable_checkpointing: null
+  enable_progress_bar: null
+  enable_model_summary: null
+  accumulate_grad_batches: 1
+  gradient_clip_val: null
+  gradient_clip_algorithm: null
+  deterministic: null
+  benchmark: null
+  inference_mode: true
+  use_distributed_sampler: false
+  profiler: null
+  detect_anomaly: false
+  barebones: false
+  plugins:
+  - class_path: src.plugins.bd_env.BDEnvironment
+  sync_batchnorm: false
+  reload_dataloaders_every_n_epochs: 0
+  default_root_dir: ./universal_pix_workdirs
+  enable_autolog_hparams: true
+  model_registry: null
+model:
+  vae:
+    class_path: src.models.autoencoder.pixel.PixelAE
+    init_args:
+      scale: 1.0
+      shift: 0.0
+  conditioner:
+    class_path: src.models.conditioner.class_label.LabelConditioner
+    init_args:
+      num_classes: 20
+  denoiser:
+    class_path: src.models.transformer.JiT.JiT
+    init_args:
+      input_size: 256
+      patch_size: 16
+      in_channels: 3
+      hidden_size: 768
+      depth: 12
+      num_heads: 12
+      mlp_ratio: 4.0
+      attn_drop: 0.0
+      proj_drop: 0.0
+      num_classes: 20
+      bottleneck_dim: 128
+      use_bottleneck: true
+      in_context_len: 32
+      in_context_start: 4
+  diffusion_trainer:
+    class_path: src.diffusion.flow_matching.training_repa_JiT_LPIPS_DINO_NoiseGating.REPATrainer
+    init_args:
+      scheduler:
+        class_path: src.diffusion.flow_matching.scheduling.LinearScheduler
+      loss_weight_fn: src.diffusion.flow_matching.training_repa_JiT_LPIPS_DINO_NoiseGating.constant
+      feat_loss_weight: 0.5
+      lognorm_t: true
+      timeshift: 1.0
+      encoder:
+        class_path: src.models.encoder.DINOv2
+        init_args:
+          weight_path: ~/.cache/torch/hub/checkpoints/dinov2_vitb14_pretrain.pth
+          base_patch_size: 16
+      align_layer: 4
+      proj_denoiser_dim: 768
+      proj_hidden_dim: 768
+      proj_encoder_dim: 768
+      P_mean: -0.8
+      P_std: 0.8
+      t_eps: 0.05
+      num_classes: 1000
+      lpips_weight: 0.1
+      dino_weight: 0.01
+      percept_t_threshold: 0.3
+      noise_scale: 1.0
+      patch_size: 16
+      percept_ratio: 1.0
+      null_condition_p: 0.1
+  diffusion_sampler:
+    class_path: src.diffusion.flow_matching.sampling.HeunSamplerJiT
+    init_args:
+      scheduler:
+        class_path: src.diffusion.flow_matching.scheduling.LinearScheduler
+      w_scheduler:
+        class_path: src.diffusion.flow_matching.scheduling.LinearScheduler
+      exact_henu: true
+      guidance_interval_min: 0.1
+      guidance_interval_max: 0.9
+      timeshift: 1.0
+      step_fn: src.diffusion.flow_matching.sampling.ode_step_fn
+      last_step: null
+      last_step_fn: src.diffusion.flow_matching.sampling.ode_step_fn
+      guidance_fn: src.diffusion.base.guidance.simple_guidance_fn
+      num_steps: 50
+      guidance: 2.0
+  ema_tracker:
+    class_path: src.callbacks.simple_ema.SimpleEMA
+    init_args:
+      decay: 0.9999
+      every_n_steps: 1
+  optimizer:
+    class_path: torch.optim.AdamW
+    init_args:
+      lr: 0.0001
+      betas:
+      - 0.9
+      - 0.999
+      eps: 1.0e-08
+      weight_decay: 0.0
+      amsgrad: false
+      maximize: false
+      foreach: null
+      capturable: false
+      differentiable: false
+      fused: null
+  lr_scheduler: null
+  eval_original_model: false
+data:
+  train_dataset:
+    class_path: src.data.dataset.imagenet.PixImageNet
+    init_args:
+      root: /data/batik-256/images/
+      resolution: 256
+      random_crop: false
+      random_flip: false
+  eval_dataset: null
+  pred_dataset: null
+  train_batch_size: 64
+  train_num_workers: 8
+  train_prefetch_factor: 8
+  eval_batch_size: 32
+  eval_num_workers: 4
+  pred_batch_size: 32
+  pred_num_workers: 1
+tags:
+  exp: jit_b_pixel_bs64_repa_4_lpips_pdino_adamw
+ckpt_path: null
+weights_only: null

jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/config-fit-2602120215.yaml ADDED Viewed

	@@ -0,0 +1,219 @@

+# lightning.pytorch==2.6.1
+seed_everything: 1234
+torch_hub_dir: null
+huggingface_cache_dir: null
+trainer:
+  accelerator: auto
+  strategy: auto
+  devices: auto
+  num_nodes: 1
+  precision: bf16-mixed
+  logger:
+    class_path: lightning.pytorch.loggers.WandbLogger
+    init_args:
+      name: jit_b_pixel_bs64_repa_4_lpips_pdino_adamw
+      save_dir: .
+      version: null
+      offline: false
+      dir: null
+      id: null
+      anonymous: null
+      project: jit_b_pixel_ablation
+      log_model: false
+      experiment: null
+      prefix: ''
+      checkpoint_name: null
+      add_file_policy: mutable
+      entity: null
+      notes: null
+      tags: null
+      config: null
+      config_exclude_keys: null
+      config_include_keys: null
+      allow_val_change: null
+      group: null
+      job_type: null
+      mode: null
+      force: null
+      reinit: null
+      resume: null
+      resume_from: null
+      fork_from: null
+      save_code: null
+      tensorboard: null
+      sync_tensorboard: null
+      monitor_gym: null
+      settings: null
+  callbacks:
+  - class_path: src.callbacks.model_checkpoint.CheckpointHook
+    init_args:
+      dirpath: null
+      filename: null
+      monitor: null
+      verbose: false
+      save_last: true
+      save_top_k: -1
+      save_on_exception: false
+      save_weights_only: false
+      mode: min
+      auto_insert_metric_name: true
+      every_n_train_steps: 50000
+      train_time_interval: null
+      every_n_epochs: null
+      save_on_train_epoch_end: null
+      enable_version_counter: true
+  - class_path: src.callbacks.save_images.SaveImagesHook
+    init_args:
+      save_dir: val_ode50_cfg2.0
+      save_compressed: true
+  fast_dev_run: false
+  max_epochs: null
+  min_epochs: null
+  max_steps: 1000000
+  min_steps: null
+  max_time: null
+  limit_train_batches: null
+  limit_val_batches: null
+  limit_test_batches: null
+  limit_predict_batches: null
+  overfit_batches: 0.0
+  val_check_interval: null
+  check_val_every_n_epoch: 1000000
+  num_sanity_val_steps: 0
+  log_every_n_steps: 50
+  enable_checkpointing: null
+  enable_progress_bar: null
+  enable_model_summary: null
+  accumulate_grad_batches: 1
+  gradient_clip_val: null
+  gradient_clip_algorithm: null
+  deterministic: null
+  benchmark: null
+  inference_mode: true
+  use_distributed_sampler: false
+  profiler: null
+  detect_anomaly: false
+  barebones: false
+  plugins:
+  - class_path: src.plugins.bd_env.BDEnvironment
+  sync_batchnorm: false
+  reload_dataloaders_every_n_epochs: 0
+  default_root_dir: ./universal_pix_workdirs
+  enable_autolog_hparams: true
+  model_registry: null
+model:
+  vae:
+    class_path: src.models.autoencoder.pixel.PixelAE
+    init_args:
+      scale: 1.0
+      shift: 0.0
+  conditioner:
+    class_path: src.models.conditioner.class_label.LabelConditioner
+    init_args:
+      num_classes: 20
+  denoiser:
+    class_path: src.models.transformer.JiT.JiT
+    init_args:
+      input_size: 256
+      patch_size: 16
+      in_channels: 3
+      hidden_size: 768
+      depth: 12
+      num_heads: 12
+      mlp_ratio: 4.0
+      attn_drop: 0.0
+      proj_drop: 0.0
+      num_classes: 20
+      bottleneck_dim: 128
+      use_bottleneck: true
+      in_context_len: 32
+      in_context_start: 4
+  diffusion_trainer:
+    class_path: src.diffusion.flow_matching.training_repa_JiT_LPIPS_DINO_NoiseGating.REPATrainer
+    init_args:
+      scheduler:
+        class_path: src.diffusion.flow_matching.scheduling.LinearScheduler
+      loss_weight_fn: src.diffusion.flow_matching.training_repa_JiT_LPIPS_DINO_NoiseGating.constant
+      feat_loss_weight: 0.5
+      lognorm_t: true
+      timeshift: 1.0
+      encoder:
+        class_path: src.models.encoder.DINOv2
+        init_args:
+          weight_path: ~/.cache/torch/hub/checkpoints/dinov2_vitb14_pretrain.pth
+          base_patch_size: 16
+      align_layer: 4
+      proj_denoiser_dim: 768
+      proj_hidden_dim: 768
+      proj_encoder_dim: 768
+      P_mean: -0.8
+      P_std: 0.8
+      t_eps: 0.05
+      num_classes: 1000
+      lpips_weight: 0.1
+      dino_weight: 0.01
+      percept_t_threshold: 0.3
+      noise_scale: 1.0
+      patch_size: 16
+      percept_ratio: 1.0
+      null_condition_p: 0.1
+  diffusion_sampler:
+    class_path: src.diffusion.flow_matching.sampling.HeunSamplerJiT
+    init_args:
+      scheduler:
+        class_path: src.diffusion.flow_matching.scheduling.LinearScheduler
+      w_scheduler:
+        class_path: src.diffusion.flow_matching.scheduling.LinearScheduler
+      exact_henu: true
+      guidance_interval_min: 0.1
+      guidance_interval_max: 0.9
+      timeshift: 1.0
+      step_fn: src.diffusion.flow_matching.sampling.ode_step_fn
+      last_step: null
+      last_step_fn: src.diffusion.flow_matching.sampling.ode_step_fn
+      guidance_fn: src.diffusion.base.guidance.simple_guidance_fn
+      num_steps: 50
+      guidance: 2.0
+  ema_tracker:
+    class_path: src.callbacks.simple_ema.SimpleEMA
+    init_args:
+      decay: 0.9999
+      every_n_steps: 1
+  optimizer:
+    class_path: torch.optim.AdamW
+    init_args:
+      lr: 0.0001
+      betas:
+      - 0.9
+      - 0.999
+      eps: 1.0e-08
+      weight_decay: 0.0
+      amsgrad: false
+      maximize: false
+      foreach: null
+      capturable: false
+      differentiable: false
+      fused: null
+  lr_scheduler: null
+  eval_original_model: false
+data:
+  train_dataset:
+    class_path: src.data.dataset.imagenet.PixImageNet
+    init_args:
+      root: /data/batik-256/images/
+      resolution: 256
+      random_crop: false
+      random_flip: false
+  eval_dataset: null
+  pred_dataset: null
+  train_batch_size: 64
+  train_num_workers: 8
+  train_prefetch_factor: 8
+  eval_batch_size: 32
+  eval_num_workers: 4
+  pred_batch_size: 32
+  pred_num_workers: 1
+tags:
+  exp: jit_b_pixel_bs64_repa_4_lpips_pdino_adamw
+ckpt_path: null
+weights_only: null

jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/epoch=2555-step=800000.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aaa2eee7cf53377d830fd86b31d06b6d93bccdb28cc6bafefa601a9cc280637c
+size 2109052911

jit_b_pixel_bs64_repa_4_lpips_pdino_adamw/step_800000/uploaded_by.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ source_dir=/workspace