Upload 3 files

Browse files

Files changed (3) hide show

config.yaml +117 -0
lora_000002400.safetensors +3 -0
optimizer.pt +3 -0

config.yaml ADDED Viewed

	@@ -0,0 +1,117 @@

+job: extension
+config:
+  name: lora
+  process:
+  - type: diffusion_trainer
+    training_folder: /output
+    sqlite_db_path: /app/ai-toolkit/aitk_db.db
+    device: cuda
+    trigger_word: anzohwx
+    performance_log_every: 10
+    network:
+      type: lora
+      linear: 64
+      linear_alpha: 64
+      conv: 16
+      conv_alpha: 16
+      lokr_full_rank: true
+      lokr_factor: -1
+      network_kwargs:
+        ignore_if_contains: []
+    save:
+      dtype: bf16
+      save_every: 120
+      max_step_saves_to_keep: 4000
+      save_format: diffusers
+      push_to_hub: false
+    datasets:
+    - folder_path: /datasets/anzohwx
+      mask_path: null
+      mask_min_value: 0.1
+      default_caption: a photo of anzohwx girl
+      caption_ext: txt
+      caption_dropout_rate: 0.05
+      cache_latents_to_disk: false
+      is_reg: false
+      network_weight: 1
+      resolution:
+      - 1024
+      controls: []
+      shrink_video_to_frames: true
+      num_frames: 1
+      do_i2v: true
+      flip_x: false
+      flip_y: false
+    train:
+      batch_size: 2
+      bypass_guidance_embedding: false
+      steps: 30000
+      gradient_accumulation: 1
+      train_unet: true
+      train_text_encoder: false
+      gradient_checkpointing: true
+      noise_scheduler: flowmatch
+      optimizer: adamw8bit
+      timestep_type: weighted
+      content_or_style: balanced
+      optimizer_params:
+        weight_decay: 0.0001
+      unload_text_encoder: false
+      cache_text_embeddings: false
+      lr: 0.0001
+      ema_config:
+        use_ema: false
+        ema_decay: 0.99
+      skip_first_sample: false
+      force_first_sample: false
+      disable_sampling: true
+      dtype: bf16
+      diff_output_preservation: false
+      diff_output_preservation_multiplier: 1
+      diff_output_preservation_class: person
+      switch_boundary_every: 1
+      loss_type: mse
+    model:
+      name_or_path: Qwen/Qwen-Image
+      quantize: true
+      qtype: qfloat8
+      quantize_te: true
+      qtype_te: qfloat8
+      arch: qwen_image
+      low_vram: true
+      model_kwargs: {}
+      layer_offloading: false
+      layer_offloading_text_encoder_percent: 1
+      layer_offloading_transformer_percent: 1
+    sample:
+      sampler: flowmatch
+      sample_every: 250
+      width: 1024
+      height: 1024
+      samples:
+      - prompt: woman with red hair, playing chess at the park, bomb going off in
+          the background
+      - prompt: a woman holding a coffee cup, in a beanie, sitting at a cafe
+      - prompt: a horse is a DJ at a night club, fish eye lens, smoke machine, lazer
+          lights, holding a martini
+      - prompt: a man showing off his cool new t shirt at the beach, a shark is jumping
+          out of the water in the background
+      - prompt: a bear building a log cabin in the snow covered mountains
+      - prompt: woman playing the guitar, on stage, singing a song, laser lights,
+          punk rocker
+      - prompt: hipster man with a beard, building a chair, in a wood shop
+      - prompt: photo of a man, white background, medium shot, modeling clothing,
+          studio lighting, white backdrop
+      - prompt: a man holding a sign that says, 'this is a sign'
+      - prompt: a bulldog, in a post apocalyptic world, with a shotgun, in a leather
+          jacket, in a desert, with a motorcycle
+      neg: ''
+      seed: 42
+      walk_seed: true
+      guidance_scale: 4
+      sample_steps: 25
+      num_frames: 1
+      fps: 1
+meta:
+  name: lora
+  version: '1.0'

lora_000002400.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a5687510b3b5f9dfd365dcf1a6b00c0eda79cef093f74e358b95fabd8aad2185
+size 1179883680

optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c73580ac0c3dfa96f4fe567272b56becf2d678064866fc1d02e871bfaf6905e1
+size 1195257229