TheMindExpansionNetwork committed on Nov 16, 2025

Commit

0b4a4dd

verified ·

1 Parent(s): aa3ecf4

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +4 -0
.job_config.json +135 -0
config.yaml +126 -0
hash_cache_v1.safetensors +3 -0
hash_cache_v1_000002000.safetensors +3 -0
hash_cache_v1_000002250.safetensors +3 -0
hash_cache_v1_000002500.safetensors +3 -0
hash_cache_v1_000002750.safetensors +3 -0
log.txt +0 -0
optimizer.pt +3 -0
pid.txt +1 -0
samples/1763244777125__000000000_0.jpg +0 -0
samples/1763244847638__000000000_1.jpg +0 -0
samples/1763244918161__000000000_2.jpg +0 -0
samples/1763244989127__000000000_3.jpg +0 -0
samples/1763245869172__000000250_0.jpg +0 -0
samples/1763245941492__000000250_1.jpg +0 -0
samples/1763246013882__000000250_2.jpg +0 -0
samples/1763246086279__000000250_3.jpg +0 -0
samples/1763246958297__000000500_0.jpg +0 -0
samples/1763247030518__000000500_1.jpg +0 -0
samples/1763247102833__000000500_2.jpg +0 -0
samples/1763247175174__000000500_3.jpg +0 -0
samples/1763248036622__000000750_0.jpg +0 -0
samples/1763248108868__000000750_1.jpg +0 -0
samples/1763248181412__000000750_2.jpg +0 -0
samples/1763248253941__000000750_3.jpg +0 -0
samples/1763249132486__000001000_0.jpg +0 -0
samples/1763249204958__000001000_1.jpg +0 -0
samples/1763249277546__000001000_2.jpg +0 -0
samples/1763249349926__000001000_3.jpg +0 -0
samples/1763250220760__000001250_0.jpg +0 -0
samples/1763250293230__000001250_1.jpg +0 -0
samples/1763250365742__000001250_2.jpg +0 -0
samples/1763250438055__000001250_3.jpg +0 -0
samples/1763251300994__000001500_0.jpg +0 -0
samples/1763251373348__000001500_1.jpg +0 -0
samples/1763251445767__000001500_2.jpg +0 -0
samples/1763251518184__000001500_3.jpg +0 -0
samples/1763252388902__000001750_0.jpg +0 -0
samples/1763252461313__000001750_1.jpg +0 -0
samples/1763252533715__000001750_2.jpg +0 -0
samples/1763252606026__000001750_3.jpg +0 -0
samples/1763253487029__000002000_0.jpg +0 -0
samples/1763253559402__000002000_1.jpg +0 -0
samples/1763253631997__000002000_2.jpg +0 -0
samples/1763253704491__000002000_3.jpg +0 -0
samples/1763254572411__000002250_0.jpg +0 -0
samples/1763254644904__000002250_1.jpg +0 -0
samples/1763254717481__000002250_2.jpg +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+samples/1763254717481__000002250_2.jpg filter=lfs diff=lfs merge=lfs -text
+samples/1763255798300__000002500_2.jpg filter=lfs diff=lfs merge=lfs -text
+samples/1763256921963__000002750_2.jpg filter=lfs diff=lfs merge=lfs -text
+samples/1763258006174__000003000_2.jpg filter=lfs diff=lfs merge=lfs -text

.job_config.json ADDED Viewed

	@@ -0,0 +1,135 @@

+{
+  "job": "extension",
+  "config": {
+    "name": "hash_cache_v1",
+    "process": [
+      {
+        "type": "diffusion_trainer",
+        "training_folder": "/app/ai-toolkit/output",
+        "sqlite_db_path": "/app/ai-toolkit/aitk_db.db",
+        "device": "cuda",
+        "trigger_word": null,
+        "performance_log_every": 10,
+        "network": {
+          "type": "lora",
+          "linear": 32,
+          "linear_alpha": 32,
+          "conv": 16,
+          "conv_alpha": 16,
+          "lokr_full_rank": true,
+          "lokr_factor": -1,
+          "network_kwargs": {
+            "ignore_if_contains": []
+          }
+        },
+        "save": {
+          "dtype": "bf16",
+          "save_every": 250,
+          "max_step_saves_to_keep": 4,
+          "save_format": "diffusers",
+          "push_to_hub": false
+        },
+        "datasets": [
+          {
+            "folder_path": "/app/ai-toolkit/datasets/hash_cache",
+            "mask_path": null,
+            "mask_min_value": 0.1,
+            "default_caption": "",
+            "caption_ext": "txt",
+            "caption_dropout_rate": 0.05,
+            "cache_latents_to_disk": false,
+            "is_reg": false,
+            "network_weight": 1,
+            "resolution": [
+              512,
+              768,
+              1024
+            ],
+            "controls": [],
+            "shrink_video_to_frames": true,
+            "num_frames": 1,
+            "do_i2v": true,
+            "flip_x": false,
+            "flip_y": false
+          }
+        ],
+        "train": {
+          "batch_size": 1,
+          "bypass_guidance_embedding": false,
+          "steps": 3000,
+          "gradient_accumulation": 1,
+          "train_unet": true,
+          "train_text_encoder": false,
+          "gradient_checkpointing": true,
+          "noise_scheduler": "flowmatch",
+          "optimizer": "adamw8bit",
+          "timestep_type": "weighted",
+          "content_or_style": "balanced",
+          "optimizer_params": {
+            "weight_decay": 0.0001
+          },
+          "unload_text_encoder": false,
+          "cache_text_embeddings": false,
+          "lr": 0.0001,
+          "ema_config": {
+            "use_ema": false,
+            "ema_decay": 0.99
+          },
+          "skip_first_sample": false,
+          "force_first_sample": false,
+          "disable_sampling": false,
+          "dtype": "bf16",
+          "diff_output_preservation": false,
+          "diff_output_preservation_multiplier": 1,
+          "diff_output_preservation_class": "person",
+          "switch_boundary_every": 1,
+          "loss_type": "mse"
+        },
+        "model": {
+          "name_or_path": "Qwen/Qwen-Image",
+          "quantize": true,
+          "qtype": "qfloat8",
+          "quantize_te": true,
+          "qtype_te": "qfloat8",
+          "arch": "qwen_image",
+          "low_vram": true,
+          "model_kwargs": {},
+          "layer_offloading": false,
+          "layer_offloading_text_encoder_percent": 1,
+          "layer_offloading_transformer_percent": 1
+        },
+        "sample": {
+          "sampler": "flowmatch",
+          "sample_every": 250,
+          "width": 1024,
+          "height": 1024,
+          "samples": [
+            {
+              "prompt": "Two adult people sitting side-by-side on a couch in a simple room, full bodies fully visible in frame. Neutral lighting, no stylization, no dramatic poses. Both figures look forward calmly with relaxed posture, hands resting naturally. The background is minimal and uncluttered, with a plain wall, soft shadows and a low-table in front. No neon, no props — just clean, natural photographic realism."
+            },
+            {
+              "prompt": "Two adults slightly slouched on a couch, clearly drunk but not cartoonish: relaxed posture, unfocused expressions, leaning into each other casually. Full bodies visible. The room is dim but neutral in tone, with soft warm lighting, subtle background blur and no dramatic color effects. A few bottles or cans on a table in front for context, but environment remains minimal and clean."
+            },
+            {
+              "prompt": "A clean black-and-white line-art drawing of two people sitting on a couch, full bodies visible, simple outlines with minimal shading. Smooth, consistent linework, no stylization like anime or comic — neutral sketchbook quality. Background lightly suggested with simple lines for the couch and wall. No color, no text, no shadows — pure structural line drawing."
+            },
+            {
+              "prompt": "Two human silhouettes sitting on a couch, shown as solid matte shapes with no internal details. Full bodies visible, clean side-by-side posture. The couch is a simple silhouette shape as well. Background is blank white. No shading, no texture — pure flat graphical silhouette intended only for pose and composition reference."
+            }
+          ],
+          "neg": "",
+          "seed": 42,
+          "walk_seed": true,
+          "guidance_scale": 4,
+          "sample_steps": 25,
+          "num_frames": 1,
+          "fps": 1
+        }
+      }
+    ]
+  },
+  "meta": {
+    "name": "[name]",
+    "version": "1.0"
+  }
+}

config.yaml ADDED Viewed

	@@ -0,0 +1,126 @@

+job: extension
+config:
+  name: hash_cache_v1
+  process:
+  - type: diffusion_trainer
+    training_folder: /app/ai-toolkit/output
+    sqlite_db_path: /app/ai-toolkit/aitk_db.db
+    device: cuda
+    trigger_word: null
+    performance_log_every: 10
+    network:
+      type: lora
+      linear: 32
+      linear_alpha: 32
+      conv: 16
+      conv_alpha: 16
+      lokr_full_rank: true
+      lokr_factor: -1
+      network_kwargs:
+        ignore_if_contains: []
+    save:
+      dtype: bf16
+      save_every: 250
+      max_step_saves_to_keep: 4
+      save_format: diffusers
+      push_to_hub: false
+    datasets:
+    - folder_path: /app/ai-toolkit/datasets/hash_cache
+      mask_path: null
+      mask_min_value: 0.1
+      default_caption: ''
+      caption_ext: txt
+      caption_dropout_rate: 0.05
+      cache_latents_to_disk: false
+      is_reg: false
+      network_weight: 1
+      resolution:
+      - 512
+      - 768
+      - 1024
+      controls: []
+      shrink_video_to_frames: true
+      num_frames: 1
+      do_i2v: true
+      flip_x: false
+      flip_y: false
+    train:
+      batch_size: 1
+      bypass_guidance_embedding: false
+      steps: 3000
+      gradient_accumulation: 1
+      train_unet: true
+      train_text_encoder: false
+      gradient_checkpointing: true
+      noise_scheduler: flowmatch
+      optimizer: adamw8bit
+      timestep_type: weighted
+      content_or_style: balanced
+      optimizer_params:
+        weight_decay: 0.0001
+      unload_text_encoder: false
+      cache_text_embeddings: false
+      lr: 0.0001
+      ema_config:
+        use_ema: false
+        ema_decay: 0.99
+      skip_first_sample: false
+      force_first_sample: false
+      disable_sampling: false
+      dtype: bf16
+      diff_output_preservation: false
+      diff_output_preservation_multiplier: 1
+      diff_output_preservation_class: person
+      switch_boundary_every: 1
+      loss_type: mse
+    model:
+      name_or_path: Qwen/Qwen-Image
+      quantize: true
+      qtype: qfloat8
+      quantize_te: true
+      qtype_te: qfloat8
+      arch: qwen_image
+      low_vram: true
+      model_kwargs: {}
+      layer_offloading: false
+      layer_offloading_text_encoder_percent: 1
+      layer_offloading_transformer_percent: 1
+    sample:
+      sampler: flowmatch
+      sample_every: 250
+      width: 1024
+      height: 1024
+      samples:
+      - prompt: "Two adult people sitting side-by-side on a couch in a simple room,\
+          \ full bodies fully visible in frame. Neutral lighting, no stylization,\
+          \ no dramatic poses. Both figures look forward calmly with relaxed posture,\
+          \ hands resting naturally. The background is minimal and uncluttered, with\
+          \ a plain wall, soft shadows and a low-table in front. No neon, no props\
+          \ \u2014 just clean, natural photographic realism."
+      - prompt: 'Two adults slightly slouched on a couch, clearly drunk but not cartoonish:
+          relaxed posture, unfocused expressions, leaning into each other casually.
+          Full bodies visible. The room is dim but neutral in tone, with soft warm
+          lighting, subtle background blur and no dramatic color effects. A few bottles
+          or cans on a table in front for context, but environment remains minimal
+          and clean.'
+      - prompt: "A clean black-and-white line-art drawing of two people sitting on\
+          \ a couch, full bodies visible, simple outlines with minimal shading. Smooth,\
+          \ consistent linework, no stylization like anime or comic \u2014 neutral\
+          \ sketchbook quality. Background lightly suggested with simple lines for\
+          \ the couch and wall. No color, no text, no shadows \u2014 pure structural\
+          \ line drawing."
+      - prompt: "Two human silhouettes sitting on a couch, shown as solid matte shapes\
+          \ with no internal details. Full bodies visible, clean side-by-side posture.\
+          \ The couch is a simple silhouette shape as well. Background is blank white.\
+          \ No shading, no texture \u2014 pure flat graphical silhouette intended\
+          \ only for pose and composition reference."
+      neg: ''
+      seed: 42
+      walk_seed: true
+      guidance_scale: 4
+      sample_steps: 25
+      num_frames: 1
+      fps: 1
+meta:
+  name: hash_cache_v1
+  version: '1.0'

hash_cache_v1.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fcdab1bbb2b305363d034d30f885bca6d3f67b3685706475ae5b974c2b04fe1d
+size 590058824

hash_cache_v1_000002000.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cdff1eca1644da954b2c5c379e3f6299159bcb0596d7183d00eae51ee9454686
+size 590058824

hash_cache_v1_000002250.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1858da18ebec668624a740d2379e6eca19aafcff049df96538a11a52ea71f7bb
+size 590058824

hash_cache_v1_000002500.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:377cc623a5abbfb75d6372091f464440633a651d75c62f27ea0ac56851ea2aab
+size 590058824

hash_cache_v1_000002750.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3516f980a2c016976faed96bf9f8c21e9f4dace8e6e1849839bac2edd8db6e2b
+size 590058824

log.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fee356929b2770853d09f29520173ebbd992d7526f690e6db892525045550ed0
+size 598613389

pid.txt ADDED Viewed

	@@ -0,0 +1 @@


+343

samples/1763244777125__000000000_0.jpg ADDED Viewed

samples/1763244847638__000000000_1.jpg ADDED Viewed

samples/1763244918161__000000000_2.jpg ADDED Viewed

samples/1763244989127__000000000_3.jpg ADDED Viewed

samples/1763245869172__000000250_0.jpg ADDED Viewed

samples/1763245941492__000000250_1.jpg ADDED Viewed

samples/1763246013882__000000250_2.jpg ADDED Viewed

samples/1763246086279__000000250_3.jpg ADDED Viewed

samples/1763246958297__000000500_0.jpg ADDED Viewed

samples/1763247030518__000000500_1.jpg ADDED Viewed

samples/1763247102833__000000500_2.jpg ADDED Viewed

samples/1763247175174__000000500_3.jpg ADDED Viewed

samples/1763248036622__000000750_0.jpg ADDED Viewed

samples/1763248108868__000000750_1.jpg ADDED Viewed

samples/1763248181412__000000750_2.jpg ADDED Viewed

samples/1763248253941__000000750_3.jpg ADDED Viewed

samples/1763249132486__000001000_0.jpg ADDED Viewed

samples/1763249204958__000001000_1.jpg ADDED Viewed

samples/1763249277546__000001000_2.jpg ADDED Viewed

samples/1763249349926__000001000_3.jpg ADDED Viewed

samples/1763250220760__000001250_0.jpg ADDED Viewed

samples/1763250293230__000001250_1.jpg ADDED Viewed

samples/1763250365742__000001250_2.jpg ADDED Viewed

samples/1763250438055__000001250_3.jpg ADDED Viewed

samples/1763251300994__000001500_0.jpg ADDED Viewed

samples/1763251373348__000001500_1.jpg ADDED Viewed

samples/1763251445767__000001500_2.jpg ADDED Viewed

samples/1763251518184__000001500_3.jpg ADDED Viewed

samples/1763252388902__000001750_0.jpg ADDED Viewed

samples/1763252461313__000001750_1.jpg ADDED Viewed

samples/1763252533715__000001750_2.jpg ADDED Viewed

samples/1763252606026__000001750_3.jpg ADDED Viewed

samples/1763253487029__000002000_0.jpg ADDED Viewed

samples/1763253559402__000002000_1.jpg ADDED Viewed

samples/1763253631997__000002000_2.jpg ADDED Viewed

samples/1763253704491__000002000_3.jpg ADDED Viewed

samples/1763254572411__000002250_0.jpg ADDED Viewed

samples/1763254644904__000002250_1.jpg ADDED Viewed

samples/1763254717481__000002250_2.jpg ADDED Viewed

Git LFS Details

SHA256: 6eb246e107006452e04065303f3d32a1e0cd3ab010512fc269e7ccae0884cd29
Pointer size: 131 Bytes
Size of remote file: 104 kB