recoilme committed on Oct 27, 2025

Commit

1fb2664

1 Parent(s): b4d8bb3

v3

Browse files

Files changed (17) hide show

samples/unet_320x640_0.jpg +3 -0
samples/unet_384x640_0.jpg +2 -2
samples/unet_448x640_0.jpg +2 -2
samples/unet_512x640_0.jpg +2 -2
samples/unet_576x640_0.jpg +2 -2
samples/unet_640x320_0.jpg +3 -0
samples/unet_640x384_0.jpg +2 -2
samples/unet_640x448_0.jpg +2 -2
samples/unet_640x512_0.jpg +2 -2
samples/unet_640x576_0.jpg +2 -2
samples/unet_640x640_0.jpg +2 -2
src/dataset_combine.py +1 -1
src/dataset_combine_zstd.py +47 -0
src/dataset_from_folder_qwen.py +2 -2
train.py +19 -9
unet/config.json +2 -2
unet/diffusion_pytorch_model.safetensors +2 -2

samples/unet_320x640_0.jpg ADDED Viewed

Git LFS Details

SHA256: aaa49bde52ec56fd5630df5c20b5279a31f4449dd6cb55e331fcca2c56d1bf9c
Pointer size: 130 Bytes
Size of remote file: 78.6 kB

samples/unet_384x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 7c30542105a2666530f5803781536a2a1e569ab1f9964fcac8896b4f4a362660
Pointer size: 131 Bytes
Size of remote file: 128 kB

Git LFS Details

SHA256: 3fc2e576d7213ae9f6c2056155e5e01f0ee4d4b30cc19c27597572b78822c088
Pointer size: 130 Bytes
Size of remote file: 60.5 kB

samples/unet_448x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: b45c5a27eb6000c80251516574a6e27165b9d1320fc179eec17ad1ed344791af
Pointer size: 131 Bytes
Size of remote file: 153 kB

Git LFS Details

SHA256: 0145df74b35440e170a97ac44bb604190fb11e3cef23166b4a8b6892839ff09d
Pointer size: 131 Bytes
Size of remote file: 133 kB

samples/unet_512x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: eed27dcab746b5c7e514c51b02485ea557cddd9d5056eddf9de0aaeb198bf288
Pointer size: 131 Bytes
Size of remote file: 163 kB

Git LFS Details

SHA256: 6acc2d9442ab6d2aa5ae3a95c42a5c5ad30870ecf3be164eb5105b0c3a7f3e17
Pointer size: 131 Bytes
Size of remote file: 147 kB

samples/unet_576x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 7333aa4c4e061883e815ba83119babbb2553a5c19fd45277104c9e17690d55a2
Pointer size: 131 Bytes
Size of remote file: 203 kB

Git LFS Details

SHA256: dc47d89308fec89e2459d20b1359e41ceeea16c472547589de2e34449d051976
Pointer size: 131 Bytes
Size of remote file: 144 kB

samples/unet_640x320_0.jpg ADDED Viewed

Git LFS Details

SHA256: e42813ea082afb569323590b04ceef30f2726f396c61763b518f5b08267f27e3
Pointer size: 130 Bytes
Size of remote file: 88.6 kB

samples/unet_640x384_0.jpg CHANGED Viewed

Git LFS Details

SHA256: a0a4f56606b4fe0fdd56bc6ab26ac566837d6ca332ec320c210093ff8ceb75d6
Pointer size: 131 Bytes
Size of remote file: 114 kB

Git LFS Details

SHA256: 8185d2203f022cf26056ab99aa64fc89b633683119c9e165163cae08e2af8943
Pointer size: 130 Bytes
Size of remote file: 46.1 kB

samples/unet_640x448_0.jpg CHANGED Viewed

Git LFS Details

SHA256: faf83170ec8fe965a5efea48365c11f50e8d325960279226c84087f28266c335
Pointer size: 131 Bytes
Size of remote file: 122 kB

Git LFS Details

SHA256: 46fb4f2a371e61359b0b1bf0e3fe8c1abbd058ebb0449736593db8a7aacbe33e
Pointer size: 131 Bytes
Size of remote file: 122 kB

samples/unet_640x512_0.jpg CHANGED Viewed

Git LFS Details

SHA256: b3360256cb302285902321ced68e9c6601d8f52c3d649fec91864f97610d4e0e
Pointer size: 131 Bytes
Size of remote file: 114 kB

Git LFS Details

SHA256: 74e58d54d0e4a77341b110f3aa2274f663cb674d3e187d6080e0c5503c3e8b43
Pointer size: 131 Bytes
Size of remote file: 125 kB

samples/unet_640x576_0.jpg CHANGED Viewed

Git LFS Details

SHA256: ff08a7a9ac754b820c93d3b5f5f7dab28b0687c583560d8a474fd5fb8c6f7866
Pointer size: 131 Bytes
Size of remote file: 154 kB

Git LFS Details

SHA256: 8e04f685ad9ecc7537044e0fd9789019e75197d1b08be6cc38caa8b5b662fe96
Pointer size: 131 Bytes
Size of remote file: 118 kB

samples/unet_640x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 1819eac81e22f5bfa21581295b3afd82440ebd5327bb317e78fa1e2425d2b8e7
Pointer size: 131 Bytes
Size of remote file: 175 kB

Git LFS Details

SHA256: 372ac2247c2ef96783cad10c2cc9dffb9578348021bf3d7884c9cc18a6210963
Pointer size: 130 Bytes
Size of remote file: 85.5 kB

src/dataset_combine.py CHANGED Viewed

@@ -65,4 +65,4 @@ def combine_datasets(main_dataset_path, datasets_to_add):
     return combined
-combine_datasets("/workspace/sdxs3d/datasets/mjnj", ["/workspace/animesfw384"])


65
66	return combined
67
68	+ combine_datasets("/workspace/sdxs3d/datasets/batch0_640", ["/workspace/sdxs3d/datasets/esh640"])

src/dataset_combine_zstd.py ADDED Viewed

	@@ -0,0 +1,47 @@

+import os
+import shutil
+from datasets import load_from_disk, concatenate_datasets
+def combine_datasets(main_dataset_path, datasets_to_add):
+    try:
+        main_dataset = load_from_disk(main_dataset_path)
+        print(f"Загружен основной датасет: {main_dataset_path} ({len(main_dataset)} записей)")
+    except Exception as e:
+        print(f"Ошибка загрузки основного датасета: {e}")
+        return None
+    all_datasets = [main_dataset]
+    for path in datasets_to_add:
+        try:
+            ds = load_from_disk(path)
+            all_datasets.append(ds)
+            print(f"Добавлен датасет: {path} ({len(ds)} записей)")
+        except Exception as e:
+            print(f"Ошибка загрузки датасета {path}: {e}")
+    combined = concatenate_datasets(all_datasets)
+    print(f"Объединение {len(all_datasets)} датасетов...")
+    temp_dir = f"{main_dataset_path}_temp"
+    if os.path.exists(temp_dir):
+        shutil.rmtree(temp_dir)
+    try:
+        print(f"Сохранение в сжатом формате во временную директорию {temp_dir}...")
+        combined.save_to_disk(temp_dir)#, compression="zstd")  # <-- Сжатие
+        print(f"Обновление основного датасета...")
+        if os.path.exists(main_dataset_path):
+            shutil.rmtree(main_dataset_path)
+        shutil.copytree(temp_dir, main_dataset_path)
+        shutil.rmtree(temp_dir)
+        print(f"✅ Объединенный датасет ({len(combined)} записей) успешно сохранен в: {main_dataset_path}")
+    except Exception as e:
+        print(f"Ошибка при сохранении датасета: {e}")
+        print(f"Временные данные сохранены в: {temp_dir}")
+    return combined
+combine_datasets("/workspace/sdxs3d/datasets/esh640", ["/workspace/sdxs3d/datasets/batch0_640_temp"])

src/dataset_from_folder_qwen.py CHANGED Viewed

@@ -27,8 +27,8 @@ step = 64 #64
 empty_share = 0.05
 limit = 0
 # Основная процедура обработки
-folder_path = "/workspace/sdxs3d/datasets/eshooshoo_all" #alchemist"
-save_path = "/workspace/sdxs3d/datasets/esh640" #"alchemist"
 os.makedirs(save_path, exist_ok=True)
 # Функция для очистки CUDA памяти

 empty_share = 0.05
 limit = 0
 # Основная процедура обработки
+folder_path = "/workspace/sdxs3d/datasets/batch1" #alchemist"
+save_path = "/workspace/sdxs3d/datasets/batch1_640" #"alchemist"
 os.makedirs(save_path, exist_ok=True)
 # Функция для очистки CUDA памяти

train.py CHANGED Viewed

@@ -26,16 +26,16 @@ import torch.nn.functional as F
 from collections import deque
 # --------------------------- Параметры ---------------------------
-ds_path = "/workspace/sdxs3d/datasets/esh640"
 project = "unet"
-batch_size = 64
 base_learning_rate = 6e-5
 min_learning_rate = 1e-5
-num_epochs = 80
 # samples/save per epoch
-sample_interval_share = 20
-use_wandb = True
-use_comet_ml = False
 save_model = True
 use_decay = True
 fbp = False # fused backward pass
@@ -52,7 +52,7 @@ torch.backends.cudnn.allow_tf32 = True
 torch.backends.cuda.enable_mem_efficient_sdp(False)
 dtype = torch.float32
 save_barrier = 1.006
-warmup_percent = 0.01
 percentile_clipping = 99 # 8bit optim
 betta2 = 0.99
 eps = 1e-8
@@ -480,7 +480,8 @@ def get_negative_embedding(neg_prompt="", batch_size=1):
     # Возвращаем эмбеддинг
     if not neg_prompt:
         hidden_dim = 1024  # Размерность эмбеддинга Qwen3-Embedding-0.6B
-        return torch.zeros((batch_size, 1, hidden_dim), dtype=dtype, device=device)
     uncond_emb = encode_texts([neg_prompt]).to(dtype=dtype, device=device)
     uncond_emb = uncond_emb.repeat(batch_size, 1, 1)  # Добавляем батч
@@ -533,10 +534,19 @@ def generate_and_save_samples(fixed_samples_cpu,empty_embeddings, step):
                 # guidance: удваиваем батч
                 if guidance_scale != 1:
                     latent_model_input = torch.cat([latents, latents], dim=0)
-                    text_embeddings_batch = torch.cat([empty_embeddings, sample_text_embeddings], dim=0)
                 else:
                     latent_model_input = latents
                     text_embeddings_batch = sample_text_embeddings
                 # предсказание потока (velocity)
                 model_out = original_model(latent_model_input, t, encoder_hidden_states=text_embeddings_batch)

 from collections import deque
 # --------------------------- Параметры ---------------------------
+ds_path = "/workspace/sdxs3d/datasets/batch0_640_temp"
 project = "unet"
+batch_size = 32
 base_learning_rate = 6e-5
 min_learning_rate = 1e-5
+num_epochs = 10
 # samples/save per epoch
+sample_interval_share = 2
+use_wandb = False
+use_comet_ml = True
 save_model = True
 use_decay = True
 fbp = False # fused backward pass
 torch.backends.cuda.enable_mem_efficient_sdp(False)
 dtype = torch.float32
 save_barrier = 1.006
+warmup_percent = 0.005
 percentile_clipping = 99 # 8bit optim
 betta2 = 0.99
 eps = 1e-8
     # Возвращаем эмбеддинг
     if not neg_prompt:
         hidden_dim = 1024  # Размерность эмбеддинга Qwen3-Embedding-0.6B
+        seq_len = 150
+        return torch.zeros((batch_size, seq_len, hidden_dim), dtype=dtype, device=device)
     uncond_emb = encode_texts([neg_prompt]).to(dtype=dtype, device=device)
     uncond_emb = uncond_emb.repeat(batch_size, 1, 1)  # Добавляем батч
                 # guidance: удваиваем батч
                 if guidance_scale != 1:
                     latent_model_input = torch.cat([latents, latents], dim=0)
+                    # empty_embeddings: [1, 1, hidden_dim] → повторяем по seq_len и batch
+                    seq_len = sample_text_embeddings.shape[1]
+                    hidden_dim = sample_text_embeddings.shape[2]
+                    empty_embeddings_exp = empty_embeddings.expand(-1, seq_len, hidden_dim)  # [1, seq_len, hidden_dim]
+                    empty_embeddings_exp = empty_embeddings_exp.repeat(sample_text_embeddings.shape[0], 1, 1)  # [batch, seq_len, hidden_dim]
+                    text_embeddings_batch = torch.cat([empty_embeddings_exp, sample_text_embeddings], dim=0)
                 else:
                     latent_model_input = latents
                     text_embeddings_batch = sample_text_embeddings
                 # предсказание потока (velocity)
                 model_out = original_model(latent_model_input, t, encoder_hidden_states=text_embeddings_batch)

unet/config.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:afc06beff07034f0ce9f671c83222e7f78eedc3b3ce93293143accdebef1b111
-size 1887

 version https://git-lfs.github.com/spec/v1
+oid sha256:fac879374be0c1cd3ffcbfa188e72f50576f25326aada5da077b0fc7af442ad4
+size 1874

unet/diffusion_pytorch_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9d933d318f2d42b37c31065a09c14ee0c03ec05a10d672667743a089d396086b
-size 3092571208

 version https://git-lfs.github.com/spec/v1
+oid sha256:74563fd4bef0e9f811d7ed6571b6064707beafa8f6ea7f4eeae0dbdfe819f902
+size 6184944280