jaruce committed on Jun 21, 2025

Commit

df2120e

verified ·

1 Parent(s): c927c54

End of training

Browse files

Files changed (28) hide show

checkpoint-3000/optimizer.bin +3 -0
checkpoint-3000/random_states_0.pkl +3 -0
checkpoint-3000/scheduler.bin +3 -0
checkpoint-3000/unet/config.json +68 -0
checkpoint-3000/unet/diffusion_pytorch_model.safetensors +3 -0
checkpoint-3500/optimizer.bin +3 -0
checkpoint-3500/random_states_0.pkl +3 -0
checkpoint-3500/scheduler.bin +3 -0
checkpoint-3500/unet/config.json +68 -0
checkpoint-3500/unet/diffusion_pytorch_model.safetensors +3 -0
checkpoint-4000/optimizer.bin +3 -0
checkpoint-4000/random_states_0.pkl +3 -0
checkpoint-4000/scheduler.bin +3 -0
checkpoint-4000/unet/config.json +68 -0
checkpoint-4000/unet/diffusion_pytorch_model.safetensors +3 -0
checkpoint-4500/optimizer.bin +3 -0
checkpoint-4500/random_states_0.pkl +3 -0
checkpoint-4500/scheduler.bin +3 -0
checkpoint-4500/unet/config.json +68 -0
checkpoint-4500/unet/diffusion_pytorch_model.safetensors +3 -0
checkpoint-5000/optimizer.bin +3 -0
checkpoint-5000/random_states_0.pkl +3 -0
checkpoint-5000/scheduler.bin +3 -0
checkpoint-5000/unet/config.json +68 -0
checkpoint-5000/unet/diffusion_pytorch_model.safetensors +3 -0
readme.txt +3 -0
unet/config.json +1 -1
unet/diffusion_pytorch_model.safetensors +1 -1

checkpoint-3000/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a74887c3f340d5cd9b3d8f0d9701a480b249657c67f4588f16128d19119e5375
+size 6876851924

checkpoint-3000/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad976251c14f38921dc3ef41ed81155520134203fe31c630da46d1a32edaa736
+size 16036

checkpoint-3000/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9bcaa0ec9565c3bec056c6136ed24ab62a762aedcf6cdfb8053f701a68b6d056
+size 1000

checkpoint-3000/unet/config.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "_class_name": "UNet2DConditionModel",
+  "_diffusers_version": "0.33.1",
+  "_name_or_path": "output_lr1e4/checkpoint-2500",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "attention_type": "default",
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 768,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 8,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "out_channels": 4,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "reverse_transformer_layers_per_block": null,
+  "sample_size": 64,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

checkpoint-3000/unet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d69d56942f8db858fe9ce38a9a8b5e2b3cb192b2ddc35a451080b77eb997f174
+size 3438213624

checkpoint-3500/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc5d90c7f7762faa0edb200e1acf49cb8e3c51a6a269e617cb8813bbf338207d
+size 6876851924

checkpoint-3500/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df013a66abfe2b0f0c5b50bc9069ddb6295fc2b0293b9e5c83095d5e80201ad2
+size 16036

checkpoint-3500/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e6dd533cc093c46d0767cb255242c6e7c5706aaffabe304eeb0030f224e5cb82
+size 1000

checkpoint-3500/unet/config.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "_class_name": "UNet2DConditionModel",
+  "_diffusers_version": "0.33.1",
+  "_name_or_path": "output_lr1e4/checkpoint-2500",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "attention_type": "default",
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 768,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 8,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "out_channels": 4,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "reverse_transformer_layers_per_block": null,
+  "sample_size": 64,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

checkpoint-3500/unet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3127bf6cdf1538adfee5d4e612ff9d6c464c57a519faa04602b7def78d691cb6
+size 3438213624

checkpoint-4000/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a2f3d861e7b78570c4640b905e09a83a132a59b3c71254eb205fadbcba7d7cee
+size 6876851924

checkpoint-4000/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b8a60da8071d14cee03204f0fcb30199718e0dbdc5cc10ca0ecbb42c47d7e6db
+size 16036

checkpoint-4000/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2bbb61109d01da8a9c381c0e2f077875e9118afeba0c4ed8b289ee114f675793
+size 1000

checkpoint-4000/unet/config.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "_class_name": "UNet2DConditionModel",
+  "_diffusers_version": "0.33.1",
+  "_name_or_path": "output_lr1e4/checkpoint-2500",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "attention_type": "default",
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 768,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 8,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "out_channels": 4,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "reverse_transformer_layers_per_block": null,
+  "sample_size": 64,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

checkpoint-4000/unet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b8a533f276154927ce8c96dc3cda05f3ed0ec848f7505a367d2eaeb4ca31265e
+size 3438213624

checkpoint-4500/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7b4c1cc2fa941331bcf6bfc89f743f66bd083adfb374b5a9a7140e6439a7b6eb
+size 6876851924

checkpoint-4500/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:64fd4a0f84ca15706c0d173ef693f48181d7d75f065958f60469626557510e3f
+size 16036

checkpoint-4500/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c053c1662beab785ce3130a131593c5ee64e664223403b2aab6ac3c68b0dd77b
+size 1000

checkpoint-4500/unet/config.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "_class_name": "UNet2DConditionModel",
+  "_diffusers_version": "0.33.1",
+  "_name_or_path": "output_lr1e4/checkpoint-2500",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "attention_type": "default",
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 768,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 8,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "out_channels": 4,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "reverse_transformer_layers_per_block": null,
+  "sample_size": 64,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

checkpoint-4500/unet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5beb5fcecd8e4292270e0413603ad1f9dea4dd232cf9eca6468a5c91b0e7bd53
+size 3438213624

checkpoint-5000/optimizer.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bf58fc4ebd3cbb9a9e75a7a2240a2ff22c8c39c684e9dcfd178fcf87c6a0496a
+size 6876851924

checkpoint-5000/random_states_0.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3861e1bbdafcf900a4a7a794290536117324522f88af73aeb45b40207367ee94
+size 16036

checkpoint-5000/scheduler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ac5722a50941bc1353846f80a544eb191fa869ae625cb63833f25ef78114c2d
+size 1000

checkpoint-5000/unet/config.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "_class_name": "UNet2DConditionModel",
+  "_diffusers_version": "0.33.1",
+  "_name_or_path": "output_lr1e4/checkpoint-2500",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "attention_type": "default",
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "center_input_sample": false,
+  "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": 768,
+  "cross_attention_norm": null,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "dual_cross_attention": false,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "in_channels": 8,
+  "layers_per_block": 2,
+  "mid_block_only_cross_attention": null,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "out_channels": 4,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_out_scale_factor": 1.0,
+  "resnet_skip_time_act": false,
+  "resnet_time_scale_shift": "default",
+  "reverse_transformer_layers_per_block": null,
+  "sample_size": 64,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
+  "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
+  "up_block_types": [
+    "UpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D"
+  ],
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

checkpoint-5000/unet/diffusion_pytorch_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0a20383bd4124af51ebcd7ec195aa7f5ce7f9b604a5ee210d9650fbedfe62908
+size 3438213624

readme.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+前面2500个step是用lr 1e-4 训的，accumulation step = 4，loss持续下降（wandb 23）
+Namespace(adam_beta1=0.9, adam_beta2=0.999, adam_epsilon=1e-08, adam_weight_decay=0.01, allow_tf32=False, cache_dir=None, center_crop=False, checkpointing_steps=500, checkpoints_total_limit=None, conditioning_dropout_prob=None, data_file_records='/home/ach17654gk/code/train_sdxl_gg/metadata.jsonl', dataloader_num_workers=0, dataset_config_name=None, dataset_name=None, edit_prompt_column='text', edited_image_column='conditioning_image', enable_xformers_memory_efficient_attention=False, gradient_accumulation_steps=4, gradient_checkpointing=False, hub_model_id=None, hub_token=None, learning_rate=0.0001, local_rank=2, logging_dir='logs', lr_scheduler='constant', lr_warmup_steps=500, max_grad_norm=1.0, max_train_samples=None, max_train_steps=2500, mixed_precision=None, non_ema_revision=None, num_train_epochs=100, num_validation_images=4, original_image_column='file_name', output_dir='output_lr1e4', pretrained_model_name_or_path='/home/ach17654gk/.cache/huggingface/hub/models--runwayml--stable-diffusion-v1-5/snapshots/451f4fe16113bff5a5d2269ed5ad43b0592e9a14', push_to_hub=True, random_flip=False, report_to='wandb', resolution=512, resume_from_checkpoint='latest', revision=None, scale_lr=False, seed=0, train_batch_size=16, train_data_dir='/home/ach17654gk/download/dataset/DFC/Track_1', use_8bit_adam=False, use_ema=False, val_image_url='/home/ach17654gk/download/dataset/DFC/Track_1/png/rgb_images/TrainArea_1551.png', validation_epochs=1, validation_prompt='A high-resolution synthetic aperture radar (SAR) satellite image, heavy speckle noise, monochrome, moderate contrast, detailed geometric patterns, realistic radar texture, remote sensing style, urban area, distinct linear and rectangular structures', variant=None)
+再用这套参数训2500

unet/config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "_class_name": "UNet2DConditionModel",
   "_diffusers_version": "0.33.1",
-  "_name_or_path": "output_lr1e4/checkpoint-1000",
+  "_name_or_path": "output_lr1e4/checkpoint-2500",
   "act_fn": "silu",
   "addition_embed_type": null,
   "addition_embed_type_num_heads": 64,

unet/diffusion_pytorch_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ca65bf9c3468dc66c753e5ace7eb06c72a867bafee9ad65a18b19aefedd1f44c
+oid sha256:0a20383bd4124af51ebcd7ec195aa7f5ce7f9b604a5ee210d9650fbedfe62908
 size 3438213624