Shahidhasib1014 commited on
Commit
e1753b2
·
verified ·
1 Parent(s): 1df1a1a

Upload 54 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint-30000/optimizer.bin +3 -0
  2. checkpoint-30000/random_states_0.pkl +3 -0
  3. checkpoint-30000/scaler.pt +3 -0
  4. checkpoint-30000/scheduler.bin +3 -0
  5. checkpoint-30000/unet/config.json +68 -0
  6. checkpoint-30000/unet/diffusion_pytorch_model.safetensors +3 -0
  7. feature_extractor/preprocessor_config.json +27 -0
  8. logs/instruct-pix2pix/1745779918.861231/events.out.tfevents.1745779918.mundus-mir-1.325504.1 +3 -0
  9. logs/instruct-pix2pix/1745779918.8683908/hparams.yml +51 -0
  10. logs/instruct-pix2pix/1745781153.0493896/events.out.tfevents.1745781153.mundus-mir-2.648434.1 +3 -0
  11. logs/instruct-pix2pix/1745781153.0559945/hparams.yml +51 -0
  12. logs/instruct-pix2pix/1745783236.7069378/events.out.tfevents.1745783236.mundus-mir-2.650016.1 +3 -0
  13. logs/instruct-pix2pix/1745783236.7138407/hparams.yml +51 -0
  14. logs/instruct-pix2pix/1745784819.9812648/events.out.tfevents.1745784819.mundus-mir-2.650967.1 +3 -0
  15. logs/instruct-pix2pix/1745784819.9881177/hparams.yml +51 -0
  16. logs/instruct-pix2pix/1745784968.139657/events.out.tfevents.1745784968.mundus-mir-3.334708.1 +3 -0
  17. logs/instruct-pix2pix/1745784968.1458905/hparams.yml +51 -0
  18. logs/instruct-pix2pix/1745785770.6922438/events.out.tfevents.1745785770.mundus-mir-2.651552.1 +3 -0
  19. logs/instruct-pix2pix/1745785770.6990857/hparams.yml +51 -0
  20. logs/instruct-pix2pix/1745785929.0347283/events.out.tfevents.1745785929.mundus-mir-2.651753.1 +3 -0
  21. logs/instruct-pix2pix/1745785929.0417445/hparams.yml +51 -0
  22. logs/instruct-pix2pix/1745786073.517925/events.out.tfevents.1745786073.mundus-mir-2.651936.1 +3 -0
  23. logs/instruct-pix2pix/1745786073.5251162/hparams.yml +51 -0
  24. logs/instruct-pix2pix/1745786629.405493/events.out.tfevents.1745786629.mundus-mir-2.652271.1 +3 -0
  25. logs/instruct-pix2pix/1745786629.4116194/hparams.yml +51 -0
  26. logs/instruct-pix2pix/1745787038.5777526/events.out.tfevents.1745787038.mundus-mir-2.652686.1 +3 -0
  27. logs/instruct-pix2pix/1745787038.6061075/hparams.yml +51 -0
  28. logs/instruct-pix2pix/1745787199.0689187/events.out.tfevents.1745787199.mundus-mir-1.330350.1 +3 -0
  29. logs/instruct-pix2pix/1745787199.0821726/hparams.yml +51 -0
  30. logs/instruct-pix2pix/events.out.tfevents.1745779918.mundus-mir-1.325504.0 +3 -0
  31. logs/instruct-pix2pix/events.out.tfevents.1745781153.mundus-mir-2.648434.0 +3 -0
  32. logs/instruct-pix2pix/events.out.tfevents.1745783236.mundus-mir-2.650016.0 +3 -0
  33. logs/instruct-pix2pix/events.out.tfevents.1745784819.mundus-mir-2.650967.0 +3 -0
  34. logs/instruct-pix2pix/events.out.tfevents.1745784968.mundus-mir-3.334708.0 +3 -0
  35. logs/instruct-pix2pix/events.out.tfevents.1745785770.mundus-mir-2.651552.0 +3 -0
  36. logs/instruct-pix2pix/events.out.tfevents.1745785929.mundus-mir-2.651753.0 +3 -0
  37. logs/instruct-pix2pix/events.out.tfevents.1745786073.mundus-mir-2.651936.0 +3 -0
  38. logs/instruct-pix2pix/events.out.tfevents.1745786629.mundus-mir-2.652271.0 +3 -0
  39. logs/instruct-pix2pix/events.out.tfevents.1745787038.mundus-mir-2.652686.0 +3 -0
  40. logs/instruct-pix2pix/events.out.tfevents.1745787199.mundus-mir-1.330350.0 +3 -0
  41. model_index.json +38 -0
  42. safety_checker/config.json +47 -0
  43. safety_checker/model.safetensors +3 -0
  44. scheduler/scheduler_config.json +23 -0
  45. text_encoder/config.json +24 -0
  46. text_encoder/model.safetensors +3 -0
  47. tokenizer/merges.txt +0 -0
  48. tokenizer/special_tokens_map.json +24 -0
  49. tokenizer/tokenizer_config.json +31 -0
  50. tokenizer/vocab.json +0 -0
checkpoint-30000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3fea5c9853b9e0f6f097bb5cd954e9188e919f847123428af60f9f5d69067d9
3
+ size 6876849433
checkpoint-30000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c21adfdd26e212f5a9c47f59077ffffab8a49a5e01ae6040f508db84e9e71fa9
3
+ size 14821
checkpoint-30000/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1eb84867a7e6381d5aebbffe52104a9229cc72d8e4939069c227babf5a29c9f5
3
+ size 1383
checkpoint-30000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:282d8ec55d3e266fc82753c523a4117fdbe735bbcbfeb84caa49aff016f37c4c
3
+ size 1401
checkpoint-30000/unet/config.json ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.34.0.dev0",
4
+ "_name_or_path": "timbrooks/instruct-pix2pix",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": null,
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": null,
9
+ "attention_head_dim": 8,
10
+ "attention_type": "default",
11
+ "block_out_channels": [
12
+ 320,
13
+ 640,
14
+ 1280,
15
+ 1280
16
+ ],
17
+ "center_input_sample": false,
18
+ "class_embed_type": null,
19
+ "class_embeddings_concat": false,
20
+ "conv_in_kernel": 3,
21
+ "conv_out_kernel": 3,
22
+ "cross_attention_dim": 768,
23
+ "cross_attention_norm": null,
24
+ "down_block_types": [
25
+ "CrossAttnDownBlock2D",
26
+ "CrossAttnDownBlock2D",
27
+ "CrossAttnDownBlock2D",
28
+ "DownBlock2D"
29
+ ],
30
+ "downsample_padding": 1,
31
+ "dropout": 0.0,
32
+ "dual_cross_attention": false,
33
+ "encoder_hid_dim": null,
34
+ "encoder_hid_dim_type": null,
35
+ "flip_sin_to_cos": true,
36
+ "freq_shift": 0,
37
+ "in_channels": 8,
38
+ "layers_per_block": 2,
39
+ "mid_block_only_cross_attention": null,
40
+ "mid_block_scale_factor": 1,
41
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
42
+ "norm_eps": 1e-05,
43
+ "norm_num_groups": 32,
44
+ "num_attention_heads": null,
45
+ "num_class_embeds": null,
46
+ "only_cross_attention": false,
47
+ "out_channels": 4,
48
+ "projection_class_embeddings_input_dim": null,
49
+ "resnet_out_scale_factor": 1.0,
50
+ "resnet_skip_time_act": false,
51
+ "resnet_time_scale_shift": "default",
52
+ "reverse_transformer_layers_per_block": null,
53
+ "sample_size": 64,
54
+ "time_cond_proj_dim": null,
55
+ "time_embedding_act_fn": null,
56
+ "time_embedding_dim": null,
57
+ "time_embedding_type": "positional",
58
+ "timestep_post_act": null,
59
+ "transformer_layers_per_block": 1,
60
+ "up_block_types": [
61
+ "UpBlock2D",
62
+ "CrossAttnUpBlock2D",
63
+ "CrossAttnUpBlock2D",
64
+ "CrossAttnUpBlock2D"
65
+ ],
66
+ "upcast_attention": false,
67
+ "use_linear_projection": false
68
+ }
checkpoint-30000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbe7ef9489ce2dec1d202dda94453fc08a5d13aad78913bdc71557a19d3eb769
3
+ size 3438213624
feature_extractor/preprocessor_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 0.48145466,
13
+ 0.4578275,
14
+ 0.40821073
15
+ ],
16
+ "image_processor_type": "CLIPImageProcessor",
17
+ "image_std": [
18
+ 0.26862954,
19
+ 0.26130258,
20
+ 0.27577711
21
+ ],
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "shortest_edge": 224
26
+ }
27
+ }
logs/instruct-pix2pix/1745779918.861231/events.out.tfevents.1745779918.mundus-mir-1.325504.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c62b28e4500ea7017f541047be262d613b0fa9fd7696ae7ebc7acbc9110fe4b
3
+ size 2477
logs/instruct-pix2pix/1745779918.8683908/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745781153.0493896/events.out.tfevents.1745781153.mundus-mir-2.648434.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fdc62f7e76def4522f75a886860d807f00a83fb4d12d7156a8ab8022c822ce2
3
+ size 2477
logs/instruct-pix2pix/1745781153.0559945/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745783236.7069378/events.out.tfevents.1745783236.mundus-mir-2.650016.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abc54acca72e23eb53b73dbd2ffe45297b11e23feee2fc914aa56d097747f812
3
+ size 2477
logs/instruct-pix2pix/1745783236.7138407/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745784819.9812648/events.out.tfevents.1745784819.mundus-mir-2.650967.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d143cbe9c44df4ba89b797d31b28d51f8e298c95f7658825320d1cc305404f90
3
+ size 2477
logs/instruct-pix2pix/1745784819.9881177/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745784968.139657/events.out.tfevents.1745784968.mundus-mir-3.334708.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efc23513f98bc65cf883219d4cd5ea735fa3371b6cbfc402613b459e2d067462
3
+ size 2477
logs/instruct-pix2pix/1745784968.1458905/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745785770.6922438/events.out.tfevents.1745785770.mundus-mir-2.651552.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16ed93bd57c5c8a6ee0e1756a9efa7e66ad86f88d3ee3864e3fe1457a4614a66
3
+ size 2477
logs/instruct-pix2pix/1745785770.6990857/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745785929.0347283/events.out.tfevents.1745785929.mundus-mir-2.651753.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fd5d5f13fe0d15d2cdcef1aed6ddb98bbde72c79a5ac15828637f4f3868a0b7
3
+ size 2477
logs/instruct-pix2pix/1745785929.0417445/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745786073.517925/events.out.tfevents.1745786073.mundus-mir-2.651936.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:467fcf706f0df96133090c0370e2eda8df367a6ed6b6208103c6dc15944d7dbf
3
+ size 2477
logs/instruct-pix2pix/1745786073.5251162/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745786629.405493/events.out.tfevents.1745786629.mundus-mir-2.652271.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1126664d889d87419ac4320703315f8d607723018b8d6f6c538a5538835477ab
3
+ size 2477
logs/instruct-pix2pix/1745786629.4116194/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745787038.5777526/events.out.tfevents.1745787038.mundus-mir-2.652686.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ca0a0288dc020cf239cb009c98c9a95db357800ef08991141241734ff38480
3
+ size 2477
logs/instruct-pix2pix/1745787038.6061075/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/1745787199.0689187/events.out.tfevents.1745787199.mundus-mir-1.330350.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b2f1007bab04d804568c19ae91a61a37f4e66cb01dd40be7c5baf0970fe9737
3
+ size 2477
logs/instruct-pix2pix/1745787199.0821726/hparams.yml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ center_crop: false
8
+ checkpointing_steps: 5000
9
+ checkpoints_total_limit: 1
10
+ conditioning_dropout_prob: 0.05
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ edit_prompt_column: edit_prompt
15
+ edited_image_column: edited_image
16
+ enable_xformers_memory_efficient_attention: false
17
+ gradient_accumulation_steps: 4
18
+ gradient_checkpointing: true
19
+ hub_model_id: null
20
+ hub_token: null
21
+ learning_rate: 5.0e-05
22
+ local_rank: -1
23
+ logging_dir: logs
24
+ lr_scheduler: constant
25
+ lr_warmup_steps: 500
26
+ max_grad_norm: 1.0
27
+ max_train_samples: null
28
+ max_train_steps: 30000
29
+ mixed_precision: fp16
30
+ non_ema_revision: null
31
+ num_train_epochs: 477
32
+ num_validation_images: 4
33
+ original_image_column: original_image
34
+ output_dir: instruct-pix2pix-model
35
+ pretrained_model_name_or_path: timbrooks/instruct-pix2pix
36
+ push_to_hub: true
37
+ random_flip: true
38
+ report_to: tensorboard
39
+ resolution: 256
40
+ resume_from_checkpoint: null
41
+ revision: null
42
+ scale_lr: false
43
+ seed: 42
44
+ train_batch_size: 4
45
+ train_data_dir: /home/mundus/shasib158/.ssh/diffusers/examples/instruct_pix2pix/reach_target_250
46
+ use_8bit_adam: false
47
+ use_ema: false
48
+ val_image_url: null
49
+ validation_epochs: 1
50
+ validation_prompt: null
51
+ variant: null
logs/instruct-pix2pix/events.out.tfevents.1745779918.mundus-mir-1.325504.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39fe6505c7618dcbb840f5e97f646b9a1c570d295b2555ea48a2cb0d86ad0efe
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745781153.mundus-mir-2.648434.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07970fe44505b6cca8524f9931582658103e3f55ad586d82acf34ff7ef445e87
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745783236.mundus-mir-2.650016.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cc6693f9db34cdb520eff471ae8892fef586fe55e37f1d3ba732179bb57d573
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745784819.mundus-mir-2.650967.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52396943cc85b56bed9b7822c9dbf36199b33f1481df2ab3728cf484833acad0
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745784968.mundus-mir-3.334708.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8728cf3d01cfd92a0b2e290db8d2e0b787b54e044b57dad842382c4351c4495c
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745785770.mundus-mir-2.651552.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7eb9b1fdb6523e48a154b76076ccf937d226e3da549b8157ed9988b57d948136
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745785929.mundus-mir-2.651753.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39130b3045ddcee179f233b4ea36a8e593777af64daf3b91a0f72a54828ae26f
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745786073.mundus-mir-2.651936.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dbbe46d6fb6c6166e69f10cf15944d63637ea616634aef5706ecff3ba019a06
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745786629.mundus-mir-2.652271.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92d0bd071cb972f67116a9268b62f550e7645515cf76075a2b6be71760561d2c
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745787038.mundus-mir-2.652686.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:688d90c7096e87fa2a4863cd3a31ccd26231c309c3beebf4041d2fdb50141459
3
+ size 88
logs/instruct-pix2pix/events.out.tfevents.1745787199.mundus-mir-1.330350.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c84cb877dc9be29313f8d379dec7a2c46159bdc9554483f1f8e9592c704024f
3
+ size 88
model_index.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "StableDiffusionInstructPix2PixPipeline",
3
+ "_diffusers_version": "0.34.0.dev0",
4
+ "_name_or_path": "timbrooks/instruct-pix2pix",
5
+ "feature_extractor": [
6
+ "transformers",
7
+ "CLIPImageProcessor"
8
+ ],
9
+ "image_encoder": [
10
+ null,
11
+ null
12
+ ],
13
+ "requires_safety_checker": false,
14
+ "safety_checker": [
15
+ "stable_diffusion",
16
+ "StableDiffusionSafetyChecker"
17
+ ],
18
+ "scheduler": [
19
+ "diffusers",
20
+ "EulerAncestralDiscreteScheduler"
21
+ ],
22
+ "text_encoder": [
23
+ "transformers",
24
+ "CLIPTextModel"
25
+ ],
26
+ "tokenizer": [
27
+ "transformers",
28
+ "CLIPTokenizer"
29
+ ],
30
+ "unet": [
31
+ "diffusers",
32
+ "UNet2DConditionModel"
33
+ ],
34
+ "vae": [
35
+ "diffusers",
36
+ "AutoencoderKL"
37
+ ]
38
+ }
safety_checker/config.json ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "StableDiffusionSafetyChecker"
4
+ ],
5
+ "initializer_factor": 1.0,
6
+ "logit_scale_init_value": 2.6592,
7
+ "model_type": "clip",
8
+ "projection_dim": 768,
9
+ "text_config": {
10
+ "attention_dropout": 0.0,
11
+ "dropout": 0.0,
12
+ "hidden_act": "quick_gelu",
13
+ "hidden_size": 768,
14
+ "initializer_factor": 1.0,
15
+ "initializer_range": 0.02,
16
+ "intermediate_size": 3072,
17
+ "layer_norm_eps": 1e-05,
18
+ "max_position_embeddings": 77,
19
+ "model_type": "clip_text_model",
20
+ "num_attention_heads": 12,
21
+ "num_hidden_layers": 12,
22
+ "projection_dim": 512,
23
+ "torch_dtype": "float16",
24
+ "vocab_size": 49408
25
+ },
26
+ "torch_dtype": "float16",
27
+ "transformers_version": "4.51.3",
28
+ "vision_config": {
29
+ "_attn_implementation_autoset": true,
30
+ "attention_dropout": 0.0,
31
+ "dropout": 0.0,
32
+ "hidden_act": "quick_gelu",
33
+ "hidden_size": 1024,
34
+ "image_size": 224,
35
+ "initializer_factor": 1.0,
36
+ "initializer_range": 0.02,
37
+ "intermediate_size": 4096,
38
+ "layer_norm_eps": 1e-05,
39
+ "model_type": "clip_vision_model",
40
+ "num_attention_heads": 16,
41
+ "num_channels": 3,
42
+ "num_hidden_layers": 24,
43
+ "patch_size": 14,
44
+ "projection_dim": 512,
45
+ "torch_dtype": "float16"
46
+ }
47
+ }
safety_checker/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57ecdfa243b170f9b4cb3eefaf0f64552ef78fc0bf0eb1c5b9675308447184f6
3
+ size 608016280
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "EulerAncestralDiscreteScheduler",
3
+ "_diffusers_version": "0.34.0.dev0",
4
+ "algorithm_type": "dpmsolver++",
5
+ "beta_end": 0.012,
6
+ "beta_schedule": "scaled_linear",
7
+ "beta_start": 0.00085,
8
+ "clip_sample": false,
9
+ "dynamic_thresholding_ratio": 0.995,
10
+ "lower_order_final": true,
11
+ "num_train_timesteps": 1000,
12
+ "prediction_type": "epsilon",
13
+ "rescale_betas_zero_snr": false,
14
+ "sample_max_value": 1.0,
15
+ "set_alpha_to_one": false,
16
+ "skip_prk_steps": true,
17
+ "solver_order": 2,
18
+ "solver_type": "midpoint",
19
+ "steps_offset": 1,
20
+ "thresholding": false,
21
+ "timestep_spacing": "linspace",
22
+ "trained_betas": null
23
+ }
text_encoder/config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CLIPTextModel"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 0,
7
+ "dropout": 0.0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "quick_gelu",
10
+ "hidden_size": 768,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 77,
16
+ "model_type": "clip_text_model",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 1,
20
+ "projection_dim": 768,
21
+ "torch_dtype": "float16",
22
+ "transformers_version": "4.51.3",
23
+ "vocab_size": 49408
24
+ }
text_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:660c6f5b1abae9dc498ac2d21e1347d2abdb0cf6c0c0c8576cd796491d9a6cdd
3
+ size 246144152
tokenizer/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<|endoftext|>",
17
+ "unk_token": {
18
+ "content": "<|endoftext|>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "49406": {
5
+ "content": "<|startoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "49407": {
13
+ "content": "<|endoftext|>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ }
20
+ },
21
+ "bos_token": "<|startoftext|>",
22
+ "clean_up_tokenization_spaces": false,
23
+ "do_lower_case": true,
24
+ "eos_token": "<|endoftext|>",
25
+ "errors": "replace",
26
+ "extra_special_tokens": {},
27
+ "model_max_length": 77,
28
+ "pad_token": "<|endoftext|>",
29
+ "tokenizer_class": "CLIPTokenizer",
30
+ "unk_token": "<|endoftext|>"
31
+ }
tokenizer/vocab.json ADDED
The diff for this file is too large to render. See raw diff