End of training
Browse files. This view is limited to 50 files because it contains too many changes. See raw diff
- README.md +39 -0
- checkpoint-1000/model.safetensors +3 -0
- checkpoint-1000/optimizer.bin +3 -0
- checkpoint-1000/random_states_0.pkl +3 -0
- checkpoint-1000/scheduler.bin +3 -0
- checkpoint-1500/model.safetensors +3 -0
- checkpoint-1500/optimizer.bin +3 -0
- checkpoint-1500/random_states_0.pkl +3 -0
- checkpoint-1500/scheduler.bin +3 -0
- checkpoint-2000/model.safetensors +3 -0
- checkpoint-2000/optimizer.bin +3 -0
- checkpoint-2000/random_states_0.pkl +3 -0
- checkpoint-2000/scheduler.bin +3 -0
- checkpoint-2500/model.safetensors +3 -0
- checkpoint-2500/optimizer.bin +3 -0
- checkpoint-2500/random_states_0.pkl +3 -0
- checkpoint-2500/scheduler.bin +3 -0
- checkpoint-3000/model.safetensors +3 -0
- checkpoint-3000/optimizer.bin +3 -0
- checkpoint-3000/random_states_0.pkl +3 -0
- checkpoint-3000/scheduler.bin +3 -0
- checkpoint-500/model.safetensors +3 -0
- checkpoint-500/optimizer.bin +3 -0
- checkpoint-500/random_states_0.pkl +3 -0
- checkpoint-500/scheduler.bin +3 -0
- feature_extractor/preprocessor_config.json +27 -0
- learned_embeds-steps-1000.safetensors +3 -0
- learned_embeds-steps-1500.safetensors +3 -0
- learned_embeds-steps-2000.safetensors +3 -0
- learned_embeds-steps-2500.safetensors +3 -0
- learned_embeds-steps-3000.safetensors +3 -0
- learned_embeds-steps-500.safetensors +3 -0
- learned_embeds.safetensors +3 -0
- logs/textual_inversion/1748332987.9312513/events.out.tfevents.1748332987.966fbf330007.5423.1 +3 -0
- logs/textual_inversion/1748332987.9338686/hparams.yml +48 -0
- logs/textual_inversion/1748333078.598716/events.out.tfevents.1748333078.966fbf330007.5518.1 +3 -0
- logs/textual_inversion/1748333078.6014333/hparams.yml +48 -0
- logs/textual_inversion/events.out.tfevents.1748332987.966fbf330007.5423.0 +3 -0
- logs/textual_inversion/events.out.tfevents.1748333078.966fbf330007.5518.0 +3 -0
- model_index.json +38 -0
- safety_checker/config.json +46 -0
- safety_checker/model.safetensors +3 -0
- scheduler/scheduler_config.json +15 -0
- text_encoder/config.json +24 -0
- text_encoder/model.safetensors +3 -0
- tokenizer/added_tokens.json +3 -0
- tokenizer/merges.txt +0 -0
- tokenizer/special_tokens_map.json +24 -0
- tokenizer/tokenizer_config.json +39 -0
- tokenizer/vocab.json +0 -0
README.md
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
base_model: stable-diffusion-v1-5/stable-diffusion-v1-5
|
| 3 |
+
library_name: diffusers
|
| 4 |
+
license: creativeml-openrail-m
|
| 5 |
+
inference: true
|
| 6 |
+
tags:
|
| 7 |
+
- stable-diffusion
|
| 8 |
+
- stable-diffusion-diffusers
|
| 9 |
+
- text-to-image
|
| 10 |
+
- diffusers
|
| 11 |
+
- textual_inversion
|
| 12 |
+
- diffusers-training
|
| 13 |
+
---
|
| 14 |
+
|
| 15 |
+
<!-- This model card has been generated automatically according to the information the training script had access to. You
|
| 16 |
+
should probably proofread and complete it, then remove this comment. -->
|
| 17 |
+
|
| 18 |
+
|
| 19 |
+
# Textual inversion text2image fine-tuning - ycxyork/textual_inversion_cat
|
| 20 |
+
These are textual inversion adaptation weights for stable-diffusion-v1-5/stable-diffusion-v1-5. Some example images are shown below.
|
| 21 |
+
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
|
| 25 |
+
## Intended uses & limitations
|
| 26 |
+
|
| 27 |
+
#### How to use
|
| 28 |
+
|
| 29 |
+
```python
|
| 30 |
+
# TODO: add an example code snippet for running this diffusion pipeline
|
| 31 |
+
```
|
| 32 |
+
|
| 33 |
+
#### Limitations and bias
|
| 34 |
+
|
| 35 |
+
[TODO: provide examples of latent issues and potential remediations]
|
| 36 |
+
|
| 37 |
+
## Training details
|
| 38 |
+
|
| 39 |
+
[TODO: describe the data used to train the model]
|
checkpoint-1000/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d2e36b38cf55ad64e308ef6d70777905b6169bc29e7e6d7bba181509e0b9cae
|
| 3 |
+
size 492268240
|
checkpoint-1000/optimizer.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ea4a6d47e4986949425c8c9f4bd8989012e019c70db41106074925bc425a7d3
|
| 3 |
+
size 303571379
|
checkpoint-1000/random_states_0.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b25a0938a541fea2a44a495f48b697949cb26bf454eaa1174da70f0f258370ed
|
| 3 |
+
size 14757
|
checkpoint-1000/scheduler.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0141b8816d005ab0155e12076591b358b17b434b820ffd19fcb751fd3577ab0
|
| 3 |
+
size 1401
|
checkpoint-1500/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02fe4a93361732436cbad55762df138a5e650bb7b8cfe2d9c984754c34a21a78
|
| 3 |
+
size 492268240
|
checkpoint-1500/optimizer.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d215d9219667bbb123ed2886576cf4c3082d04cb34f7de61d1976ac306eb9742
|
| 3 |
+
size 303571379
|
checkpoint-1500/random_states_0.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df94cbcc8ddfb64f910bbba8a3cf29a8e97767ecfda7c48b9e6317423d2f2a86
|
| 3 |
+
size 14821
|
checkpoint-1500/scheduler.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2f6de1f1aad4955373863105fea43996909135ab11a05f69f664002caa7f655
|
| 3 |
+
size 1401
|
checkpoint-2000/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd1a19bcbb11c1a8674b5c8e57bad37654f8eb668d0fd147b3757882e390deed
|
| 3 |
+
size 492268240
|
checkpoint-2000/optimizer.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2e858136df12c1f7059763a88e4ff5554a8c7db4323a10923cca769f5191386
|
| 3 |
+
size 303571379
|
checkpoint-2000/random_states_0.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb9ce4ca6621c1ce4981077e5b0a22462f2c8611e1ca2b935701481654095387
|
| 3 |
+
size 14821
|
checkpoint-2000/scheduler.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db8705e68e3f5d10b2093eb04409445a51eaa0fa537855f68bbff49f7ba03b3f
|
| 3 |
+
size 1401
|
checkpoint-2500/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20544149ba78dc85028edc80e40eb748dbb051614a548fe9868ec13cd5a19d1b
|
| 3 |
+
size 492268240
|
checkpoint-2500/optimizer.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:353a28b4aa1f6d4ee1e1729121176237f8e3e7bfb3804792ccc32fe743ebed83
|
| 3 |
+
size 303571379
|
checkpoint-2500/random_states_0.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cdf89698ccb2e744f71651fecea4c0a212208c614eecb666edf9fc37c4468d93
|
| 3 |
+
size 14757
|
checkpoint-2500/scheduler.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:328b872afc2dde919bcdc05a2f15ee9a6c2c722dc09e791a74e330c511dff2d7
|
| 3 |
+
size 1401
|
checkpoint-3000/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4f0466c7f7abdf33eb02651635485d5fdf1efe8e549c5e96b1a2cb0114b7b59
|
| 3 |
+
size 492268240
|
checkpoint-3000/optimizer.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c71376b2a09419509c97a31884ba3856ae3b69c00db8906b2e0e256259d73393
|
| 3 |
+
size 303571379
|
checkpoint-3000/random_states_0.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9280134662aa5b1f108a83e81da5cd7faa0e4bc119be97c12570f7aa993a2b86
|
| 3 |
+
size 14821
|
checkpoint-3000/scheduler.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f598def469aca44a1bf0b4394561a0be098ee257cabc03a28986894010b3775
|
| 3 |
+
size 1401
|
checkpoint-500/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33d6121f84ceb7d7dad3eef9b115d3a7833c8a9fde020210530e84027c55179d
|
| 3 |
+
size 492268240
|
checkpoint-500/optimizer.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0101d6e6ca6e8d215f82b42d226ac2d69c1f931428946cd12bd97591e7184d97
|
| 3 |
+
size 303571379
|
checkpoint-500/random_states_0.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:959ce2231bbdf89ef3c5fe744f892a1837575b6d3b44c9934ac5c13c665241d1
|
| 3 |
+
size 14757
|
checkpoint-500/scheduler.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee04579db6cf5d822fbf73f3441ac1670faf4a79ec5c320d39b5a697e8102112
|
| 3 |
+
size 1401
|
feature_extractor/preprocessor_config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"crop_size": {
|
| 3 |
+
"height": 224,
|
| 4 |
+
"width": 224
|
| 5 |
+
},
|
| 6 |
+
"do_center_crop": true,
|
| 7 |
+
"do_convert_rgb": true,
|
| 8 |
+
"do_normalize": true,
|
| 9 |
+
"do_rescale": true,
|
| 10 |
+
"do_resize": true,
|
| 11 |
+
"image_mean": [
|
| 12 |
+
0.48145466,
|
| 13 |
+
0.4578275,
|
| 14 |
+
0.40821073
|
| 15 |
+
],
|
| 16 |
+
"image_processor_type": "CLIPImageProcessor",
|
| 17 |
+
"image_std": [
|
| 18 |
+
0.26862954,
|
| 19 |
+
0.26130258,
|
| 20 |
+
0.27577711
|
| 21 |
+
],
|
| 22 |
+
"resample": 3,
|
| 23 |
+
"rescale_factor": 0.00392156862745098,
|
| 24 |
+
"size": {
|
| 25 |
+
"shortest_edge": 224
|
| 26 |
+
}
|
| 27 |
+
}
|
learned_embeds-steps-1000.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc16b82b4bdc2f52d51d6f853a1cb294f3545d05c09ea798530719b8478ef507
|
| 3 |
+
size 3184
|
learned_embeds-steps-1500.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d542fd6e71070ac7d2bed3872c43ca348d1de2388df8e19610101b0db0ef1fe
|
| 3 |
+
size 3184
|
learned_embeds-steps-2000.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99a2a32e0bfd11bdebb82f1528fafb92f355eba50fb7893ea2cf31d393ea0b5f
|
| 3 |
+
size 3184
|
learned_embeds-steps-2500.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ecc5b326eec381fa44a25e3d1489a1c94e5901d2f5b13731c4b61d0b09b38247
|
| 3 |
+
size 3184
|
learned_embeds-steps-3000.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:173347e7dbba556160eda7aed58800d251f85d62651023c694ce4c66036cd57e
|
| 3 |
+
size 3184
|
learned_embeds-steps-500.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a627af1ea99d96dcc3c3b607dc0ea2b2a62c5ff434c38daeb6fb4e07e5d3641
|
| 3 |
+
size 3184
|
learned_embeds.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:173347e7dbba556160eda7aed58800d251f85d62651023c694ce4c66036cd57e
|
| 3 |
+
size 3184
|
logs/textual_inversion/1748332987.9312513/events.out.tfevents.1748332987.966fbf330007.5423.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf0b55c533020a2a50f87936f8ce67e34b25d4e91797c04d797f870c46af8b20
|
| 3 |
+
size 2336
|
logs/textual_inversion/1748332987.9338686/hparams.yml
ADDED
|
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
adam_beta1: 0.9
|
| 2 |
+
adam_beta2: 0.999
|
| 3 |
+
adam_epsilon: 1.0e-08
|
| 4 |
+
adam_weight_decay: 0.01
|
| 5 |
+
allow_tf32: false
|
| 6 |
+
center_crop: false
|
| 7 |
+
checkpointing_steps: 500
|
| 8 |
+
checkpoints_total_limit: null
|
| 9 |
+
dataloader_num_workers: 0
|
| 10 |
+
enable_xformers_memory_efficient_attention: false
|
| 11 |
+
gradient_accumulation_steps: 4
|
| 12 |
+
gradient_checkpointing: false
|
| 13 |
+
hub_model_id: null
|
| 14 |
+
hub_token: null
|
| 15 |
+
initializer_token: toy
|
| 16 |
+
learnable_property: object
|
| 17 |
+
learning_rate: 0.002
|
| 18 |
+
local_rank: -1
|
| 19 |
+
logging_dir: logs
|
| 20 |
+
lr_num_cycles: 1
|
| 21 |
+
lr_scheduler: constant
|
| 22 |
+
lr_warmup_steps: 0
|
| 23 |
+
max_train_steps: 3000
|
| 24 |
+
mixed_precision: 'no'
|
| 25 |
+
no_safe_serialization: false
|
| 26 |
+
num_train_epochs: 18
|
| 27 |
+
num_validation_images: 4
|
| 28 |
+
num_vectors: 1
|
| 29 |
+
output_dir: textual_inversion_cat
|
| 30 |
+
placeholder_token: <cat-toy>
|
| 31 |
+
pretrained_model_name_or_path: stable-diffusion-v1-5/stable-diffusion-v1-5
|
| 32 |
+
push_to_hub: true
|
| 33 |
+
repeats: 100
|
| 34 |
+
report_to: tensorboard
|
| 35 |
+
resolution: 512
|
| 36 |
+
resume_from_checkpoint: null
|
| 37 |
+
revision: null
|
| 38 |
+
save_as_full_pipeline: false
|
| 39 |
+
save_steps: 500
|
| 40 |
+
scale_lr: true
|
| 41 |
+
seed: null
|
| 42 |
+
tokenizer_name: null
|
| 43 |
+
train_batch_size: 1
|
| 44 |
+
train_data_dir: ./cat
|
| 45 |
+
validation_epochs: null
|
| 46 |
+
validation_prompt: null
|
| 47 |
+
validation_steps: 100
|
| 48 |
+
variant: null
|
logs/textual_inversion/1748333078.598716/events.out.tfevents.1748333078.966fbf330007.5518.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8fb4f42d4fca30f53766c6a61ec45c4f90795aa002ea25c33df3c66d6868e6c1
|
| 3 |
+
size 2336
|
logs/textual_inversion/1748333078.6014333/hparams.yml
ADDED
|
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
adam_beta1: 0.9
|
| 2 |
+
adam_beta2: 0.999
|
| 3 |
+
adam_epsilon: 1.0e-08
|
| 4 |
+
adam_weight_decay: 0.01
|
| 5 |
+
allow_tf32: false
|
| 6 |
+
center_crop: false
|
| 7 |
+
checkpointing_steps: 500
|
| 8 |
+
checkpoints_total_limit: null
|
| 9 |
+
dataloader_num_workers: 0
|
| 10 |
+
enable_xformers_memory_efficient_attention: false
|
| 11 |
+
gradient_accumulation_steps: 4
|
| 12 |
+
gradient_checkpointing: false
|
| 13 |
+
hub_model_id: null
|
| 14 |
+
hub_token: null
|
| 15 |
+
initializer_token: toy
|
| 16 |
+
learnable_property: object
|
| 17 |
+
learning_rate: 0.002
|
| 18 |
+
local_rank: -1
|
| 19 |
+
logging_dir: logs
|
| 20 |
+
lr_num_cycles: 1
|
| 21 |
+
lr_scheduler: constant
|
| 22 |
+
lr_warmup_steps: 0
|
| 23 |
+
max_train_steps: 3000
|
| 24 |
+
mixed_precision: 'no'
|
| 25 |
+
no_safe_serialization: false
|
| 26 |
+
num_train_epochs: 20
|
| 27 |
+
num_validation_images: 4
|
| 28 |
+
num_vectors: 1
|
| 29 |
+
output_dir: textual_inversion_cat
|
| 30 |
+
placeholder_token: <cat-toy>
|
| 31 |
+
pretrained_model_name_or_path: stable-diffusion-v1-5/stable-diffusion-v1-5
|
| 32 |
+
push_to_hub: true
|
| 33 |
+
repeats: 100
|
| 34 |
+
report_to: tensorboard
|
| 35 |
+
resolution: 512
|
| 36 |
+
resume_from_checkpoint: null
|
| 37 |
+
revision: null
|
| 38 |
+
save_as_full_pipeline: false
|
| 39 |
+
save_steps: 500
|
| 40 |
+
scale_lr: true
|
| 41 |
+
seed: null
|
| 42 |
+
tokenizer_name: null
|
| 43 |
+
train_batch_size: 1
|
| 44 |
+
train_data_dir: ./cat
|
| 45 |
+
validation_epochs: null
|
| 46 |
+
validation_prompt: null
|
| 47 |
+
validation_steps: 100
|
| 48 |
+
variant: null
|
logs/textual_inversion/events.out.tfevents.1748332987.966fbf330007.5423.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:112821b810cb8b1b59bcad6a3b0221883874aadd2dc9facbd5d2e06134de0ae3
|
| 3 |
+
size 88
|
logs/textual_inversion/events.out.tfevents.1748333078.966fbf330007.5518.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23a472daeea5b5dcba1c0fa64a673d3938eefe532ac1593884ea8af824fe1f15
|
| 3 |
+
size 1007054
|
model_index.json
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "StableDiffusionPipeline",
|
| 3 |
+
"_diffusers_version": "0.34.0.dev0",
|
| 4 |
+
"_name_or_path": "stable-diffusion-v1-5/stable-diffusion-v1-5",
|
| 5 |
+
"feature_extractor": [
|
| 6 |
+
"transformers",
|
| 7 |
+
"CLIPImageProcessor"
|
| 8 |
+
],
|
| 9 |
+
"image_encoder": [
|
| 10 |
+
null,
|
| 11 |
+
null
|
| 12 |
+
],
|
| 13 |
+
"requires_safety_checker": true,
|
| 14 |
+
"safety_checker": [
|
| 15 |
+
"stable_diffusion",
|
| 16 |
+
"StableDiffusionSafetyChecker"
|
| 17 |
+
],
|
| 18 |
+
"scheduler": [
|
| 19 |
+
"diffusers",
|
| 20 |
+
"PNDMScheduler"
|
| 21 |
+
],
|
| 22 |
+
"text_encoder": [
|
| 23 |
+
"transformers",
|
| 24 |
+
"CLIPTextModel"
|
| 25 |
+
],
|
| 26 |
+
"tokenizer": [
|
| 27 |
+
"transformers",
|
| 28 |
+
"CLIPTokenizer"
|
| 29 |
+
],
|
| 30 |
+
"unet": [
|
| 31 |
+
"diffusers",
|
| 32 |
+
"UNet2DConditionModel"
|
| 33 |
+
],
|
| 34 |
+
"vae": [
|
| 35 |
+
"diffusers",
|
| 36 |
+
"AutoencoderKL"
|
| 37 |
+
]
|
| 38 |
+
}
|
safety_checker/config.json
ADDED
|
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"StableDiffusionSafetyChecker"
|
| 4 |
+
],
|
| 5 |
+
"initializer_factor": 1.0,
|
| 6 |
+
"logit_scale_init_value": 2.6592,
|
| 7 |
+
"model_type": "clip",
|
| 8 |
+
"projection_dim": 768,
|
| 9 |
+
"text_config": {
|
| 10 |
+
"attention_dropout": 0.0,
|
| 11 |
+
"dropout": 0.0,
|
| 12 |
+
"hidden_act": "quick_gelu",
|
| 13 |
+
"hidden_size": 768,
|
| 14 |
+
"initializer_factor": 1.0,
|
| 15 |
+
"initializer_range": 0.02,
|
| 16 |
+
"intermediate_size": 3072,
|
| 17 |
+
"layer_norm_eps": 1e-05,
|
| 18 |
+
"max_position_embeddings": 77,
|
| 19 |
+
"model_type": "clip_text_model",
|
| 20 |
+
"num_attention_heads": 12,
|
| 21 |
+
"num_hidden_layers": 12,
|
| 22 |
+
"projection_dim": 512,
|
| 23 |
+
"torch_dtype": "float32",
|
| 24 |
+
"vocab_size": 49408
|
| 25 |
+
},
|
| 26 |
+
"torch_dtype": "float32",
|
| 27 |
+
"transformers_version": "4.52.3",
|
| 28 |
+
"vision_config": {
|
| 29 |
+
"attention_dropout": 0.0,
|
| 30 |
+
"dropout": 0.0,
|
| 31 |
+
"hidden_act": "quick_gelu",
|
| 32 |
+
"hidden_size": 1024,
|
| 33 |
+
"image_size": 224,
|
| 34 |
+
"initializer_factor": 1.0,
|
| 35 |
+
"initializer_range": 0.02,
|
| 36 |
+
"intermediate_size": 4096,
|
| 37 |
+
"layer_norm_eps": 1e-05,
|
| 38 |
+
"model_type": "clip_vision_model",
|
| 39 |
+
"num_attention_heads": 16,
|
| 40 |
+
"num_channels": 3,
|
| 41 |
+
"num_hidden_layers": 24,
|
| 42 |
+
"patch_size": 14,
|
| 43 |
+
"projection_dim": 512,
|
| 44 |
+
"torch_dtype": "float32"
|
| 45 |
+
}
|
| 46 |
+
}
|
safety_checker/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb351a5ded815c3ff744968ad9c6b218d071b9d313d04f35e813b84b4c0ffde8
|
| 3 |
+
size 1215979664
|
scheduler/scheduler_config.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "PNDMScheduler",
|
| 3 |
+
"_diffusers_version": "0.34.0.dev0",
|
| 4 |
+
"beta_end": 0.012,
|
| 5 |
+
"beta_schedule": "scaled_linear",
|
| 6 |
+
"beta_start": 0.00085,
|
| 7 |
+
"clip_sample": false,
|
| 8 |
+
"num_train_timesteps": 1000,
|
| 9 |
+
"prediction_type": "epsilon",
|
| 10 |
+
"set_alpha_to_one": false,
|
| 11 |
+
"skip_prk_steps": true,
|
| 12 |
+
"steps_offset": 1,
|
| 13 |
+
"timestep_spacing": "leading",
|
| 14 |
+
"trained_betas": null
|
| 15 |
+
}
|
text_encoder/config.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"CLIPTextModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_dropout": 0.0,
|
| 6 |
+
"bos_token_id": 0,
|
| 7 |
+
"dropout": 0.0,
|
| 8 |
+
"eos_token_id": 2,
|
| 9 |
+
"hidden_act": "quick_gelu",
|
| 10 |
+
"hidden_size": 768,
|
| 11 |
+
"initializer_factor": 1.0,
|
| 12 |
+
"initializer_range": 0.02,
|
| 13 |
+
"intermediate_size": 3072,
|
| 14 |
+
"layer_norm_eps": 1e-05,
|
| 15 |
+
"max_position_embeddings": 77,
|
| 16 |
+
"model_type": "clip_text_model",
|
| 17 |
+
"num_attention_heads": 12,
|
| 18 |
+
"num_hidden_layers": 12,
|
| 19 |
+
"pad_token_id": 1,
|
| 20 |
+
"projection_dim": 768,
|
| 21 |
+
"torch_dtype": "float32",
|
| 22 |
+
"transformers_version": "4.52.3",
|
| 23 |
+
"vocab_size": 49409
|
| 24 |
+
}
|
text_encoder/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4f0466c7f7abdf33eb02651635485d5fdf1efe8e549c5e96b1a2cb0114b7b59
|
| 3 |
+
size 492268240
|
tokenizer/added_tokens.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"<cat-toy>": 49408
|
| 3 |
+
}
|
tokenizer/merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer/special_tokens_map.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<|startoftext|>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": true,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"eos_token": {
|
| 10 |
+
"content": "<|endoftext|>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": true,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": "<|endoftext|>",
|
| 17 |
+
"unk_token": {
|
| 18 |
+
"content": "<|endoftext|>",
|
| 19 |
+
"lstrip": false,
|
| 20 |
+
"normalized": true,
|
| 21 |
+
"rstrip": false,
|
| 22 |
+
"single_word": false
|
| 23 |
+
}
|
| 24 |
+
}
|
tokenizer/tokenizer_config.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"added_tokens_decoder": {
|
| 4 |
+
"49406": {
|
| 5 |
+
"content": "<|startoftext|>",
|
| 6 |
+
"lstrip": false,
|
| 7 |
+
"normalized": true,
|
| 8 |
+
"rstrip": false,
|
| 9 |
+
"single_word": false,
|
| 10 |
+
"special": true
|
| 11 |
+
},
|
| 12 |
+
"49407": {
|
| 13 |
+
"content": "<|endoftext|>",
|
| 14 |
+
"lstrip": false,
|
| 15 |
+
"normalized": true,
|
| 16 |
+
"rstrip": false,
|
| 17 |
+
"single_word": false,
|
| 18 |
+
"special": true
|
| 19 |
+
},
|
| 20 |
+
"49408": {
|
| 21 |
+
"content": "<cat-toy>",
|
| 22 |
+
"lstrip": false,
|
| 23 |
+
"normalized": true,
|
| 24 |
+
"rstrip": false,
|
| 25 |
+
"single_word": false,
|
| 26 |
+
"special": false
|
| 27 |
+
}
|
| 28 |
+
},
|
| 29 |
+
"bos_token": "<|startoftext|>",
|
| 30 |
+
"clean_up_tokenization_spaces": false,
|
| 31 |
+
"do_lower_case": true,
|
| 32 |
+
"eos_token": "<|endoftext|>",
|
| 33 |
+
"errors": "replace",
|
| 34 |
+
"extra_special_tokens": {},
|
| 35 |
+
"model_max_length": 77,
|
| 36 |
+
"pad_token": "<|endoftext|>",
|
| 37 |
+
"tokenizer_class": "CLIPTokenizer",
|
| 38 |
+
"unk_token": "<|endoftext|>"
|
| 39 |
+
}
|
tokenizer/vocab.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|