Shangy committed on
Commit
348024f
·
verified ·
1 Parent(s): 5a45c90

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ trainer_state.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_gradient_checkpointing": false,
3
+ "architectures": [
4
+ "MetaQuery"
5
+ ],
6
+ "attn_implementation": null,
7
+ "connector_num_hidden_layers": 24,
8
+ "diffusion_model_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers",
9
+ "discard_mllm_image_feature": false,
10
+ "dtype": "bfloat16",
11
+ "in_channels": 32,
12
+ "input_size": [
13
+ 15,
14
+ 20
15
+ ],
16
+ "loss_type": "flow",
17
+ "max_input_text_tokens": 256,
18
+ "max_pixels": 1003520,
19
+ "min_pixels": 200740,
20
+ "mllm_id": "google/gemma-2-2b-it",
21
+ "model_type": "metaquery",
22
+ "modules_to_freeze": [
23
+ "vae",
24
+ "model.mllm_backbone"
25
+ ],
26
+ "modules_to_unfreeze": [],
27
+ "noise_scheduler_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers",
28
+ "num_metaqueries": 64,
29
+ "scheduler_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers",
30
+ "source_vae_feature": true,
31
+ "system_prompt": "You are a robot and should focus on your actions. Generate a new image that meets the user's instruction while maintaining consistency with the original input where appropriate.",
32
+ "transformers_version": "4.57.1",
33
+ "vae_downsample_f": 32,
34
+ "vae_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers"
35
+ }
model-00001-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05824b40b9a35b84ae84598a480e3b41b9ae4cb85f3d8a75b9f0ef7926556c02
3
+ size 4988031160
model-00002-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:701c39a5e803f6c935df026a062ada69c4196051f81f03e54ab79c9273efcfb0
3
+ size 4999985168
model-00003-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:161c4d8f4d1d8e5aeb2c716be661e42bc686b64c538eacdce457d67b328d3db2
3
+ size 253880566
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4267103928e8e19ffea1f0e40493c2b911c356deffd9bda6a337638dd04e8c69
3
+ size 12408484