zhuoyang20 committed on
Commit
7a03dc4
·
verified ·
1 Parent(s): 6ae1e45

Upload folder using huggingface_hub

Browse files
config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_gradient_checkpointing": false,
3
+ "architectures": [
4
+ "MetaQuery"
5
+ ],
6
+ "attn_implementation": null,
7
+ "connector_num_hidden_layers": 24,
8
+ "diffusion_model_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers",
9
+ "discard_mllm_image_feature": false,
10
+ "dtype": "bfloat16",
11
+ "in_channels": 32,
12
+ "input_size": [
13
+ 20,
14
+ 15
15
+ ],
16
+ "loss_type": "flow",
17
+ "max_input_text_tokens": 256,
18
+ "max_pixels": 1003520,
19
+ "min_pixels": 200740,
20
+ "mllm_id": "google/gemma-2-2b-it",
21
+ "model_type": "metaquery",
22
+ "modules_to_freeze": [
23
+ "vae",
24
+ "model.mllm_backbone"
25
+ ],
26
+ "modules_to_unfreeze": [],
27
+ "noise_scheduler_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers",
28
+ "num_metaqueries": 64,
29
+ "scheduler_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers",
30
+ "source_vae_feature": true,
31
+ "system_prompt": "You are a robot and should focus on your actions. Generate a new image that meets the user's instruction while maintaining consistency with the original input where appropriate.",
32
+ "transformers_version": "4.57.1",
33
+ "vae_downsample_f": 32,
34
+ "vae_id": "Efficient-Large-Model/Sana_1600M_512px_diffusers"
35
+ }
model-00001-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05824b40b9a35b84ae84598a480e3b41b9ae4cb85f3d8a75b9f0ef7926556c02
3
+ size 4988031160
model-00002-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3febe45ea332f63d46b0aef6a1e5545715e12c00b8afac940f343c7a0950b2d
3
+ size 4999985168
model-00003-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:161c4d8f4d1d8e5aeb2c716be661e42bc686b64c538eacdce457d67b328d3db2
3
+ size 253880566
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff