kerzgrr committed on
Commit
a9b7249
·
verified ·
1 Parent(s): 5ca86d9

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +60 -0
config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "kerzgrr/imagenv1m",
3
+ "model_type": "imagen-dit",
4
+ "model_version": "v1-medium",
5
+ "model_size": "320M",
6
+
7
+ "architecture": {
8
+ "type": "DiT",
9
+ "hidden_size": 1024,
10
+ "depth": 12,
11
+ "num_heads": 16,
12
+ "patch_size": 2,
13
+ "mlp_ratio": 4.0,
14
+ "context_dim": 1024,
15
+ "in_channels": 4,
16
+ "use_rope": true,
17
+ "use_qk_norm": true,
18
+ "use_swiglu": true
19
+ },
20
+
21
+ "text_encoder": {
22
+ "type": "t5",
23
+ "model_name": "google/flan-t5-large",
24
+ "max_length": 256
25
+ },
26
+
27
+ "vae": {
28
+ "type": "sdxl",
29
+ "model_name": "stabilityai/sdxl-vae",
30
+ "latent_channels": 4,
31
+ "scaling_factor": 0.13025
32
+ },
33
+
34
+ "diffusion": {
35
+ "num_timesteps": 1000,
36
+ "schedule": "cosine",
37
+ "prediction_type": "epsilon"
38
+ },
39
+
40
+ "generation": {
41
+ "default_steps": 50,
42
+ "default_cfg_scale": 7.5,
43
+ "image_size": 256
44
+ },
45
+
46
+ "training": {
47
+ "dataset": "UCSC-VLAA/Recap-DataComp-1B",
48
+ "precision": "bf16",
49
+ "ema_decay": 0.9999
50
+ },
51
+
52
+ "model_family": {
53
+ "v1-nano": {"params": "50M", "hidden_size": 384, "depth": 8, "status": "planned"},
54
+ "v1-small": {"params": "150M", "hidden_size": 768, "depth": 10, "status": "planned"},
55
+ "v1-medium": {"params": "320M", "hidden_size": 1024, "depth": 12, "status": "released"},
56
+ "v1-large": {"params": "700M", "hidden_size": 1536, "depth": 16, "status": "planned"},
57
+ "v1-xlarge": {"params": "1.5B", "hidden_size": 2048, "depth": 24, "status": "planned"}
58
+ }
59
+ }
60
+