Vizuara committed on
Commit
a3bd115
·
verified ·
1 Parent(s): 496d5f5

Add config.json

Browse files
Files changed (1) hide show
  1. config.json +111 -0
config.json ADDED
@@ -0,0 +1,111 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_dim": 32,
3
+ "action_head_cfg": {
4
+ "_convert_": "object",
5
+ "_target_": "groot.vla.model.dreamzero.action_head.wan_flow_matching_action_tf.WANPolicyHead",
6
+ "config": {
7
+ "_recursive_": false,
8
+ "_target_": "groot.vla.model.dreamzero.action_head.wan_flow_matching_action_tf.WANPolicyHeadConfig",
9
+ "action_dim": 32,
10
+ "action_horizon": 24,
11
+ "action_loss_embodiment_ids": [
12
+ 26,
13
+ 17,
14
+ 32
15
+ ],
16
+ "add_pos_embed": true,
17
+ "backbone_embedding_dim": 0,
18
+ "backbone_features_projector_cfg": null,
19
+ "decouple_video_action_noise": false,
20
+ "diffusion_model_cfg": {
21
+ "_convert_": "object",
22
+ "_target_": "groot.vla.model.dreamzero.modules.wan_video_dit_action_casual_chunk.CausalWanModel",
23
+ "diffusion_model_pretrained_path": "/workspace/checkpoints/Wan2.1-I2V-14B-480P",
24
+ "dim": 5120,
25
+ "eps": 1e-06,
26
+ "ffn_dim": 13824,
27
+ "frame_seqlen": 880,
28
+ "freq_dim": 256,
29
+ "in_dim": 36,
30
+ "max_chunk_size": 4,
31
+ "model_type": "i2v",
32
+ "num_action_per_block": 24,
33
+ "num_frame_per_block": 2,
34
+ "num_heads": 40,
35
+ "num_layers": 40,
36
+ "num_state_per_block": 1,
37
+ "out_dim": 16
38
+ },
39
+ "expand_batch": null,
40
+ "freeze_decode_layer": false,
41
+ "hidden_size": 64,
42
+ "image_encoder_cfg": {
43
+ "_convert_": "object",
44
+ "_target_": "groot.vla.model.dreamzero.modules.wan_video_image_encoder.WanImageEncoder",
45
+ "image_encoder_pretrained_path": "/workspace/checkpoints/Wan2.1-I2V-14B-480P/models_clip_open-clip-xlm-roberta-large-vit-huge-14.pth"
46
+ },
47
+ "init_lora_weights": "kaiming",
48
+ "input_embedding_dim": 1536,
49
+ "load_pretrained_det_decode_layer_path": null,
50
+ "lora_alpha": 4,
51
+ "lora_rank": 4,
52
+ "lora_target_modules": "q,k,v,o,ffn.0,ffn.2",
53
+ "max_action_dim": 32,
54
+ "max_state_dim": 64,
55
+ "model_dtype": "float32",
56
+ "noise_beta_alpha": 1.5,
57
+ "noise_beta_beta": 1.0,
58
+ "noise_s": 0.999,
59
+ "num_frame_per_block": 2,
60
+ "num_frames": 33,
61
+ "num_inference_timesteps": 4,
62
+ "num_timestep_buckets": 1000,
63
+ "repa_coeff": 1.0,
64
+ "repa_layer": 8,
65
+ "text_encoder_cfg": {
66
+ "_convert_": "object",
67
+ "_target_": "groot.vla.model.dreamzero.modules.wan_video_text_encoder.WanTextEncoder",
68
+ "text_encoder_pretrained_path": "/workspace/checkpoints/Wan2.1-I2V-14B-480P/models_t5_umt5-xxl-enc-bf16.pth"
69
+ },
70
+ "tile_size_height": 34,
71
+ "tile_size_width": 34,
72
+ "tile_stride_height": 18,
73
+ "tile_stride_width": 16,
74
+ "tiled": false,
75
+ "train_architecture": "lora",
76
+ "tune_diffusion_model": true,
77
+ "tune_projector": true,
78
+ "use_gradient_checkpointing": true,
79
+ "use_vlln": true,
80
+ "vae_cfg": {
81
+ "_convert_": "object",
82
+ "_target_": "groot.vla.model.dreamzero.modules.wan_video_vae.WanVideoVAE",
83
+ "vae_pretrained_path": "/workspace/checkpoints/Wan2.1-I2V-14B-480P/Wan2.1_VAE.pth"
84
+ },
85
+ "video_noise_beta_alpha": 3.0,
86
+ "video_noise_beta_beta": 1.0,
87
+ "vl_self_attention_cfg": {
88
+ "_target_": "groot.vla.model.n1_5.modules.cross_attention_dit.SelfAttentionTransformer",
89
+ "attention_head_dim": 64,
90
+ "dropout": 0.2,
91
+ "final_dropout": true,
92
+ "num_attention_heads": 24,
93
+ "num_layers": 4,
94
+ "positional_embeddings": null
95
+ }
96
+ }
97
+ },
98
+ "action_horizon": 24,
99
+ "architectures": [
100
+ "VLA"
101
+ ],
102
+ "backbone_cfg": {
103
+ "_target_": "groot.vla.model.dreamzero.backbone.identity.IdentityBackbone"
104
+ },
105
+ "hidden_size": 0,
106
+ "model_dtype": "float32",
107
+ "model_type": "vla",
108
+ "resume_path": "/workspace/checkpoints/dreamzero-so101-lora",
109
+ "torch_dtype": "bfloat16",
110
+ "transformers_version": "4.51.3"
111
+ }