onpix committed on
Commit
1dfb99e
·
verified ·
1 Parent(s): 441c700

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ ar_distilled_action_model/model.safetensors filter=lfs diff=lfs merge=lfs -text
37
+ ar_model/diffusion_pytorch_model.safetensors filter=lfs diff=lfs merge=lfs -text
38
+ bidirectional_model/diffusion_pytorch_model.safetensors filter=lfs diff=lfs merge=lfs -text
ar_distilled_action_model/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2642ca972e49355e1a00d18dbc9847a2d8c1e707a6a9abd0994d4949258cc963
3
+ size 34231948208
ar_model/config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "patch_size": [
3
+ 1,
4
+ 1,
5
+ 1
6
+ ],
7
+ "in_channels": 32,
8
+ "concat_condition": true,
9
+ "out_channels": 32,
10
+ "hidden_size": 2048,
11
+ "heads_num": 16,
12
+ "mlp_width_ratio": 4,
13
+ "mlp_act_type": "gelu_tanh",
14
+ "mm_double_blocks_depth": 54,
15
+ "mm_single_blocks_depth": 0,
16
+ "rope_dim_list": [
17
+ 16,
18
+ 56,
19
+ 56
20
+ ],
21
+ "qkv_bias": true,
22
+ "qk_norm": true,
23
+ "qk_norm_type": "rms",
24
+ "guidance_embed": false,
25
+ "use_meanflow": false,
26
+ "text_projection": "single_refiner",
27
+ "use_attention_mask": true,
28
+ "text_states_dim": 3584,
29
+ "text_states_dim_2": null,
30
+ "text_pool_type": null,
31
+ "rope_theta": 256,
32
+ "attn_mode": "flash",
33
+ "attn_param": null,
34
+ "glyph_byT5_v2": true,
35
+ "vision_projection": "linear",
36
+ "vision_states_dim": 1152,
37
+ "is_reshape_temporal_channels": false,
38
+ "use_cond_type_embedding": true,
39
+ "ideal_resolution": "480p",
40
+ "ideal_task": "i2v",
41
+ "_class_name": "ARHunyuanVideo_1_5_DiffusionTransformer",
42
+ "_diffusers_version": "0.35.0",
43
+ "_name_or_path": "/apdcephfs_jn2/share_303535725/aejionzhang/checkpoints/hunyuanvideo_1_5/transformer/480p_i2v/"
44
+ }
ar_model/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d71e503fc36dd0a44b985de1e05bfedb8825f571ccce7d6039b4a2dcd954f9c8
3
+ size 34231948208
bidirectional_model/config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "patch_size": [
3
+ 1,
4
+ 1,
5
+ 1
6
+ ],
7
+ "in_channels": 32,
8
+ "concat_condition": true,
9
+ "out_channels": 32,
10
+ "hidden_size": 2048,
11
+ "heads_num": 16,
12
+ "mlp_width_ratio": 4,
13
+ "mlp_act_type": "gelu_tanh",
14
+ "mm_double_blocks_depth": 54,
15
+ "mm_single_blocks_depth": 0,
16
+ "rope_dim_list": [
17
+ 16,
18
+ 56,
19
+ 56
20
+ ],
21
+ "qkv_bias": true,
22
+ "qk_norm": true,
23
+ "qk_norm_type": "rms",
24
+ "guidance_embed": false,
25
+ "use_meanflow": false,
26
+ "text_projection": "single_refiner",
27
+ "use_attention_mask": true,
28
+ "text_states_dim": 3584,
29
+ "text_states_dim_2": null,
30
+ "text_pool_type": null,
31
+ "rope_theta": 256,
32
+ "attn_mode": "flash",
33
+ "attn_param": null,
34
+ "glyph_byT5_v2": true,
35
+ "vision_projection": "linear",
36
+ "vision_states_dim": 1152,
37
+ "is_reshape_temporal_channels": false,
38
+ "use_cond_type_embedding": true,
39
+ "ideal_resolution": "480p",
40
+ "ideal_task": "i2v",
41
+ "_class_name": "HunyuanVideo_1_5_DiffusionTransformer",
42
+ "_diffusers_version": "0.35.0",
43
+ "_name_or_path": "/apdcephfs_jn2/share_303535725/aejionzhang/checkpoints/hunyuanvideo_1_5/transformer/480p_i2v/"
44
+ }
bidirectional_model/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1926ad6356248f191092768758ef959608f0ee7473c06e6ae7c7f116b9f77b19
3
+ size 34231948208