nickname100231 committed on
Commit
85268e8
·
verified ·
1 Parent(s): 56fa8f9

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because the commit contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. config.json +71 -0
  3. consolidated-00181-of-00272.safetensors +3 -0
  4. consolidated-00182-of-00272.safetensors +3 -0
  5. consolidated-00185-of-00272.safetensors +3 -0
  6. consolidated-00187-of-00272.safetensors +3 -0
  7. consolidated-00188-of-00272.safetensors +3 -0
  8. consolidated-00189-of-00272.safetensors +3 -0
  9. consolidated-00192-of-00272.safetensors +3 -0
  10. consolidated-00193-of-00272.safetensors +3 -0
  11. consolidated-00194-of-00272.safetensors +3 -0
  12. consolidated-00195-of-00272.safetensors +3 -0
  13. consolidated-00196-of-00272.safetensors +3 -0
  14. consolidated-00198-of-00272.safetensors +3 -0
  15. consolidated-00199-of-00272.safetensors +3 -0
  16. consolidated-00201-of-00272.safetensors +3 -0
  17. consolidated-00202-of-00272.safetensors +3 -0
  18. consolidated-00203-of-00272.safetensors +3 -0
  19. consolidated-00204-of-00272.safetensors +3 -0
  20. consolidated-00205-of-00272.safetensors +3 -0
  21. consolidated-00206-of-00272.safetensors +3 -0
  22. consolidated-00207-of-00272.safetensors +3 -0
  23. consolidated-00208-of-00272.safetensors +3 -0
  24. consolidated-00209-of-00272.safetensors +3 -0
  25. consolidated-00211-of-00272.safetensors +3 -0
  26. consolidated-00212-of-00272.safetensors +3 -0
  27. consolidated-00213-of-00272.safetensors +3 -0
  28. consolidated-00214-of-00272.safetensors +3 -0
  29. consolidated-00216-of-00272.safetensors +3 -0
  30. consolidated-00217-of-00272.safetensors +3 -0
  31. consolidated-00219-of-00272.safetensors +3 -0
  32. consolidated-00221-of-00272.safetensors +3 -0
  33. consolidated-00222-of-00272.safetensors +3 -0
  34. consolidated-00224-of-00272.safetensors +3 -0
  35. consolidated-00225-of-00272.safetensors +3 -0
  36. consolidated-00226-of-00272.safetensors +3 -0
  37. consolidated-00228-of-00272.safetensors +3 -0
  38. consolidated-00229-of-00272.safetensors +3 -0
  39. consolidated-00231-of-00272.safetensors +3 -0
  40. consolidated-00232-of-00272.safetensors +3 -0
  41. consolidated-00234-of-00272.safetensors +3 -0
  42. consolidated-00235-of-00272.safetensors +3 -0
  43. consolidated-00238-of-00272.safetensors +3 -0
  44. consolidated-00239-of-00272.safetensors +3 -0
  45. consolidated-00241-of-00272.safetensors +3 -0
  46. consolidated-00242-of-00272.safetensors +3 -0
  47. consolidated-00245-of-00272.safetensors +3 -0
  48. consolidated-00246-of-00272.safetensors +3 -0
  49. consolidated-00247-of-00272.safetensors +3 -0
  50. model.safetensors.index.json +0 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tekken.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "head_dim": 192,
3
+ "vocab_size": 131072,
4
+ "llama_4_scaling": {
5
+ "original_max_position_embeddings": 8192,
6
+ "beta": 0.1
7
+ },
8
+ "q_lora_rank": 1536,
9
+ "qk_rope_head_dim": 64,
10
+ "qk_nope_head_dim": 128,
11
+ "kv_lora_rank": 512,
12
+ "v_head_dim": 128,
13
+ "vision_encoder": {
14
+ "image_token_id": 10,
15
+ "image_break_token_id": 12,
16
+ "image_end_token_id": 13,
17
+ "intermediate_size": 8192,
18
+ "num_hidden_layers": 48,
19
+ "num_attention_heads": 16,
20
+ "mm_projector_id": "patch_merge",
21
+ "spatial_merge_size": 2,
22
+ "hidden_size": 1664,
23
+ "num_channels": 3,
24
+ "image_size": 1540,
25
+ "max_image_size": 1540,
26
+ "patch_size": 14,
27
+ "rope_theta": 10000.0,
28
+ "add_pre_mm_projector_layer_norm": true,
29
+ "adapter_bias": false
30
+ },
31
+ "hidden_size": 7168,
32
+ "rms_norm_eps": 1e-06,
33
+ "num_key_value_heads": 128,
34
+ "num_hidden_layers": 61,
35
+ "num_attention_heads": 128,
36
+ "intermediate_size": 16384,
37
+ "model_type": "deepseek_v3",
38
+ "hidden_act": "silu",
39
+ "tie_word_embeddings": false,
40
+ "max_seq_len": 262144,
41
+ "max_position_embeddings": 294912,
42
+ "moe_layer_freq": 1,
43
+ "first_k_dense_replace": 3,
44
+ "num_experts_per_tok": 4,
45
+ "n_routed_experts": 128,
46
+ "moe_intermediate_size": 4096,
47
+ "routed_scaling_factor": 1.0,
48
+ "n_shared_experts": 1,
49
+ "n_group": 1,
50
+ "topk_group": 1,
51
+ "topk_method": null,
52
+ "norm_topk_prob": true,
53
+ "scoring_func": "softmax",
54
+ "num_local_experts": 128,
55
+ "architectures": [
56
+ "DeepseekV3ForCausalLM"
57
+ ],
58
+ "rope_scaling": {
59
+ "rope_type": "yarn",
60
+ "mscale_all_dim": 1,
61
+ "mscale": 1,
62
+ "rope_theta": 10000.0,
63
+ "factor": 36,
64
+ "original_max_position_embeddings": 8192,
65
+ "beta_fast": 32,
66
+ "beta_slow": 1,
67
+ "llama_4_scaling_beta": 0.1
68
+ },
69
+ "bos_token_id": 1,
70
+ "eos_token_id": 2
71
+ }
consolidated-00181-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa321693447c82130313f54f1ebfceca1de6d70890b57c0a0a3408c22f8d5b2e
3
+ size 4991232376
consolidated-00182-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5339e22c60f1e1c98b49c3aab5c0d764ec529d40b9a0143351e34d3b60cf349
3
+ size 4956269264
consolidated-00185-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50b26b4803d26fc9b2a72f0226b004c6a682573455d2615cc0876fe02f9b317f
3
+ size 4991232368
consolidated-00187-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a41a291924649dacaebfbe620292156aa6d6bbc1d77cacb1161a60ff82d14803
3
+ size 4956269296
consolidated-00188-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:205a171c28b82417ed2bca20d6d884991700626c7c68776a282f0b1dadd4095d
3
+ size 4991232408
consolidated-00189-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f79eaa6fd7cb2bc6a059a3dcb72ab6efaaad7e9ac46bcb5d28cd6540bdafacbd
3
+ size 4991232368
consolidated-00192-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99a155e77194b775ae19c8086373c18e9d0416a7fc78d78757ab48a73f6d1b4e
3
+ size 4991232464
consolidated-00193-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4043ecb75c46200996340f3ce3ffef63ae1ada5e66d42e8723c7709d39e3102
3
+ size 4991232376
consolidated-00194-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83277f34ec1fc527badf380bfc38b779b37f3df1a9969f91eef33a7bf587d5cf
3
+ size 4991232376
consolidated-00195-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be593f29dd2e9c6579a8a4e7e6e8110a9374605022608bcdea0673c2ad9a2df2
3
+ size 4991232376
consolidated-00196-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9eec2864624ed1d8fe48b80e2aaf23f2aeb34a8569c833f00fe38f3251a67fee
3
+ size 4956269224
consolidated-00198-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc432b22413b531a8eea42cd5352579c31bbd5d9d70418d40e9866408c5e5b10
3
+ size 4991232288
consolidated-00199-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63ff48037d3e85fb5061a8e5b86760b7aad9a9d1a53efb00f3e995b328b5a8c9
3
+ size 4991232288
consolidated-00201-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6580f548e686cacd94e07fb8331f03d87b37c3ebd9ed2a1f2c857aafb9ffa3c8
3
+ size 4956269296
consolidated-00202-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d83b4a15e6f943fcc752eb60fb6b966976b2fdc8791d4fe0de032cc874148974
3
+ size 4991232400
consolidated-00203-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5abb6b563820e5c73782a60fb00e27a035825ff5cf5074ec50046a7124a6e406
3
+ size 4991232376
consolidated-00204-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fca62aea9d43f0bbb8481faf0384e3f77dd8d1d118523c2bed3df7fb0e58979
3
+ size 4991232368
consolidated-00205-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61add23c94bd81ccf097b455939eaaddbd3b83eb2aa15eca85f56de30a4f52b9
3
+ size 4956269248
consolidated-00206-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50938a2883bacb357948a2e3949267e754c9dcbaf428179739a70f884be7d094
3
+ size 4991232456
consolidated-00207-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7888d1030f3884d0e68c407aa601bd089619ec89ac9266fe8eacb948eb17a55b
3
+ size 4991232376
consolidated-00208-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdb52d330712a073da71d5227e9bede557850591e2d2ef27ffa2e94dfff97e76
3
+ size 4991232376
consolidated-00209-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6d26c505907bd6bfcc9af5e2de996f865bf545d9b1c44ed5a2d4242c351b398
3
+ size 4991232376
consolidated-00211-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1b1f457849d9e600284a5d17d1cf0f7282e61159a0a5768460e2a52a8966d66
3
+ size 4991232424
consolidated-00212-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95970a7deeb5b75bc3ab3fb5c892d2d7a4e8d026cb0e1d4b63cc6bd60206119c
3
+ size 4991232376
consolidated-00213-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc9cf4f957994c9e0adbe381f7dfd56724740af252a0ef9becac0872882a163c
3
+ size 4991232376
consolidated-00214-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34fe15bf56b227afbe0b042a1b3079cceaf8a307698d953efa8c697686bb0117
3
+ size 4917457752
consolidated-00216-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcc3f7e5ddc50b2899b5d32c0c8bb8eae7c55a6237eb35694d385a92bccd0a78
3
+ size 4991232392
consolidated-00217-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2be932c5f4cecb98f18c443e94637fd74eb9388e1ec335b118290a38a5975a8c
3
+ size 4991232376
consolidated-00219-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5851584c2775ee5e69a1dd6ce6ebe053b58c28b5bc194fbe676e274827a5c44
3
+ size 4956269256
consolidated-00221-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2f58d8395137ba18f2e3e74542d946d0be8006ec7c00dbfa069f26ddc3c1ad8
3
+ size 4991232368
consolidated-00222-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a54e041ed68baf82c1c821a944c65eef7cadbb099738fde073873fc85ba5f5a
3
+ size 4991232376
consolidated-00224-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67bfe0c017c3466fc0bc691d7ae97d946cbf93251df63c453c128c3b13c81db7
3
+ size 4956269288
consolidated-00225-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36e5ccd6d934bd7cc751923b2fa0d8c16bf244c759d99f849190ddc5582aef5d
3
+ size 4991232416
consolidated-00226-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9accec2f3a08b47a4dbd679def1103c684ab5fa473a828b9cdf5fcfcacfac0fc
3
+ size 4991232376
consolidated-00228-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be072eac7a8e87593eb1baff3232dcb0480962c60c0532736f521abb19acd3e0
3
+ size 4956269240
consolidated-00229-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf9b67a100630b42ea7a913f7c53409765d28d6811cd27eb49cd109b94545f9a
3
+ size 4991232448
consolidated-00231-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bda0d0807fa8504aac6548ab08f8208300e7460ba5c84422698eeb827cfd9959
3
+ size 4991232376
consolidated-00232-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c060dc8e7f06bf57bf3e26ce995af279fb2d7ee5a8785e75043c49801919a1f
3
+ size 4991232376
consolidated-00234-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc362032e164147767c4b4a543c1c9bcdae3356b6d9ef49cf8c7370506e13a84
3
+ size 4991232440
consolidated-00235-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbde6226008667d7efb5dd5863d442b72bb58eebed5bfcf4f5c88558f03dda2e
3
+ size 4991232376
consolidated-00238-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9b5a161f1333367e31388c3335dabb5f50ba1efb40a92322e5191f99c5ad0f4
3
+ size 4956269296
consolidated-00239-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4cd03114579627f04b5d6bf8ad52d18c16186eeb2c5b9b455662a562ee37e41
3
+ size 4991232408
consolidated-00241-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f9bd69b5746f2124b7a880ea0457e5a961e724f97053b948223b3d6594487b8
3
+ size 4991232376
consolidated-00242-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:057e1881cad30e22ce6dacdb76e483bcea8c482a2cf1751666d96f77977a0c7c
3
+ size 4956269240
consolidated-00245-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04c6297ff7e28abe70fe833f9daf5ed9cf766fc43ad6662d54f07f118aa61785
3
+ size 4991232376
consolidated-00246-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f010c4d49588705a1b26b6b8dbc54acf17ce0000a0c086e03280882c39b1bd40
3
+ size 4991232376
consolidated-00247-of-00272.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8484c70fc8af07a9b29155205ff2d66c1a50886af1d80f661a13f66e33ceeb1
3
+ size 4956269224
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff