Upload folder using huggingface_hub
#1
by at676 - opened
- config.json +51 -0
- generation_config.json +12 -0
- model-00001-of-00034.safetensors +3 -0
- model-00002-of-00034.safetensors +3 -0
- model-00003-of-00034.safetensors +3 -0
- model-00004-of-00034.safetensors +3 -0
- model-00005-of-00034.safetensors +3 -0
- model-00006-of-00034.safetensors +3 -0
- model-00007-of-00034.safetensors +3 -0
- model-00008-of-00034.safetensors +3 -0
- model-00009-of-00034.safetensors +3 -0
- model-00010-of-00034.safetensors +3 -0
- model-00011-of-00034.safetensors +3 -0
- model-00012-of-00034.safetensors +3 -0
- model-00013-of-00034.safetensors +3 -0
- model-00014-of-00034.safetensors +3 -0
- model-00015-of-00034.safetensors +3 -0
- model-00016-of-00034.safetensors +3 -0
- model-00017-of-00034.safetensors +3 -0
- model-00018-of-00034.safetensors +3 -0
- model-00019-of-00034.safetensors +3 -0
- model-00020-of-00034.safetensors +3 -0
- model-00021-of-00034.safetensors +3 -0
- model-00022-of-00034.safetensors +3 -0
- model-00023-of-00034.safetensors +3 -0
- model-00024-of-00034.safetensors +3 -0
- model-00025-of-00034.safetensors +3 -0
- model-00026-of-00034.safetensors +3 -0
- model-00027-of-00034.safetensors +3 -0
- model-00028-of-00034.safetensors +3 -0
- model-00029-of-00034.safetensors +3 -0
- model-00030-of-00034.safetensors +3 -0
- model-00031-of-00034.safetensors +3 -0
- model-00032-of-00034.safetensors +3 -0
- model-00033-of-00034.safetensors +3 -0
- model-00034-of-00034.safetensors +3 -0
- model.safetensors.index.json +0 -0
config.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_name_or_path": "meta-llama/Meta-Llama-3.1-405B-Instruct",
|
| 3 |
+
"architectures": [
|
| 4 |
+
"LlamaForCausalLM"
|
| 5 |
+
],
|
| 6 |
+
"attention_bias": false,
|
| 7 |
+
"attention_dropout": 0.0,
|
| 8 |
+
"bos_token_id": 128000,
|
| 9 |
+
"eos_token_id": [
|
| 10 |
+
128001,
|
| 11 |
+
128008,
|
| 12 |
+
128009
|
| 13 |
+
],
|
| 14 |
+
"head_dim": 128,
|
| 15 |
+
"hidden_act": "silu",
|
| 16 |
+
"hidden_size": 16384,
|
| 17 |
+
"initializer_range": 0.02,
|
| 18 |
+
"intermediate_size": 53248,
|
| 19 |
+
"max_position_embeddings": 131072,
|
| 20 |
+
"mlp_bias": false,
|
| 21 |
+
"model_type": "llama",
|
| 22 |
+
"num_attention_heads": 128,
|
| 23 |
+
"num_hidden_layers": 126,
|
| 24 |
+
"num_key_value_heads": 8,
|
| 25 |
+
"pretraining_tp": 1,
|
| 26 |
+
"quip_params": {
|
| 27 |
+
"K": 3,
|
| 28 |
+
"L": 16,
|
| 29 |
+
"V": 2,
|
| 30 |
+
"codebook": "bitshift",
|
| 31 |
+
"codebook_version": 0,
|
| 32 |
+
"decode_mode": "quantlut_sym",
|
| 33 |
+
"td_x": 16,
|
| 34 |
+
"td_y": 16,
|
| 35 |
+
"tlut_bits": 9
|
| 36 |
+
},
|
| 37 |
+
"rms_norm_eps": 1e-05,
|
| 38 |
+
"rope_scaling": {
|
| 39 |
+
"factor": 8.0,
|
| 40 |
+
"high_freq_factor": 4.0,
|
| 41 |
+
"low_freq_factor": 1.0,
|
| 42 |
+
"original_max_position_embeddings": 8192,
|
| 43 |
+
"rope_type": "llama3"
|
| 44 |
+
},
|
| 45 |
+
"rope_theta": 500000.0,
|
| 46 |
+
"tie_word_embeddings": false,
|
| 47 |
+
"torch_dtype": "bfloat16",
|
| 48 |
+
"transformers_version": "4.45.2",
|
| 49 |
+
"use_cache": true,
|
| 50 |
+
"vocab_size": 128256
|
| 51 |
+
}
|
generation_config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token_id": 128000,
|
| 3 |
+
"do_sample": true,
|
| 4 |
+
"eos_token_id": [
|
| 5 |
+
128001,
|
| 6 |
+
128008,
|
| 7 |
+
128009
|
| 8 |
+
],
|
| 9 |
+
"temperature": 0.6,
|
| 10 |
+
"top_p": 0.9,
|
| 11 |
+
"transformers_version": "4.45.2"
|
| 12 |
+
}
|
model-00001-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a42deca02abcefc58242c25cefbfc71ba235f025e87a6562bf94510d3873e5e2
|
| 3 |
+
size 4744288624
|
model-00002-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c6c8b2ce881db2a10a332d340ab9083b2da893b9f2c7fa29d9e64d1a37f6521
|
| 3 |
+
size 4785574248
|
model-00003-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1effc15a8e6bff779bd2d69576a2352e90f5a4242d21aaae190986fb0ae1ee18
|
| 3 |
+
size 4785574248
|
model-00004-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0ad27d0b7627694be8213fa797a12e29eb978ab611a9077c573297a90167a549
|
| 3 |
+
size 4785574328
|
model-00005-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc4f631cd63569758d212a5b157616c22ee2be348adc6bf3756c9c358f8481a0
|
| 3 |
+
size 4785574368
|
model-00006-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47f18a027a2f9a3692311c44c40054f60bbe84d818463e4cf0ca1588aaf1ab19
|
| 3 |
+
size 4785574368
|
model-00007-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0ea2824c2e53ca325219220ccb9759a54710fb4731ac60d19dfdf260f32b091
|
| 3 |
+
size 4785574368
|
model-00008-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d1fde9f3469f0f14b7c1bd3e7bedb1e4adaf575171240d39857c09d8f1d9978
|
| 3 |
+
size 4785574368
|
model-00009-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ec887524b05edb1cb8518bfc7e6fa1a4d60122d46796f0181742e3f11384780
|
| 3 |
+
size 4785574368
|
model-00010-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bc0da1cb9b42972d6649231b66f8d8c2b187d2fe438a03c2f65312f73669aff
|
| 3 |
+
size 4785574368
|
model-00011-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e64204fe44c6e2a09f38bbd3a317832e5a325b4fa754c55e45d9fdb2d8b9e19e
|
| 3 |
+
size 4785574368
|
model-00012-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd9dc098ad292e79d26b3006921ae3e6b1f20e21d44fc62709d86bcb04a3b645
|
| 3 |
+
size 4785574368
|
model-00013-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2ec5f7bea8e751982cd267b0db5ec8f53341cbc3dc211ac25fba8168329556a
|
| 3 |
+
size 4785574368
|
model-00014-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:342106a19f04746272440840cc7580cec84a660055c9a358268f27aa3185f4da
|
| 3 |
+
size 4785574368
|
model-00015-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5131fe57c81e29efa187fc77af55a935a045c81f2cb6faba0a722e14647a62b6
|
| 3 |
+
size 4785574368
|
model-00016-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1842f1505a48bd06d73dff1d4e743b9ad93cf7a57905e1007d394958ddea81df
|
| 3 |
+
size 4785574368
|
model-00017-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d38612c5bdcde4cb1a6409a8edf89693436250fb51a1769d89f633ea6f4685e8
|
| 3 |
+
size 4785574368
|
model-00018-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d7489a481bc990a57d631c4bed93ff105655679baea41bbddcdf02b96bb903c
|
| 3 |
+
size 4785574368
|
model-00019-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:458c27ea0de160cdd1e7418a28a4d140a06454fe81549ca9c161f96ae80be3a6
|
| 3 |
+
size 4785574368
|
model-00020-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba7fcffddf087d7441d28e4208fdd8d521d2cf9daabbc1899641f60ca1649806
|
| 3 |
+
size 4785574368
|
model-00021-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82580025a77f93b9718bdf1a19b803befe2578733aff3b822f850e299306f7d0
|
| 3 |
+
size 4785574368
|
model-00022-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cba94cdc47e0ec3fe9d3654dffd8d1075409fc87102b8d9e60b6108c1e317b4
|
| 3 |
+
size 4785574368
|
model-00023-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8ea243b3e9e8095e7374d7e66b53c87f28185777ef934c1680ddac4582c7f9b4
|
| 3 |
+
size 4785574368
|
model-00024-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b52474db9dc9b785df0984f9926f69d1738169327039af8e2f0ce41f04a94fc
|
| 3 |
+
size 4785574368
|
model-00025-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c3a90ae500d679a893f1f6820bfbd2d9d409b7b1ec31b7b56bcef1d12021608
|
| 3 |
+
size 4785574368
|
model-00026-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd8f6a3681073cc2da50f5a8ebcc7f2531f3a83b5cf3fc528d66a835bc35c70f
|
| 3 |
+
size 4785574384
|
model-00027-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4056031273560748c122df42bd4fd7a245eb820d08f10a1a0c1a7fbb7e7e2cfd
|
| 3 |
+
size 4785574488
|
model-00028-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef5bc3315c8e1027532f131897cc09558cf65f9afc0019bc6e98ff5fd7b2a03a
|
| 3 |
+
size 4785574488
|
model-00029-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17ecba067b4609fa1a97d651ee01a6fcb79e61ef6e4d2d3add73d0806fa81f7e
|
| 3 |
+
size 4785574488
|
model-00030-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70cd3373b9827f488c4ec09819d1502e6d89a361894b571dc63124ace58bfb56
|
| 3 |
+
size 4785574488
|
model-00031-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a00d96cfbabae5081fcccec3a54f8dd194185844d2aae639db56b5d62676d021
|
| 3 |
+
size 4785574488
|
model-00032-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:063d533fe69e11a564b480062686feffa17b1c3ac7d2ad51ff8cb7b3af7384f4
|
| 3 |
+
size 4785574488
|
model-00033-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c060cd8ee1d4f25e39115324e8f8ab1a0c126dc3610fc24b6536ee7174e1b8e
|
| 3 |
+
size 1851224240
|
model-00034-of-00034.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71b079a02069ebe5a5f4f8135815f136afb1d6fc4423620dcb2a14fa399cdf12
|
| 3 |
+
size 4202692736
|
model.safetensors.index.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|