camsemianalsyis committed on
Commit
ae0c5d8
·
verified ·
1 Parent(s): 408ba06

Add files using upload-large-folder tool

Browse files
Files changed (50) hide show
  1. chat_template.jinja +101 -0
  2. config.json +115 -0
  3. generation_config.json +9 -0
  4. model-00001-of-00135.safetensors +3 -0
  5. model-00003-of-00135.safetensors +3 -0
  6. model-00005-of-00135.safetensors +3 -0
  7. model-00006-of-00135.safetensors +3 -0
  8. model-00009-of-00135.safetensors +3 -0
  9. model-00012-of-00135.safetensors +3 -0
  10. model-00013-of-00135.safetensors +3 -0
  11. model-00016-of-00135.safetensors +3 -0
  12. model-00017-of-00135.safetensors +3 -0
  13. model-00018-of-00135.safetensors +3 -0
  14. model-00021-of-00135.safetensors +3 -0
  15. model-00022-of-00135.safetensors +3 -0
  16. model-00023-of-00135.safetensors +3 -0
  17. model-00024-of-00135.safetensors +3 -0
  18. model-00027-of-00135.safetensors +3 -0
  19. model-00028-of-00135.safetensors +3 -0
  20. model-00030-of-00135.safetensors +3 -0
  21. model-00031-of-00135.safetensors +3 -0
  22. model-00033-of-00135.safetensors +3 -0
  23. model-00034-of-00135.safetensors +3 -0
  24. model-00035-of-00135.safetensors +3 -0
  25. model-00038-of-00135.safetensors +3 -0
  26. model-00039-of-00135.safetensors +3 -0
  27. model-00040-of-00135.safetensors +3 -0
  28. model-00042-of-00135.safetensors +3 -0
  29. model-00044-of-00135.safetensors +3 -0
  30. model-00045-of-00135.safetensors +3 -0
  31. model-00047-of-00135.safetensors +3 -0
  32. model-00048-of-00135.safetensors +3 -0
  33. model-00049-of-00135.safetensors +3 -0
  34. model-00052-of-00135.safetensors +3 -0
  35. model-00054-of-00135.safetensors +3 -0
  36. model-00057-of-00135.safetensors +3 -0
  37. model-00062-of-00135.safetensors +3 -0
  38. model-00064-of-00135.safetensors +3 -0
  39. model-00070-of-00135.safetensors +3 -0
  40. model-00071-of-00135.safetensors +3 -0
  41. model-00072-of-00135.safetensors +3 -0
  42. model-00074-of-00135.safetensors +3 -0
  43. model-00075-of-00135.safetensors +3 -0
  44. model-00076-of-00135.safetensors +3 -0
  45. model-00079-of-00135.safetensors +3 -0
  46. model.safetensors.index.json +0 -0
  47. recipe.yaml +7 -0
  48. special_tokens_map.json +23 -0
  49. tokenizer.json +0 -0
  50. tokenizer_config.json +0 -0
chat_template.jinja ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {%- if not add_generation_prompt is defined %}
2
+ {%- set add_generation_prompt = false %}
3
+ {%- endif %}
4
+ {%- set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='', is_first_sp=true, is_last_user=false) %}
5
+ {%- for message in messages %}
6
+ {%- if message['role'] == 'system' %}
7
+ {%- if ns.is_first_sp %}
8
+ {%- set ns.system_prompt = ns.system_prompt + message['content'] %}
9
+ {%- set ns.is_first_sp = false %}
10
+ {%- else %}
11
+ {%- set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}
12
+ {%- endif %}
13
+ {%- endif %}
14
+ {%- endfor %}
15
+
16
+ {#- Adapted from https://github.com/sgl-project/sglang/blob/main/examples/chat_template/tool_chat_template_deepseekr1.jinja #}
17
+ {%- if tools is defined and tools is not none %}
18
+ {#- Tool preamble appended to the system prompt; the blank line after the JSON reminder keeps the '## Tools' heading at the start of a line. #}{%- set tool_ns = namespace(text='You are a helpful assistant with tool calling capabilities. ' + 'When a tool call is needed, you MUST use the following format to issue the call:\n' + '<|tool▁calls▁begin|><|tool▁call▁begin|>function<|tool▁sep|>FUNCTION_NAME\n' + '```json\n{"param1": "value1", "param2": "value2"}\n```<|tool▁call▁end|><|tool▁calls▁end|>\n\n' + 'Make sure the JSON is valid.\n\n' + '## Tools\n\n### Function\n\nYou have the following functions available:\n\n') %}
19
+ {%- for tool in tools %}
20
+ {%- set tool_ns.text = tool_ns.text + '\n```json\n' + (tool | tojson) + '\n```\n' %}
21
+ {%- endfor %}
22
+ {%- if ns.system_prompt|length != 0 %}
23
+ {%- set ns.system_prompt = ns.system_prompt + '\n\n' + tool_ns.text %}
24
+ {%- else %}
25
+ {%- set ns.system_prompt = tool_ns.text %}
26
+ {%- endif %}
27
+ {%- endif %}
28
+ {{- bos_token }}
29
+ {{- ns.system_prompt }}
30
+ {%- set last_index = (messages|length - 1) %}
31
+ {%- for message in messages %}
32
+ {%- set content = message['content'] %}
33
+ {%- if message['role'] == 'user' %}
34
+ {%- set ns.is_tool = false -%}
35
+ {%- set ns.is_first = false -%}
36
+ {%- set ns.is_last_user = true -%}
37
+ {%- if loop.index0 == last_index %}
38
+ {{- '<|User|>' + content }}
39
+ {%- else %}
40
+ {{- '<|User|>' + content + '<|Assistant|>'}}
41
+ {%- endif %}
42
+ {%- endif %}
43
+ {%- if message['role'] == 'assistant' %}
44
+ {#- Drop everything up to the last closing think tag. Content can be none on tool-call turns, so check the type before using `in`. #}{%- if content is string and '</think>' in content %}
45
+ {%- set content = (content.split('</think>')|last) %}
46
+ {%- endif %}
47
+ {%- endif %}
48
+ {%- if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}
49
+ {%- set ns.is_last_user = false -%}
50
+ {%- if ns.is_tool %}
51
+ {{- '<|tool▁outputs▁end|>'}}
52
+ {%- endif %}
53
+ {%- set ns.is_first = false %}
54
+ {%- set ns.is_tool = false -%}
55
+ {%- set ns.is_output_first = true %}
56
+ {%- for tool in message['tool_calls'] %}
57
+ {%- set arguments = tool['function']['arguments'] %}
58
+ {%- if arguments is not string %}
59
+ {%- set arguments = arguments|tojson %}
60
+ {%- endif %}
61
+ {%- if not ns.is_first %}
62
+ {%- if content is none %}
63
+ {{- '<|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + arguments + '\n' + '```' + '<|tool▁call▁end|>'}}
64
+ {#- Keep this branch free of literal text: anything outside a tag is emitted verbatim into the prompt. #}
65
+ {%- else %}
66
+ {{- content + '<|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + arguments + '\n' + '```' + '<|tool▁call▁end|>'}}
67
+ {%- endif %}
68
+ {%- set ns.is_first = true -%}
69
+ {%- else %}
70
+ {{- '\n' + '<|tool▁call▁begin|>' + tool['type'] + '<|tool▁sep|>' + tool['function']['name'] + '\n' + '```json' + '\n' + arguments + '\n' + '```' + '<|tool▁call▁end|>'}}
71
+ {%- endif %}
72
+ {%- endfor %}
73
+ {{- '<|tool▁calls▁end|><|end▁of▁sentence|>'}}
74
+ {%- endif %}
75
+ {%- if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none) %}
76
+ {%- set ns.is_last_user = false -%}
77
+ {%- if ns.is_tool %}
78
+ {{- '<|tool▁outputs▁end|>' + content + '<|end▁of▁sentence|>'}}
79
+ {%- set ns.is_tool = false -%}
80
+ {%- else %}
81
+ {{- content + '<|end▁of▁sentence|>'}}
82
+ {%- endif %}
83
+ {%- endif %}
84
+ {%- if message['role'] == 'tool' %}
85
+ {%- set ns.is_last_user = false -%}
86
+ {%- set ns.is_tool = true -%}
87
+ {%- if ns.is_output_first %}
88
+ {{- '<|tool▁outputs▁begin|><|tool▁output▁begin|>' + content + '<|tool▁output▁end|>'}}
89
+ {%- set ns.is_output_first = false %}
90
+ {%- else %}
91
+ {{- '\n<|tool▁output▁begin|>' + content + '<|tool▁output▁end|>'}}
92
+ {%- endif %}
93
+ {%- endif %}
94
+ {%- endfor -%}
95
+ {%- if ns.is_tool %}
96
+ {{- '<|tool▁outputs▁end|>'}}
97
+ {%- endif %}
98
+ {#- if add_generation_prompt and not ns.is_last_user and not ns.is_tool #}
99
+ {%- if add_generation_prompt and not ns.is_tool %}
100
+ {{- '<|Assistant|>'}}
101
+ {%- endif %}
config.json ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "DeepseekV3ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "auto_map": {
8
+ "AutoConfig": "configuration_deepseek.DeepseekV3Config",
9
+ "AutoModel": "modeling_deepseek.DeepseekV3Model",
10
+ "AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM"
11
+ },
12
+ "bos_token_id": 0,
13
+ "dtype": "bfloat16",
14
+ "eos_token_id": 1,
15
+ "ep_size": 1,
16
+ "first_k_dense_replace": 3,
17
+ "head_dim": 64,
18
+ "hidden_act": "silu",
19
+ "hidden_size": 7168,
20
+ "initializer_range": 0.02,
21
+ "intermediate_size": 18432,
22
+ "kv_lora_rank": 512,
23
+ "max_position_embeddings": 163840,
24
+ "model_type": "deepseek_v3",
25
+ "moe_intermediate_size": 2048,
26
+ "moe_layer_freq": 1,
27
+ "n_group": 8,
28
+ "n_routed_experts": 256,
29
+ "n_shared_experts": 1,
30
+ "norm_topk_prob": true,
31
+ "num_attention_heads": 128,
32
+ "num_experts_per_tok": 8,
33
+ "num_hidden_layers": 61,
34
+ "num_key_value_heads": 128,
35
+ "num_nextn_predict_layers": 1,
36
+ "pad_token_id": 2,
37
+ "pretraining_tp": 1,
38
+ "q_lora_rank": 1536,
39
+ "qk_head_dim": 192,
40
+ "qk_nope_head_dim": 128,
41
+ "qk_rope_head_dim": 64,
42
+ "quantization_config": {
43
+ "config_groups": {
44
+ "group_0": {
45
+ "format": "int-quantized",
46
+ "input_activations": {
47
+ "actorder": null,
48
+ "block_structure": null,
49
+ "dynamic": true,
50
+ "group_size": null,
51
+ "num_bits": 8,
52
+ "observer": null,
53
+ "observer_kwargs": {},
54
+ "scale_dtype": null,
55
+ "strategy": "token",
56
+ "symmetric": true,
57
+ "type": "int",
58
+ "zp_dtype": null
59
+ },
60
+ "output_activations": null,
61
+ "targets": [
62
+ "Linear"
63
+ ],
64
+ "weights": {
65
+ "actorder": null,
66
+ "block_structure": null,
67
+ "dynamic": false,
68
+ "group_size": null,
69
+ "num_bits": 8,
70
+ "observer": "memoryless_minmax",
71
+ "observer_kwargs": {},
72
+ "scale_dtype": null,
73
+ "strategy": "channel",
74
+ "symmetric": true,
75
+ "type": "int",
76
+ "zp_dtype": null
77
+ }
78
+ }
79
+ },
80
+ "format": "int-quantized",
81
+ "global_compression_ratio": null,
82
+ "ignore": [
83
+ "lm_head"
84
+ ],
85
+ "kv_cache_scheme": null,
86
+ "quant_method": "compressed-tensors",
87
+ "quantization_status": "compressed",
88
+ "sparsity_config": {},
89
+ "transform_config": {},
90
+ "version": "0.14.0.1"
91
+ },
92
+ "rms_norm_eps": 1e-06,
93
+ "rope_interleave": true,
94
+ "rope_scaling": {
95
+ "beta_fast": 32.0,
96
+ "beta_slow": 1.0,
97
+ "factor": 40.0,
98
+ "mscale": 1.0,
99
+ "mscale_all_dim": 1.0,
100
+ "original_max_position_embeddings": 4096,
101
+ "rope_type": "yarn",
102
+ "type": "yarn"
103
+ },
104
+ "rope_theta": 10000,
105
+ "routed_scaling_factor": 2.5,
106
+ "scoring_func": "sigmoid",
107
+ "tie_word_embeddings": false,
108
+ "topk_group": 4,
109
+ "topk_method": "noaux_tc",
110
+ "transformers_version": "4.57.6",
111
+ "unsloth_fixed": true,
112
+ "use_cache": true,
113
+ "v_head_dim": 128,
114
+ "vocab_size": 129280
115
+ }
generation_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 0,
4
+ "do_sample": true,
5
+ "eos_token_id": 1,
6
+ "temperature": 0.6,
7
+ "top_p": 0.95,
8
+ "transformers_version": "4.57.6"
9
+ }
model-00001-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eeea0d5a585f59581246895a2e50ed7a44fbc324e1a9e8458574fd957cc78fe
3
+ size 4996170688
model-00003-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:621c02e029b4dd789358b5b2a7e42e624247d4704d9d64228b1fc6a399e886fb
3
+ size 4993864896
model-00005-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:718df2252ec16287f1c81c512deaa3fde9041a60eba2c2d788a452e8b21faf83
3
+ size 4993854648
model-00006-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e12eed0df0f2018ae2d5828fe7966d834d0fdc94adb5d5f52d8b180c42b8c17a
3
+ size 4993859656
model-00009-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be4b3dda7a9f549b58669b42245bbea4638bdf3631eb8b7c883a8868d0d55fed
3
+ size 4993864512
model-00012-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93f81f3c5b3622ac7f4ecbc51088675e5f5836a01dae5b3e51e527e005c9f775
3
+ size 4993854648
model-00013-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae8727e35e1f0066abe844d8c16b3bfc8d7b43240add36deceddc7f93bbf237d
3
+ size 4993859656
model-00016-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b567d5539bba366f5b41f60eca1c289e155fc676ef5844fe85338c91acc299e9
3
+ size 4993854328
model-00017-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f2465d4f86f597adb86a2539188644b632b54f8dd34478082050d1580814d31
3
+ size 4993860088
model-00018-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7638e3a655377b6f91e6539429698145a5883b4406b53b8c8962dd9d19779be
3
+ size 4993854792
model-00021-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb3e5ea00a1eca8eb7f2bd61d1a33c4ad6dd45537b66b5a3ee4f469e3996eb3c
3
+ size 4993855272
model-00022-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7812fb5769bb381d5b56775d479b0b03ada464af5e3948686957d3149fff8509
3
+ size 4993860384
model-00023-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd0b7c7b96815e6e38f540bdaf08a1d1f0518832c0acc5bccdec4fbb7e675d91
3
+ size 4993855056
model-00024-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0c24b4133ca6e529c2fca0be5154c0f9ca25470bd1f5ca48f81a58169d88238
3
+ size 4993860592
model-00027-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6a9704ee1cf67ed3138f61c9dbd8311cc2bb763e1a679846bb552c1e9c142a8
3
+ size 4993860328
model-00028-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d38bae63aa601c72fe4ac163934078c74da33599797b978e9eab03204bde5057
3
+ size 4993855320
model-00030-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cefe2fe15f9ba847968145192a503c7581275578e608d7ab9544965505cd815
3
+ size 4993865360
model-00031-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21656b7c8d9e3d4995cec3dff0e66602477733f12fccb49485d95d1e2a057fa9
3
+ size 4993860536
model-00033-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d507ffeba5cfd1ff5befcb8d6190dca815877c0029226e5cd84f62f1bb735c1
3
+ size 4997526088
model-00034-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5720daf2560f8e97ea57d41ae49165fc77fccf38b8c2d7e0ae8021928c86f9c7
3
+ size 4990189360
model-00035-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ad64b63fb2aae6646e1ff2d30bd62ec73fb3532c7406cfadb38b3c20bff7645
3
+ size 4993865576
model-00038-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c4e4c4eddaca6d4d0925c4df3007755cafdf4fb5edb3e23bda46f2fa374c0f9
3
+ size 4993860480
model-00039-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e028f1bd9b2b62fa6cbd2376cf1fb6b02048abd93f052f1ddc555ff6d7f31cf2
3
+ size 4993854960
model-00040-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e222fc0d6c8109d43b62798d72b32101422260efb492662721c4f5c9d49144c
3
+ size 4993860720
model-00042-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d17d941cc20a2669c3af763cd8450477d8908d780b87d7bf25fe526d05c22d4f
3
+ size 4993855328
model-00044-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd10b01a69047f207f790ec84fd9347f26ce454550e4ca0cffa8904df8403b1f
3
+ size 4993855224
model-00045-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd84714f85e06b4ae98fd246a1cdbbb53f3ae5cf261f495dcf5294001ab0b7f4
3
+ size 4993860424
model-00047-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51bd5440a58dcf77f59a236e0c261afb73ad9328271547363a82834c84920083
3
+ size 4993860632
model-00048-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e2a38dd1ca57eb4e84904c0a69149777f4b34b6851699141ce43e2084647299
3
+ size 4993854808
model-00049-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15a0508c986debd1589bc745678b57a25743791faa043ea2539b1c560bb5e66b
3
+ size 4993855328
model-00052-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b62db2d5aaad26ddd4a6d11187793c0560ac767d99ddb1c2bf01ef2ac371b81
3
+ size 4993860368
model-00054-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d0c9f3b27f3d64de4d1dcfcfaef54773fe05cec48c99190f3b6db82c162725a
3
+ size 4993860576
model-00057-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb8c5058692f0d69f2f9f90be914eeef350fb0afab6682297b9b00645ae9922a
3
+ size 4993860336
model-00062-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ad9608264b45a7f33b5b13545742ae2ca1ff575ae1fe684cef8bf7f05a5bd6a
3
+ size 4993865168
model-00064-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:180036548c3c4260ee66a31cbae7d21b646a0cc1507fc08688fba66f77c3b362
3
+ size 4993803760
model-00070-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7637b0b2317318681a55227817a8aba114013ad394330800a1851f7af0339827
3
+ size 4993860696
model-00071-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3b82def1d2db15c878691451686b81ea6a60fd4acbebf60e52cc9b0ff0592b1
3
+ size 4993864992
model-00072-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21014c762262a04f2389a17e2b242b23a4456f4dd211609109823e202b76ef19
3
+ size 4993855328
model-00074-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ac3331a46d864cc1db33be4b1d2f65bc22587adbb749674417738bc1cd315fc
3
+ size 4993855240
model-00075-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aecb48ac43d9838c6275e0a6b7ce8e73715756ea1181f251c51f2344641ee97a
3
+ size 4993860408
model-00076-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fc92f762e69b61d77606fea0156f84b201782480f8c3ee7d388c1232ac708d5
3
+ size 4993865272
model-00079-of-00135.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f438701238016979a86cc1d4177eb339f9f01e31a8c1a3e51b02d31b1634be2
3
+ size 4993855328
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
recipe.yaml ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ default_stage:
2
+ default_modifiers:
3
+ QuantizationModifier:
4
+ targets: [Linear]
5
+ ignore: [lm_head]
6
+ scheme: W8A8
7
+ bypass_divisibility_checks: false
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|begin▁of▁sentence|>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|end▁of▁sentence|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|▁pad▁|>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff