camsemianalsyis committed 7 days ago

Commit

ae0c5d8

verified ·

1 Parent(s): 408ba06

Add files using upload-large-folder tool

Browse files

Files changed (50) hide show

chat_template.jinja +101 -0
config.json +115 -0
generation_config.json +9 -0
model-00001-of-00135.safetensors +3 -0
model-00003-of-00135.safetensors +3 -0
model-00005-of-00135.safetensors +3 -0
model-00006-of-00135.safetensors +3 -0
model-00009-of-00135.safetensors +3 -0
model-00012-of-00135.safetensors +3 -0
model-00013-of-00135.safetensors +3 -0
model-00016-of-00135.safetensors +3 -0
model-00017-of-00135.safetensors +3 -0
model-00018-of-00135.safetensors +3 -0
model-00021-of-00135.safetensors +3 -0
model-00022-of-00135.safetensors +3 -0
model-00023-of-00135.safetensors +3 -0
model-00024-of-00135.safetensors +3 -0
model-00027-of-00135.safetensors +3 -0
model-00028-of-00135.safetensors +3 -0
model-00030-of-00135.safetensors +3 -0
model-00031-of-00135.safetensors +3 -0
model-00033-of-00135.safetensors +3 -0
model-00034-of-00135.safetensors +3 -0
model-00035-of-00135.safetensors +3 -0
model-00038-of-00135.safetensors +3 -0
model-00039-of-00135.safetensors +3 -0
model-00040-of-00135.safetensors +3 -0
model-00042-of-00135.safetensors +3 -0
model-00044-of-00135.safetensors +3 -0
model-00045-of-00135.safetensors +3 -0
model-00047-of-00135.safetensors +3 -0
model-00048-of-00135.safetensors +3 -0
model-00049-of-00135.safetensors +3 -0
model-00052-of-00135.safetensors +3 -0
model-00054-of-00135.safetensors +3 -0
model-00057-of-00135.safetensors +3 -0
model-00062-of-00135.safetensors +3 -0
model-00064-of-00135.safetensors +3 -0
model-00070-of-00135.safetensors +3 -0
model-00071-of-00135.safetensors +3 -0
model-00072-of-00135.safetensors +3 -0
model-00074-of-00135.safetensors +3 -0
model-00075-of-00135.safetensors +3 -0
model-00076-of-00135.safetensors +3 -0
model-00079-of-00135.safetensors +3 -0
model.safetensors.index.json +0 -0
recipe.yaml +7 -0
special_tokens_map.json +23 -0
tokenizer.json +0 -0
tokenizer_config.json +0 -0

chat_template.jinja ADDED Viewed

	@@ -0,0 +1,101 @@

+{%- if not add_generation_prompt is defined %}
+    {%- set add_generation_prompt = false %}
+{%- endif %}
+{%- set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='', is_first_sp=true, is_last_user=false) %}
+{%- for message in messages %}
+    {%- if message['role'] == 'system' %}
+        {%- if ns.is_first_sp %}
+            {%- set ns.system_prompt = ns.system_prompt + message['content'] %}
+            {%- set ns.is_first_sp = false %}
+        {%- else %}
+            {%- set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}
+        {%- endif %}
+    {%- endif %}
+{%- endfor %}
+{#- Adapted from https://github.com/sgl-project/sglang/blob/main/examples/chat_template/tool_chat_template_deepseekr1.jinja #}
+{%- if tools is defined and tools is not none %}
+    {%- set tool_ns = namespace(text='You are a helpful assistant with tool calling capabilities. ' + 'When a tool call is needed, you MUST use the following format to issue the call:\n' + '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>function<｜tool▁sep｜>FUNCTION_NAME\n' + '```json\n{"param1": "value1", "param2": "value2"}\n```<｜tool▁call▁end｜><｜tool▁calls▁end｜>\n\n' + 'Make sure the JSON is valid.\n\n' + '## Tools\n\n### Function\n\nYou have the following functions available:\n\n') %}{#- the blank line after 'valid.' keeps the '## Tools' heading at the start of its own line #}
+    {%- for tool in tools %}
+        {%- set tool_ns.text = tool_ns.text + '\n```json\n' + (tool | tojson) + '\n```\n' %}
+    {%- endfor %}
+    {%- if ns.system_prompt|length != 0 %}
+        {%- set ns.system_prompt = ns.system_prompt + '\n\n' + tool_ns.text %}
+    {%- else %}
+        {%- set ns.system_prompt = tool_ns.text %}
+    {%- endif %}
+{%- endif %}
+{{- bos_token }}
+{{- ns.system_prompt }}
+{%- set last_index = (messages|length - 1) %}
+{%- for message in messages %}
+    {%- set content = message['content'] %}
+    {%- if message['role'] == 'user' %}
+        {%- set ns.is_tool = false -%}
+        {%- set ns.is_first = false -%}
+        {%- set ns.is_last_user = true -%}
+        {%- if loop.index0 == last_index %}
+            {{- '<｜User｜>' + content }}
+        {%- else %}
+            {{- '<｜User｜>' + content + '<｜Assistant｜>'}}
+        {%- endif %}
+    {%- endif %}
+    {#- Keep only the text after the last '</think>' in assistant turns. The string test
+        matters: tool-call turns may carry content=None, and "'</think>' in None" raises. #}
+    {%- if message['role'] == 'assistant' and content is string and '</think>' in content %}
+        {%- set content = (content.split('</think>')|last) %}
+    {%- endif %}
+    {%- if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}
+        {%- set ns.is_last_user = false -%}
+        {%- if ns.is_tool %}
+            {{- '<｜tool▁outputs▁end｜>'}}
+        {%- endif %}
+        {%- set ns.is_first = false %}
+        {%- set ns.is_tool = false -%}
+        {%- set ns.is_output_first = true %}
+        {%- for tool in message['tool_calls'] %}
+            {%- set arguments = tool['function']['arguments'] %}
+            {%- if arguments is not string %}
+                {%- set arguments = arguments|tojson %}
+            {%- endif %}
+            {%- if not ns.is_first %}
+                {%- if content is none %}
+                    {{- '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\n' + '```json' + '\n' + arguments + '\n' + '```' + '<｜tool▁call▁end｜>'}}
+                    {#- A stray literal closing brace used to sit here; it leaked a newline, indentation and the brace into the prompt after the first call. #}
+                {%- else %}
+                    {{- content + '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\n' + '```json' + '\n' + arguments + '\n' + '```' + '<｜tool▁call▁end｜>'}}
+                {%- endif %}
+                {%- set ns.is_first = true -%}
+            {%- else %}
+                {{- '\n' + '<｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\n' + '```json' + '\n' + arguments + '\n' + '```' + '<｜tool▁call▁end｜>'}}
+            {%- endif %}
+        {%- endfor %}
+        {{- '<｜tool▁calls▁end｜><｜end▁of▁sentence｜>'}}
+    {%- endif %}
+    {%- if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none) %}
+        {%- set ns.is_last_user = false -%}
+        {%- if ns.is_tool %}
+            {{- '<｜tool▁outputs▁end｜>' + content + '<｜end▁of▁sentence｜>'}}
+            {%- set ns.is_tool = false -%}
+        {%- else %}
+            {{- content + '<｜end▁of▁sentence｜>'}}
+        {%- endif %}
+    {%- endif %}
+    {%- if message['role'] == 'tool' %}
+        {%- set ns.is_last_user = false -%}
+        {%- set ns.is_tool = true -%}
+        {%- if ns.is_output_first %}
+            {{- '<｜tool▁outputs▁begin｜><｜tool▁output▁begin｜>' + content + '<｜tool▁output▁end｜>'}}
+            {%- set ns.is_output_first = false %}
+        {%- else %}
+            {{- '\n<｜tool▁output▁begin｜>' + content + '<｜tool▁output▁end｜>'}}
+        {%- endif %}
+    {%- endif %}
+{%- endfor -%}
+{%- if ns.is_tool %}
+    {{- '<｜tool▁outputs▁end｜>'}}
+{%- endif %}
+{#- if add_generation_prompt and not ns.is_last_user and not ns.is_tool #}
+{%- if add_generation_prompt and not ns.is_tool %}
+    {{- '<｜Assistant｜>'}}
+{%- endif %}

config.json ADDED Viewed

	@@ -0,0 +1,115 @@

+{
+  "architectures": [
+    "DeepseekV3ForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "auto_map": {
+    "AutoConfig": "configuration_deepseek.DeepseekV3Config",
+    "AutoModel": "modeling_deepseek.DeepseekV3Model",
+    "AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM"
+  },
+  "bos_token_id": 0,
+  "dtype": "bfloat16",
+  "eos_token_id": 1,
+  "ep_size": 1,
+  "first_k_dense_replace": 3,
+  "head_dim": 64,
+  "hidden_act": "silu",
+  "hidden_size": 7168,
+  "initializer_range": 0.02,
+  "intermediate_size": 18432,
+  "kv_lora_rank": 512,
+  "max_position_embeddings": 163840,
+  "model_type": "deepseek_v3",
+  "moe_intermediate_size": 2048,
+  "moe_layer_freq": 1,
+  "n_group": 8,
+  "n_routed_experts": 256,
+  "n_shared_experts": 1,
+  "norm_topk_prob": true,
+  "num_attention_heads": 128,
+  "num_experts_per_tok": 8,
+  "num_hidden_layers": 61,
+  "num_key_value_heads": 128,
+  "num_nextn_predict_layers": 1,
+  "pad_token_id": 2,
+  "pretraining_tp": 1,
+  "q_lora_rank": 1536,
+  "qk_head_dim": 192,
+  "qk_nope_head_dim": 128,
+  "qk_rope_head_dim": 64,
+  "quantization_config": {
+    "config_groups": {
+      "group_0": {
+        "format": "int-quantized",
+        "input_activations": {
+          "actorder": null,
+          "block_structure": null,
+          "dynamic": true,
+          "group_size": null,
+          "num_bits": 8,
+          "observer": null,
+          "observer_kwargs": {},
+          "scale_dtype": null,
+          "strategy": "token",
+          "symmetric": true,
+          "type": "int",
+          "zp_dtype": null
+        },
+        "output_activations": null,
+        "targets": [
+          "Linear"
+        ],
+        "weights": {
+          "actorder": null,
+          "block_structure": null,
+          "dynamic": false,
+          "group_size": null,
+          "num_bits": 8,
+          "observer": "memoryless_minmax",
+          "observer_kwargs": {},
+          "scale_dtype": null,
+          "strategy": "channel",
+          "symmetric": true,
+          "type": "int",
+          "zp_dtype": null
+        }
+      }
+    },
+    "format": "int-quantized",
+    "global_compression_ratio": null,
+    "ignore": [
+      "lm_head"
+    ],
+    "kv_cache_scheme": null,
+    "quant_method": "compressed-tensors",
+    "quantization_status": "compressed",
+    "sparsity_config": {},
+    "transform_config": {},
+    "version": "0.14.0.1"
+  },
+  "rms_norm_eps": 1e-06,
+  "rope_interleave": true,
+  "rope_scaling": {
+    "beta_fast": 32.0,
+    "beta_slow": 1.0,
+    "factor": 40.0,
+    "mscale": 1.0,
+    "mscale_all_dim": 1.0,
+    "original_max_position_embeddings": 4096,
+    "rope_type": "yarn",
+    "type": "yarn"
+  },
+  "rope_theta": 10000,
+  "routed_scaling_factor": 2.5,
+  "scoring_func": "sigmoid",
+  "tie_word_embeddings": false,
+  "topk_group": 4,
+  "topk_method": "noaux_tc",
+  "transformers_version": "4.57.6",
+  "unsloth_fixed": true,
+  "use_cache": true,
+  "v_head_dim": 128,
+  "vocab_size": 129280
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 0,
+  "do_sample": true,
+  "eos_token_id": 1,
+  "temperature": 0.6,
+  "top_p": 0.95,
+  "transformers_version": "4.57.6"
+}

model-00001-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6eeea0d5a585f59581246895a2e50ed7a44fbc324e1a9e8458574fd957cc78fe
+size 4996170688

model-00003-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:621c02e029b4dd789358b5b2a7e42e624247d4704d9d64228b1fc6a399e886fb
+size 4993864896

model-00005-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:718df2252ec16287f1c81c512deaa3fde9041a60eba2c2d788a452e8b21faf83
+size 4993854648

model-00006-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e12eed0df0f2018ae2d5828fe7966d834d0fdc94adb5d5f52d8b180c42b8c17a
+size 4993859656

model-00009-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be4b3dda7a9f549b58669b42245bbea4638bdf3631eb8b7c883a8868d0d55fed
+size 4993864512

model-00012-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93f81f3c5b3622ac7f4ecbc51088675e5f5836a01dae5b3e51e527e005c9f775
+size 4993854648

model-00013-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ae8727e35e1f0066abe844d8c16b3bfc8d7b43240add36deceddc7f93bbf237d
+size 4993859656

model-00016-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b567d5539bba366f5b41f60eca1c289e155fc676ef5844fe85338c91acc299e9
+size 4993854328

model-00017-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9f2465d4f86f597adb86a2539188644b632b54f8dd34478082050d1580814d31
+size 4993860088

model-00018-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7638e3a655377b6f91e6539429698145a5883b4406b53b8c8962dd9d19779be
+size 4993854792

model-00021-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb3e5ea00a1eca8eb7f2bd61d1a33c4ad6dd45537b66b5a3ee4f469e3996eb3c
+size 4993855272

model-00022-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7812fb5769bb381d5b56775d479b0b03ada464af5e3948686957d3149fff8509
+size 4993860384

model-00023-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dd0b7c7b96815e6e38f540bdaf08a1d1f0518832c0acc5bccdec4fbb7e675d91
+size 4993855056

model-00024-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0c24b4133ca6e529c2fca0be5154c0f9ca25470bd1f5ca48f81a58169d88238
+size 4993860592

model-00027-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d6a9704ee1cf67ed3138f61c9dbd8311cc2bb763e1a679846bb552c1e9c142a8
+size 4993860328

model-00028-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d38bae63aa601c72fe4ac163934078c74da33599797b978e9eab03204bde5057
+size 4993855320

model-00030-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1cefe2fe15f9ba847968145192a503c7581275578e608d7ab9544965505cd815
+size 4993865360

model-00031-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:21656b7c8d9e3d4995cec3dff0e66602477733f12fccb49485d95d1e2a057fa9
+size 4993860536

model-00033-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d507ffeba5cfd1ff5befcb8d6190dca815877c0029226e5cd84f62f1bb735c1
+size 4997526088

model-00034-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5720daf2560f8e97ea57d41ae49165fc77fccf38b8c2d7e0ae8021928c86f9c7
+size 4990189360

model-00035-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2ad64b63fb2aae6646e1ff2d30bd62ec73fb3532c7406cfadb38b3c20bff7645
+size 4993865576

model-00038-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6c4e4c4eddaca6d4d0925c4df3007755cafdf4fb5edb3e23bda46f2fa374c0f9
+size 4993860480

model-00039-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e028f1bd9b2b62fa6cbd2376cf1fb6b02048abd93f052f1ddc555ff6d7f31cf2
+size 4993854960

model-00040-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7e222fc0d6c8109d43b62798d72b32101422260efb492662721c4f5c9d49144c
+size 4993860720

model-00042-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d17d941cc20a2669c3af763cd8450477d8908d780b87d7bf25fe526d05c22d4f
+size 4993855328

model-00044-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd10b01a69047f207f790ec84fd9347f26ce454550e4ca0cffa8904df8403b1f
+size 4993855224

model-00045-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd84714f85e06b4ae98fd246a1cdbbb53f3ae5cf261f495dcf5294001ab0b7f4
+size 4993860424

model-00047-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:51bd5440a58dcf77f59a236e0c261afb73ad9328271547363a82834c84920083
+size 4993860632

model-00048-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e2a38dd1ca57eb4e84904c0a69149777f4b34b6851699141ce43e2084647299
+size 4993854808

model-00049-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:15a0508c986debd1589bc745678b57a25743791faa043ea2539b1c560bb5e66b
+size 4993855328

model-00052-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b62db2d5aaad26ddd4a6d11187793c0560ac767d99ddb1c2bf01ef2ac371b81
+size 4993860368

model-00054-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d0c9f3b27f3d64de4d1dcfcfaef54773fe05cec48c99190f3b6db82c162725a
+size 4993860576

model-00057-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb8c5058692f0d69f2f9f90be914eeef350fb0afab6682297b9b00645ae9922a
+size 4993860336

model-00062-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ad9608264b45a7f33b5b13545742ae2ca1ff575ae1fe684cef8bf7f05a5bd6a
+size 4993865168

model-00064-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:180036548c3c4260ee66a31cbae7d21b646a0cc1507fc08688fba66f77c3b362
+size 4993803760

model-00070-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7637b0b2317318681a55227817a8aba114013ad394330800a1851f7af0339827
+size 4993860696

model-00071-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a3b82def1d2db15c878691451686b81ea6a60fd4acbebf60e52cc9b0ff0592b1
+size 4993864992

model-00072-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:21014c762262a04f2389a17e2b242b23a4456f4dd211609109823e202b76ef19
+size 4993855328

model-00074-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5ac3331a46d864cc1db33be4b1d2f65bc22587adbb749674417738bc1cd315fc
+size 4993855240

model-00075-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aecb48ac43d9838c6275e0a6b7ce8e73715756ea1181f251c51f2344641ee97a
+size 4993860408

model-00076-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9fc92f762e69b61d77606fea0156f84b201782480f8c3ee7d388c1232ac708d5
+size 4993865272

model-00079-of-00135.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9f438701238016979a86cc1d4177eb339f9f01e31a8c1a3e51b02d31b1634be2
+size 4993855328

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

recipe.yaml ADDED Viewed

	@@ -0,0 +1,7 @@

+default_stage:
+  default_modifiers:
+    QuantizationModifier:
+      targets: [Linear]
+      ignore: [lm_head]
+      scheme: W8A8
+      bypass_divisibility_checks: false

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "bos_token": {
+    "content": "<｜begin▁of▁sentence｜>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<｜end▁of▁sentence｜>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<｜▁pad▁｜>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

The diff for this file is too large to render. See raw diff