Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

.gitattributes +2 -0
README.md +15 -0
config.json +10 -0
embeddings_bf16.bin +3 -0
export_args.json +42 -0
llm.mnn +3 -0
llm.mnn.json +0 -0
llm.mnn.weight +3 -0
llm_config.json +11 -0
tokenizer.txt +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+llm.mnn filter=lfs diff=lfs merge=lfs -text
+llm.mnn.weight filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -1,3 +1,18 @@
 ---
 license: apache-2.0
 ---

 ---
 license: apache-2.0
+language:
+- en
+base_model: Nanbeige/Nanbeige4.1-3B
+base_model_relation: quantized
+pipeline_tag: text-generation
+library_name: mnn
+tags:
+- code
+- mnn
 ---
+This model, [DeProgrammer/Nanbeige4.1-3B-MNN](https://huggingface.co/DeProgrammer/Nanbeige4.1-3B-MNN), was
+converted to MNN format from [Nanbeige/Nanbeige4.1-3B](https://huggingface.co/Nanbeige/Nanbeige4.1-3B)
+using [llmexport.py](https://github.com/alibaba/MNN/issues/4153#issuecomment-3866182869) in [MNN version **3.4.0**](https://github.com/alibaba/MNN/commit/a874b302f094599e2838a9186e5ce2cf6a81a7a7).
+Inference can be run via MNN, e.g., MNN Chat on Android.

config.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+    "llm_model": "llm.mnn",
+    "llm_weight": "llm.mnn.weight",
+    "backend_type": "cpu",
+    "thread_num": 4,
+    "precision": "low",
+    "memory": "low",
+    "sampler_type": "penalty",
+    "penalty": 1.1
+}

embeddings_bf16.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:038397ef5b03e16c16d8d69df3c03d503e3d279913dca86dacae53d8c182803a
+size 850657280

export_args.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+    "path": "Nanbeige/Nanbeige4.1-3B",
+    "type": null,
+    "tokenizer_path": "Nanbeige/Nanbeige4.1-3B",
+    "eagle_path": null,
+    "lora_path": null,
+    "gptq_path": null,
+    "dst_path": "./model",
+    "verbose": false,
+    "test": null,
+    "export": "mnn",
+    "onnx_slim": false,
+    "quant_bit": 8,
+    "quant_block": 64,
+    "visual_quant_bit": null,
+    "visual_quant_block": null,
+    "lm_quant_bit": 8,
+    "lm_quant_block": 64,
+    "mnnconvert": "../../../build/MNNConvert",
+    "ppl": false,
+    "awq": false,
+    "hqq": false,
+    "omni": false,
+    "transformer_fuse": false,
+    "group_conv_native": false,
+    "smooth": false,
+    "sym": false,
+    "visual_sym": false,
+    "seperate_embed": false,
+    "lora_split": false,
+    "calib_data": null,
+    "act_bit": 16,
+    "embed_bit": 16,
+    "act_sym": false,
+    "quant_config": null,
+    "generate_for_npu": false,
+    "skip_weight": false,
+    "omni_epochs": 20,
+    "omni_lr": 0.005,
+    "omni_wd": 0.0001,
+    "tie_word_embeddings": false
+}

llm.mnn ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d4e22b71abb1d44f17640d5a25a280595d966e66f818f2ff455e7a1a015e858e
+size 558736

llm.mnn.json ADDED Viewed

The diff for this file is too large to render. See raw diff

llm.mnn.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3269e2db150a7a4e427513f16fa2a11a1e19707d1c2814c2b3bf1e27dbae60b9
+size 3948049994

llm_config.json ADDED Viewed

	@@ -0,0 +1,11 @@

+{
+    "model_type": "llama",
+    "hidden_size": 2560,
+    "attention_mask": "float",
+    "attention_type": "full",
+    "jinja": {
+        "chat_template": "\n        {%- if tools %}\n            {{- '<|im_start|>system\n' }}\n            {%- if messages[0].role == 'system' %}\n                {{- messages[0].content + '\n\n' }}\n            {%- else %} \n                {{- '你是一位工具函数调用专家，你会得到一个问题和一组可能的工具函数。根据问题，你需要进行一个或多个函数/工具调用以实现目的，请尽量尝试探索通过工具解决问题。\n如果没有一个函数可以使用，请直接使用自然语言回复用户。\n如果给定的问题缺少函数所需的参数，请使用自然语言进行提问，向用户询问必要信息。\n如果调用结果已经足够回答用户问题，请对历史结果进行总结，使用自然语言回复用户。' }} \n            {%- endif %}\n            {{- \"# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>\" }}\n            {%- for tool in tools %}\n                {{- \"\n\" }}\n                {{- tool | tojson }}\n            {%- endfor %}\n            {{- \"\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\\\"name\\\": <function-name>, \\\"arguments\\\": <args-json-object>}\n</tool_call><|im_end|>\n\" }}\n        {%- else %}\n            {%- if messages[0].role == 'system' %}\n                {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}\n            {%- else %} \n                {{- '<|im_start|>system\n你是南北阁，一款由BOSS直聘自主研发并训练的专业大语言模型。<|im_end|>\n' }} \n            {%- endif %}\n        {%- endif %}\n        {%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}\n        {%- for message in messages[::-1] %}\n            {%- set index = (messages|length - 1) - loop.index0 %}\n            {%- if ns.multi_step_tool and message.role == \"user\" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}\n                {%- set ns.multi_step_tool = false %}\n                {%- set ns.last_query_index = index %}\n            {%- endif %}\n        {%- endfor %}\n        {%- for message in messages %}\n   
         {%- if message.content is string %}\n                {%- set content = message.content %}\n            {%- else %}\n                {%- set content = '' %}\n            {%- endif %}\n            {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) %}\n                {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}\n            {%- elif message.role == \"assistant\" %}\n                {%- set reasoning_content = '' %}\n                {%- if message.reasoning_content is string %}\n                    {%- set reasoning_content = message.reasoning_content %}\n                {%- else %}\n                    {%- if '</think>' in content %}\n                        {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}\n                        {%- set content = content.split('</think>')[-1].lstrip('\n') %}\n                    {%- endif %}\n                {%- endif %}\n                {%- if loop.index0 > ns.last_query_index or keep_all_think or (extra_body is defined and extra_body.keep_all_think) %}\n                    {%- if loop.last or (not loop.last and reasoning_content) %}\n                        {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}\n                    {%- else %}\n                        {{- '<|im_start|>' + message.role + '\n' + content }}\n                    {%- endif %}\n                {%- else %}\n                    {{- '<|im_start|>' + message.role + '\n' + content }}\n                {%- endif %}\n                {%- if message.tool_calls %}\n                    {%- for tool_call in message.tool_calls %}\n                        {%- if (loop.first and content) or (not loop.first) %}\n                            {{- '\n' }}\n                        {%- endif %}\n                        {%- if tool_call.function %}\n                           
 {%- set tool_call = tool_call.function %}\n                        {%- endif %}\n                        {{- '<tool_call>\n{\"name\": \"' }}\n                        {{- tool_call.name }}\n                        {{- '\", \"arguments\": ' }}\n                        {%- if tool_call.arguments is string %}\n                            {{- tool_call.arguments }}\n                        {%- else %}\n                            {{- tool_call.arguments | tojson }}\n                        {%- endif %}\n                        {{- '}\n</tool_call>' }}\n                    {%- endfor %}\n                {%- endif %}\n                {{- '<|im_end|>\n' }}\n            {%- elif message.role == \"tool\" %}\n                {%- if loop.first or (messages[loop.index0 - 1].role != \"tool\") %}\n                    {{- '<|im_start|>user' }}\n                {%- endif %}\n                {{- '\n<tool_response>\n' }}\n                {{- content }}\n                {{- '\n</tool_response>' }}\n                {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n                    {{- '<|im_end|>\n' }}\n                {%- endif %}\n            {%- endif %}\n        {%- endfor %}\n        {%- if add_generation_prompt %}\n            {{- '<|im_start|>assistant\n' }}\n        {%- endif %}\n",
+        "bos": "<|im_start|>",
+        "eos": "<|im_end|>"
+    }
+}

tokenizer.txt ADDED Viewed

The diff for this file is too large to render. See raw diff