Chan-Y
/

RegularLLM-iOS

Model card · Files and versions

Chan-Y committed on Jan 1

Commit

868a7c0

·

verified ·

1 Parent(s): f65321d

Update mlc-chat-config.json

Files changed (1) hide show

mlc-chat-config.json +69 -40

mlc-chat-config.json CHANGED Viewed

@@ -1,43 +1,72 @@
 {
-    "version": "0.1.0",
-    "model_type": "qwen2",
-    "quantization": "q4f16_1",
-    "model_config": {
-        "hidden_size": 768,
-        "intermediate_size": 3072,
-        "num_attention_heads": 12,
-        "num_hidden_layers": 12,
-        "num_key_value_heads": 4,
-        "rms_norm_eps": 1e-05,
-        "rope_theta": 10000.0,
-        "vocab_size": 32768,
-        "tie_word_embeddings": true,
-        "context_window_size": 2048,
-        "sliding_window_size": 128,
-        "prefill_chunk_size": 512,
-        "head_dim": 64,
-        "dtype": "float32",
-        "hidden_act": "silu"
-    },
     "vocab_size": 32768,
-    "conv_template": {
-        "name": "custom_chat",
-        "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
-        "system_message": "You are a helpful AI assistant created by Cihan Yalçın.",
-        "roles": {
-            "user": "<|im_start|>user",
-            "assistant": "<|im_start|>assistant"
-        },
-        "seps": [
-            "<|im_end|>\n"
-        ],
-        "stop_str": [
-            "<|im_end|>",
-            "<|endoftext|>"
-        ],
-        "stop_token_ids": [
-            0,
-            2
-        ]
-    }
 }

 {
+  "version": "0.1.0",
+  "model_type": "qwen2",
+  "model_lib": "regular_llm_v1",
+  "quantization": "q4f16_1",
+  "model_config": {
+    "hidden_act": "silu",
+    "hidden_size": 768,
+    "intermediate_size": 3072,
+    "num_attention_heads": 12,
+    "num_hidden_layers": 12,
+    "num_key_value_heads": 4,
+    "rms_norm_eps": 1e-05,
+    "rope_theta": 10000.0,
     "vocab_size": 32768,
+    "tie_word_embeddings": true,
+    "context_window_size": 2048,
+    "prefill_chunk_size": 512,
+    "tensor_parallel_shards": 1,
+    "head_dim": 64,
+    "dtype": "float32"
+  },
+  "vocab_size": 32768,
+  "context_window_size": 2048,
+  "sliding_window_size": 128,
+  "prefill_chunk_size": 512,
+  "attention_sink_size": -1,
+  "tensor_parallel_shards": 1,
+  "pipeline_parallel_stages": 1,
+  "temperature": 0.7,
+  "presence_penalty": 0.0,
+  "frequency_penalty": 0.0,
+  "repetition_penalty": 1.1,
+  "top_p": 0.8,
+  "tokenizer_files": [
+    "tokenizer.json",
+    "tokenizer_config.json"
+  ],
+  "tokenizer_info": {
+    "token_postproc_method": "byte_level",
+    "prepend_space_in_encode": false,
+    "strip_space_in_decode": false
+  },
+  "conv_template": {
+    "name": "qwen2",
+    "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
+    "system_message": "You are a helpful AI assistant created by Cihan Yalçın.",
+    "roles": {
+      "user": "<|im_start|>user",
+      "assistant": "<|im_start|>assistant"
+    },
+    "seps": [
+      "<|im_end|>\n"
+    ],
+    "role_content_sep": "\n",
+    "role_empty_sep": "\n",
+    "stop_str": [
+      "<|endoftext|>",
+      "<|im_end|>"
+    ],
+    "stop_token_ids": [
+      0,
+      2
+    ]
+  },
+  "pad_token_id": 0,
+  "bos_token_id": 0,
+  "eos_token_id": [
+    2,
+    0
+  ]
 }