Fix: Properly convert to HuggingFace LLaMA format with correct weight mapping and architecture

Files changed (3)

config.json CHANGED

@@ -8,7 +8,7 @@
   "hidden_act": "silu",
   "hidden_size": 288,
   "initializer_range": 0.02,
-  "intermediate_size": 1152,
   "max_position_embeddings": 2048,
   "model_type": "llama",
   "num_attention_heads": 6,

   "hidden_act": "silu",
   "hidden_size": 288,
   "initializer_range": 0.02,
+  "intermediate_size": 768,
   "max_position_embeddings": 2048,
   "model_type": "llama",
   "num_attention_heads": 6,

model.safetensors CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bed91b7aeb518d64f5265f2cadbea89da2c8fdf9d83d2dac469905e18c6eaae2
-size 25088104

 version https://git-lfs.github.com/spec/v1
+oid sha256:d910edc7031721de23a7af111e355e6c09d5f1b3a2c43c0b6b0aa6a9135ffe03
+size 25088592

tokenizer_config.json CHANGED

@@ -5,6 +5,7 @@
   "legacy": false,
   "model_max_length": 2048,
   "tokenizer_class": "LlamaTokenizer",
   "bos_token": {
     "__type": "AddedToken",
     "content": "<s>",

   "legacy": false,
   "model_max_length": 2048,
   "tokenizer_class": "LlamaTokenizer",
+  "pad_token": "<unk>",
   "bos_token": {
     "__type": "AddedToken",
     "content": "<s>",