manojredhat committed on
Commit
8f4b37b
·
verified ·
1 Parent(s): f058bcd

Fix: Properly convert to HuggingFace LLaMA format with correct weight mapping and architecture

Browse files
Files changed (3) hide show
  1. config.json +1 -1
  2. model.safetensors +2 -2
  3. tokenizer_config.json +1 -0
config.json CHANGED
@@ -8,7 +8,7 @@
8
  "hidden_act": "silu",
9
  "hidden_size": 288,
10
  "initializer_range": 0.02,
11
- "intermediate_size": 1152,
12
  "max_position_embeddings": 2048,
13
  "model_type": "llama",
14
  "num_attention_heads": 6,
 
8
  "hidden_act": "silu",
9
  "hidden_size": 288,
10
  "initializer_range": 0.02,
11
+ "intermediate_size": 768,
12
  "max_position_embeddings": 2048,
13
  "model_type": "llama",
14
  "num_attention_heads": 6,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bed91b7aeb518d64f5265f2cadbea89da2c8fdf9d83d2dac469905e18c6eaae2
3
- size 25088104
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d910edc7031721de23a7af111e355e6c09d5f1b3a2c43c0b6b0aa6a9135ffe03
3
+ size 25088592
tokenizer_config.json CHANGED
@@ -5,6 +5,7 @@
5
  "legacy": false,
6
  "model_max_length": 2048,
7
  "tokenizer_class": "LlamaTokenizer",
 
8
  "bos_token": {
9
  "__type": "AddedToken",
10
  "content": "<s>",
 
5
  "legacy": false,
6
  "model_max_length": 2048,
7
  "tokenizer_class": "LlamaTokenizer",
8
+ "pad_token": "<unk>",
9
  "bos_token": {
10
  "__type": "AddedToken",
11
  "content": "<s>",