Kwang-su committed on
Commit
4fef478
·
verified ·
1 Parent(s): c01b679

Upload LlamaForCausalLM

Browse files
config.json CHANGED
@@ -1,17 +1,19 @@
1
  {
2
- "_name_or_path": "beomi/Llama-3-Open-Ko-8B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
- "eos_token_id": 128001,
 
 
10
  "hidden_act": "silu",
11
  "hidden_size": 4096,
12
  "initializer_range": 0.02,
13
  "intermediate_size": 14336,
14
  "max_position_embeddings": 8192,
 
15
  "model_type": "llama",
16
  "num_attention_heads": 32,
17
  "num_hidden_layers": 32,
@@ -21,8 +23,7 @@
21
  "rope_scaling": null,
22
  "rope_theta": 500000.0,
23
  "tie_word_embeddings": false,
24
- "torch_dtype": "float16",
25
- "transformers_version": "4.40.0",
26
  "use_cache": true,
27
  "vocab_size": 128256
28
  }
 
1
  {
 
2
  "architectures": [
3
  "LlamaForCausalLM"
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 128000,
8
+ "dtype": "float16",
9
+ "eos_token_id": 128009,
10
+ "head_dim": 128,
11
  "hidden_act": "silu",
12
  "hidden_size": 4096,
13
  "initializer_range": 0.02,
14
  "intermediate_size": 14336,
15
  "max_position_embeddings": 8192,
16
+ "mlp_bias": false,
17
  "model_type": "llama",
18
  "num_attention_heads": 32,
19
  "num_hidden_layers": 32,
 
23
  "rope_scaling": null,
24
  "rope_theta": 500000.0,
25
  "tie_word_embeddings": false,
26
+ "transformers_version": "4.57.6",
 
27
  "use_cache": true,
28
  "vocab_size": 128256
29
  }
generation_config.json CHANGED
@@ -1,7 +1,12 @@
1
  {
2
- "_from_model_config": true,
3
- "bos_token_id": 1,
4
- "eos_token_id": 2,
5
- "pad_token_id": 2,
6
- "transformers_version": "4.40.0"
 
 
 
 
 
7
  }
 
1
  {
2
+ "bos_token_id": 128000,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128009
7
+ ],
8
+ "max_length": 4096,
9
+ "temperature": 0.6,
10
+ "top_p": 0.9,
11
+ "transformers_version": "4.57.6"
12
  }
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56d48c98d37db8ac378e16475f67eee3cf48fd27287985e9493eddc4d3bf4d7c
3
  size 4976698592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:face513dab35244d03043f49e596805fbdaca2b9eb58dcf1e6a74a2f253ba665
3
  size 4976698592
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c66cc87e46255fa80896de9a67d9c7d94cf55de57d0fc86753f925226977f7f7
3
  size 4999802616
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf8042f848cde7cedaf8b563c87dc0885cb37074b21f28dfef2a98df57eb59c8
3
  size 4999802616
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52560285f89bc12524e5bb7f7609037b49434ccfb081ae6b626371e4fd1c5d94
3
  size 4915916080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8403da2ee8bb2a5caf8ff74a4118c0fb537af80dc042997e5f6777948c9a6122
3
  size 4915916080
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed70a3a9c1986d5b047fc1354aac07495559f1ebc37908e505a1655e44913680
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:146753a60dc85291a4fc40674be347e996064b6cd5a2e48f4b888000a1e19440
3
  size 1168138808
model.safetensors.index.json CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "metadata": {
 
3
  "total_size": 16060522496
4
  },
5
  "weight_map": {
 
1
  {
2
  "metadata": {
3
+ "total_parameters": 8030261248,
4
  "total_size": 16060522496
5
  },
6
  "weight_map": {