josem7 committed
Commit 294541f · Parent: 7dd1591

Upload config.json with huggingface_hub
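
For reference, a minimal sketch of the kind of call that produces a commit like this one, using the documented huggingface_hub upload_file API. The repo id josem7/SQL-SURI-13B-v0.2 is inferred from the new _name_or_path in the diff below, and authentication via a prior `huggingface-cli login` is an assumption:

```python
# Hypothetical sketch of the upload that yields this commit, using the
# standard huggingface_hub upload_file API. The repo id is inferred from
# the new "_name_or_path" in the diff; auth is assumed to come from a
# prior `huggingface-cli login`.
from huggingface_hub import HfApi

api = HfApi()
api.upload_file(
    path_or_fileobj="config.json",       # local file to push
    path_in_repo="config.json",          # destination path in the repo
    repo_id="josem7/SQL-SURI-13B-v0.2",  # assumed target repo
    commit_message="Upload config.json with huggingface_hub",
)
```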

Files changed (1): config.json (+4 −4)
config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/root/.cache/huggingface/hub/models--berrazuriz--SCHEMA-LINK-h2-SURI-13B/snapshots/35b59cad79de6a4cd7ab861174bc953d76194c27",
+  "_name_or_path": "/root/.cache/huggingface/hub/models--josem7--SQL-SURI-13B-v0.2/snapshots/3d3831df70dfcbfbc2bed1e33abc9d7fe9333091",
   "architectures": [
     "LlamaForCausalLM"
   ],
@@ -10,7 +10,7 @@
   "hidden_size": 5120,
   "initializer_range": 0.02,
   "intermediate_size": 13824,
-  "max_position_embeddings": 4096,
+  "max_position_embeddings": 16384,
   "model_type": "llama",
   "num_attention_heads": 40,
   "num_hidden_layers": 40,
@@ -18,10 +18,10 @@
   "pretraining_tp": 1,
   "rms_norm_eps": 1e-05,
   "rope_scaling": null,
-  "rope_theta": 10000.0,
+  "rope_theta": 1000000,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.35.0.dev0",
   "use_cache": true,
-  "vocab_size": 32000
+  "vocab_size": 32016
 }
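
Taken together, the changes point at a context-window extension: max_position_embeddings grows from 4096 to 16384 while rope_theta is raised from 10000.0 to 1000000, the usual base-frequency adjustment when stretching RoPE positions, and vocab_size grows from 32000 to 32016. A minimal sketch for checking the uploaded config with the standard transformers AutoConfig API (the repo id is again inferred from _name_or_path, not stated in the commit):

```python
# Sketch: verify the long-context settings after this commit, using the
# standard transformers AutoConfig API. Repo id is an assumption inferred
# from "_name_or_path"; expected values come from the new side of the diff.
from transformers import AutoConfig

config = AutoConfig.from_pretrained("josem7/SQL-SURI-13B-v0.2")
print(config.max_position_embeddings)  # expected: 16384
print(config.rope_theta)               # expected: 1000000
print(config.vocab_size)               # expected: 32016
```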