deepnet committed on
Commit
59dcd47
·
verified ·
1 Parent(s): 59dbc71

Upload LlamaForCausalLM

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/Training/TrainedModel3B/",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
@@ -21,14 +21,10 @@
21
  "num_attention_heads": 24,
22
  "num_hidden_layers": 24,
23
  "num_key_value_heads": 24,
24
- "pop_states_at_layer": null,
25
  "pretraining_tp": 1,
26
- "return_states_at_layer": null,
27
  "rms_norm_eps": 1e-05,
28
  "rope_scaling": null,
29
  "rope_theta": 10000.0,
30
- "start_at_layer": null,
31
- "stash_states_at_layer": null,
32
  "tie_word_embeddings": false,
33
  "torch_dtype": "bfloat16",
34
  "transformers_version": "4.44.1",
 
1
  {
2
+ "_name_or_path": "/Training/SN9TrainedModel3B/",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
21
  "num_attention_heads": 24,
22
  "num_hidden_layers": 24,
23
  "num_key_value_heads": 24,
 
24
  "pretraining_tp": 1,
 
25
  "rms_norm_eps": 1e-05,
26
  "rope_scaling": null,
27
  "rope_theta": 10000.0,
 
 
28
  "tie_word_embeddings": false,
29
  "torch_dtype": "bfloat16",
30
  "transformers_version": "4.44.1",
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef4ace5d09552bc4d7df3dcc888d3eae58a1c052c980a56b375b1999fb9a7020
3
  size 4971811976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb2ac7b7d03d6915ea4f8e3905b83c22d35cff236f137e39b35757f16c006e4e
3
  size 4971811976
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59412f144c256b8d8f7f5d43a45e74b0a324ff182f2c3b637138e9d9348dbbbf
3
  size 1828189840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75fd98b950f7538dd779a624b03dbd276b00302f7671d0be907dc3d09f21643b
3
  size 1828189840