Stefan1982 committed on
Commit
031973a
·
verified ·
1 Parent(s): 0afeb61

Training in progress, step 100

Browse files
Files changed (3) hide show
  1. config.json +4 -4
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -6,16 +6,16 @@
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 2,
9
- "head_dim": 128,
10
  "hidden_act": "silu",
11
- "hidden_size": 1024,
12
  "initializer_range": 0.02,
13
- "intermediate_size": 5000,
14
  "max_position_embeddings": 2048,
15
  "mlp_bias": false,
16
  "model_type": "stockllama",
17
  "num_attention_heads": 8,
18
- "num_hidden_layers": 8,
19
  "num_key_value_heads": 8,
20
  "pad_token_id": 0,
21
  "pretraining_tp": 1,
 
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 2,
9
+ "head_dim": 256,
10
  "hidden_act": "silu",
11
+ "hidden_size": 2048,
12
  "initializer_range": 0.02,
13
+ "intermediate_size": 8192,
14
  "max_position_embeddings": 2048,
15
  "mlp_bias": false,
16
  "model_type": "stockllama",
17
  "num_attention_heads": 8,
18
+ "num_hidden_layers": 12,
19
  "num_key_value_heads": 8,
20
  "pad_token_id": 0,
21
  "pretraining_tp": 1,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:270d4f45357a1b8e5e170ee0b59b369d295dc2b7a373c72e4e5da2cf18f2cd68
3
- size 994459984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b7759cd17fa076b59364644ced80fa7d1cce0dc9797030dffe2b548f4140746
3
+ size 3958731256
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1feb4ae246ed74c133831cd522d3f268c44240db3e54cc445e171cd434558978
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:719182d078a65dad32d29e443cd06558d8aabb2fbf857e8656103b6b9a87c3c6
3
  size 5176