Blancy committed on
Commit
4706082
·
verified ·
1 Parent(s): 504a2a2

Training in progress, epoch 1

Browse files
Files changed (3) hide show
  1. config.json +2 -2
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -8,9 +8,9 @@
8
  "eos_token_id": 151645,
9
  "head_dim": 128,
10
  "hidden_act": "silu",
11
- "hidden_size": 1024,
12
  "initializer_range": 0.02,
13
- "intermediate_size": 3072,
14
  "max_position_embeddings": 40960,
15
  "max_window_layers": 28,
16
  "model_type": "qwen3",
 
8
  "eos_token_id": 151645,
9
  "head_dim": 128,
10
  "hidden_act": "silu",
11
+ "hidden_size": 2048,
12
  "initializer_range": 0.02,
13
+ "intermediate_size": 6144,
14
  "max_position_embeddings": 40960,
15
  "max_window_layers": 28,
16
  "model_type": "qwen3",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e09dadbd1a2f9b52ba49439b7d86665fc098d329451d19761dc8b8c9a0d8713e
3
- size 1503300328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10a0e99b201648acb6ba458db99773a474c55d9ce92d72a203f30f6051dd1937
3
+ size 4063515640
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f15a9ef19580a4f91fd0f92f068fa8f8f23f39fafe4a093efa46d606d11c8aab
3
  size 7992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66bb1dd39935f18a98f0436e61fa9a767e1bedcbcb28b5b4d4a791a57719cde7
3
  size 7992