Azrail committed on
Commit
38b1a1b
·
verified ·
1 Parent(s): 466c359

Training in progress, step 61000

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. config.json +1 -5
  3. model.safetensors +1 -1
  4. training_args.bin +1 -1
README.md CHANGED
@@ -1,8 +1,8 @@
1
  ---
2
  library_name: transformers
3
  tags:
4
- - generated_from_trainer
5
  - smallm
 
6
  model-index:
7
  - name: smallm_70_rope
8
  results: []
 
1
  ---
2
  library_name: transformers
3
  tags:
 
4
  - smallm
5
+ - generated_from_trainer
6
  model-index:
7
  - name: smallm_70_rope
8
  results: []
config.json CHANGED
@@ -4,10 +4,6 @@
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.1,
7
- "auto_map": {
8
- "AutoConfig": "config.SmalLmConfig",
9
- "AutoModelForCausalLM": "model.SmalLmForCausalLM"
10
- },
11
  "balancing_coef": 0.0001,
12
  "bos_token_id": 1,
13
  "embedding_dropout": 0.0,
@@ -43,7 +39,7 @@
43
  "sliding_window_attention": true,
44
  "sliding_window_context": 1024,
45
  "sliding_window_period": 4,
46
- "static_residual": true,
47
  "token_experts": 3,
48
  "torch_dtype": "float32",
49
  "transformers_version": "4.50.3",
 
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.1,
 
 
 
 
7
  "balancing_coef": 0.0001,
8
  "bos_token_id": 1,
9
  "embedding_dropout": 0.0,
 
39
  "sliding_window_attention": true,
40
  "sliding_window_context": 1024,
41
  "sliding_window_period": 4,
42
+ "static_residual": false,
43
  "token_experts": 3,
44
  "torch_dtype": "float32",
45
  "transformers_version": "4.50.3",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c41967e5432db5ed91bc1228a51744d8af764a94e341f801caf2cc8d0b340946
3
  size 301235464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ff3677e2a6c68c6a9bc84018c91a9abb1bcf7c14c1b566d1f4d545783476a72
3
  size 301235464
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae75bb2a8bb196138369db914584406a32731cac3b2572b642609f88b870f3b8
3
  size 6008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a964c444482261d405cae313adc306063a7a31a0cff9e89a43e151d806eeee7e
3
  size 6008