LLucass committed on
Commit
00048be
·
verified ·
1 Parent(s): ee7dfbc

Training in progress, step 50

Browse files
Files changed (3) hide show
  1. config.json +1 -2
  2. model.safetensors +1 -1
  3. training_args.bin +1 -1
config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_name_or_path": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
@@ -22,7 +21,7 @@
22
  "sliding_window": 4096,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
- "transformers_version": "4.49.0",
26
  "use_cache": false,
27
  "use_mrope": false,
28
  "use_sliding_window": false,
 
1
  {
 
2
  "architectures": [
3
  "Qwen2ForCausalLM"
4
  ],
 
21
  "sliding_window": 4096,
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "bfloat16",
24
+ "transformers_version": "4.51.3",
25
  "use_cache": false,
26
  "use_mrope": false,
27
  "use_sliding_window": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18c6ff50b4bee65d3c8c028fa049a67a93811e0f82eb994ece75923a73d56483
3
  size 3554214752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17239d2b3c3e1a5b520841a5f02034acd62155541e8d16cb28849cd0b1e47a02
3
  size 3554214752
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af73b27661da8a7d636c4f31b34d39635bc198f5be08b10a1504c40be9a75769
3
  size 8184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebbb74d674013a368a52aaab287a1e88a12d2111e547dd2e742c9c5aa026eca7
3
  size 8184