flyingbugs committed on
Commit
8888369
·
verified ·
1 Parent(s): 10392e7

Model save

Browse files
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: Qwen/Qwen2.5-Math-7B
3
  library_name: transformers
4
  model_name: Qwen2.5-7B-Open-R1-Distill-mixed
5
  tags:
@@ -11,7 +11,7 @@ licence: license
11
 
12
  # Model Card for Qwen2.5-7B-Open-R1-Distill-mixed
13
 
14
- This model is a fine-tuned version of [Qwen/Qwen2.5-Math-7B](https://huggingface.co/Qwen/Qwen2.5-Math-7B).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
@@ -27,7 +27,7 @@ print(output["generated_text"])
27
 
28
  ## Training procedure
29
 
30
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/jjh233/huggingface/runs/4ee21rto)
31
 
32
 
33
  This model was trained with SFT.
 
1
  ---
2
+ base_model: Qwen/Qwen2.5-7B-Instruct
3
  library_name: transformers
4
  model_name: Qwen2.5-7B-Open-R1-Distill-mixed
5
  tags:
 
11
 
12
  # Model Card for Qwen2.5-7B-Open-R1-Distill-mixed
13
 
14
+ This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
 
27
 
28
  ## Training procedure
29
 
30
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/jjh233/huggingface/runs/qx8bei0j)
31
 
32
 
33
  This model was trained with SFT.
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "total_flos": 0.0,
3
- "train_loss": 9.05303086676834,
4
- "train_runtime": 99277.474,
5
  "train_samples": 16610,
6
- "train_samples_per_second": 0.218,
7
- "train_steps_per_second": 0.027
8
  }
 
1
  {
2
  "total_flos": 0.0,
3
+ "train_loss": 1.4448112659087413,
4
+ "train_runtime": 91860.5158,
5
  "train_samples": 16610,
6
+ "train_samples_per_second": 0.235,
7
+ "train_steps_per_second": 0.029
8
  }
config.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
- "_name_or_path": "Qwen/Qwen2.5-Math-7B",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 151643,
8
- "eos_token_id": 151643,
9
  "hidden_act": "silu",
10
  "hidden_size": 3584,
11
  "initializer_range": 0.02,
12
  "intermediate_size": 18944,
13
- "max_position_embeddings": 4096,
14
  "max_window_layers": 28,
15
  "model_type": "qwen2",
16
  "num_attention_heads": 28,
@@ -18,13 +18,12 @@
18
  "num_key_value_heads": 4,
19
  "rms_norm_eps": 1e-06,
20
  "rope_scaling": null,
21
- "rope_theta": 10000,
22
- "sliding_window": 4096,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.49.0.dev0",
26
  "use_cache": false,
27
- "use_mrope": false,
28
  "use_sliding_window": false,
29
  "vocab_size": 152064
30
  }
 
1
  {
2
+ "_name_or_path": "Qwen/Qwen2.5-7B-Instruct",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 151643,
8
+ "eos_token_id": 151645,
9
  "hidden_act": "silu",
10
  "hidden_size": 3584,
11
  "initializer_range": 0.02,
12
  "intermediate_size": 18944,
13
+ "max_position_embeddings": 32768,
14
  "max_window_layers": 28,
15
  "model_type": "qwen2",
16
  "num_attention_heads": 28,
 
18
  "num_key_value_heads": 4,
19
  "rms_norm_eps": 1e-06,
20
  "rope_scaling": null,
21
+ "rope_theta": 1000000.0,
22
+ "sliding_window": 131072,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.49.0.dev0",
26
  "use_cache": false,
 
27
  "use_sliding_window": false,
28
  "vocab_size": 152064
29
  }
generation_config.json CHANGED
@@ -1,6 +1,14 @@
1
  {
2
  "bos_token_id": 151643,
3
- "eos_token_id": 151643,
4
- "max_new_tokens": 2048,
 
 
 
 
 
 
 
 
5
  "transformers_version": "4.49.0.dev0"
6
  }
 
1
  {
2
  "bos_token_id": 151643,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "pad_token_id": 151643,
9
+ "repetition_penalty": 1.05,
10
+ "temperature": 0.7,
11
+ "top_k": 20,
12
+ "top_p": 0.8,
13
  "transformers_version": "4.49.0.dev0"
14
  }
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2177467f63bc5aaf9de4c301ab72af7adc904148d9b4cdf899d3504f907c3f6
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92aed972beb5efc162e81cc18cdc5b53fcb17ef4008e0413598dd0c72f6065d2
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:07daa14da790d0628aeeac16c6e30c981612031c50e40d9bb0059723ef5cdce7
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ed30defca2c386ff61e8ba0ad1dd3ab3b94de98d62978721f07fab5888b6c9f
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21c9b61a1843f674c3ec29013f216f2f33be3bc35548f1ad6527f3becea389b3
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:890e40b6ecfcf0b27cc96e67434473231bf9d6ef8c08a4ee40bfe963e27abb0d
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a42786061c92654b2876018ac9898c04f5cd4fc8254b88f5dcd90a396268cc1
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd4d107cb11585b17c4f3c92913dabf9e81ede449f5246e183ada044ed181fd2
3
  size 1089994880
results/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B/results_2025-02-10T16-08-09.207705.json ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config_general": {
3
+ "lighteval_sha": "?",
4
+ "num_fewshot_seeds": 1,
5
+ "override_batch_size": -1,
6
+ "max_samples": null,
7
+ "job_id": 0,
8
+ "start_time": 627433.20374781,
9
+ "end_time": 627650.868866556,
10
+ "total_evaluation_time_secondes": "217.66511874599382",
11
+ "model_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
12
+ "model_sha": "",
13
+ "model_dtype": null,
14
+ "model_size": null
15
+ },
16
+ "results": {
17
+ "custom|aime24|1": {
18
+ "extractive_match": 0.2,
19
+ "extractive_match_stderr": 0.07427813527082075
20
+ },
21
+ "all": {
22
+ "extractive_match": 0.2,
23
+ "extractive_match_stderr": 0.07427813527082075
24
+ }
25
+ },
26
+ "versions": {
27
+ "custom|aime24|1": 1
28
+ },
29
+ "config_tasks": {
30
+ "custom|aime24": {
31
+ "name": "aime24",
32
+ "prompt_function": "aime_prompt_fn",
33
+ "hf_repo": "HuggingFaceH4/aime_2024",
34
+ "hf_subset": "default",
35
+ "metric": [
36
+ {
37
+ "metric_name": "extractive_match",
38
+ "higher_is_better": true,
39
+ "category": "3",
40
+ "use_case": "1",
41
+ "sample_level_fn": "sample_level_fn",
42
+ "corpus_level_fn": "mean"
43
+ }
44
+ ],
45
+ "hf_revision": null,
46
+ "hf_filter": null,
47
+ "hf_avail_splits": [
48
+ "train"
49
+ ],
50
+ "trust_dataset": false,
51
+ "evaluation_splits": [
52
+ "train"
53
+ ],
54
+ "few_shots_split": null,
55
+ "few_shots_select": null,
56
+ "generation_size": 32768,
57
+ "generation_grammar": null,
58
+ "stop_sequence": [],
59
+ "num_samples": null,
60
+ "suite": [
61
+ "custom"
62
+ ],
63
+ "original_num_docs": 30,
64
+ "effective_num_docs": 30,
65
+ "must_remove_duplicate_docs": false,
66
+ "version": 1
67
+ }
68
+ },
69
+ "summary_tasks": {
70
+ "custom|aime24|1": {
71
+ "hashes": {
72
+ "hash_examples": "18ca0099f8d8f826",
73
+ "hash_full_prompts": "558d24d97c0a0742",
74
+ "hash_input_tokens": "4637fbc1de5f6656",
75
+ "hash_cont_tokens": "78ccf84b49581fa6"
76
+ },
77
+ "truncated": 0,
78
+ "non_truncated": 30,
79
+ "padded": 0,
80
+ "non_padded": 30,
81
+ "effective_few_shots": -1.0,
82
+ "num_truncated_few_shots": 30
83
+ }
84
+ },
85
+ "summary_general": {
86
+ "hashes": {
87
+ "hash_examples": "c4769936f28d3d77",
88
+ "hash_full_prompts": "a1a733ebec6ebc6d",
89
+ "hash_input_tokens": "a8ff12512b74af64",
90
+ "hash_cont_tokens": "fd258a745d12f011"
91
+ },
92
+ "truncated": 0,
93
+ "non_truncated": 30,
94
+ "padded": 0,
95
+ "non_padded": 30,
96
+ "num_truncated_few_shots": 30
97
+ }
98
+ }
special_tokens_map.json CHANGED
@@ -15,11 +15,11 @@
15
  "<|video_pad|>"
16
  ],
17
  "eos_token": {
18
- "content": "<|endoftext|>",
19
  "lstrip": false,
20
  "normalized": false,
21
  "rstrip": false,
22
  "single_word": false
23
  },
24
- "pad_token": "<|endoftext|>"
25
  }
 
15
  "<|video_pad|>"
16
  ],
17
  "eos_token": {
18
+ "content": "<|im_end|>",
19
  "lstrip": false,
20
  "normalized": false,
21
  "rstrip": false,
22
  "single_word": false
23
  },
24
+ "pad_token": "<|im_end|>"
25
  }
tokenizer_config.json CHANGED
@@ -195,13 +195,13 @@
195
  "<|video_pad|>"
196
  ],
197
  "bos_token": null,
198
- "chat_template": "{%- if tools %}\n {{- '<|im_start|>system\\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] }}\n {%- else %}\n {{- 'Please reason step by step, and put your final answer within \\\\boxed{}.' }}\n {%- endif %}\n {{- \"\\n\\n# Tools\\n\\nYou may call one or more functions to assist with the user query.\\n\\nYou are provided with function signatures within <tools></tools> XML tags:\\n<tools>\" }}\n {%- for tool in tools %}\n {{- \"\\n\" }}\n {{- tool | tojson }}\n {%- endfor %}\n {{- \"\\n</tools>\\n\\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\\n<tool_call>\\n{\\\"name\\\": <function-name>, \\\"arguments\\\": <args-json-object>}\\n</tool_call><|im_end|>\\n\" }}\n{%- else %}\n {%- if messages[0]['role'] == 'system' %}\n {{- '<|im_start|>system\\n' + messages[0]['content'] + '<|im_end|>\\n' }}\n {%- else %}\n {{- '<|im_start|>system\\nPlease reason step by step, and put your final answer within \\\\boxed{}.<|im_end|>\\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and not message.tool_calls) %}\n {{- '<|im_start|>' + message.role + '\\n' + message.content + '<|im_end|>' + '\\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role }}\n {%- if message.content %}\n {{- '\\n' + message.content }}\n {%- endif %}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '\\n<tool_call>\\n{\"name\": \"' }}\n {{- tool_call.name }}\n {{- '\", \"arguments\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- '}\\n</tool_call>' }}\n {%- endfor %}\n {{- '<|im_end|>\\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != \"tool\") %}\n {{- 
'<|im_start|>user' }}\n {%- endif %}\n {{- '\\n<tool_response>\\n' }}\n {{- message.content }}\n {{- '\\n</tool_response>' }}\n {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n {{- '<|im_end|>\\n' }}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\\n' }}\n{%- endif %}\n",
199
  "clean_up_tokenization_spaces": false,
200
- "eos_token": "<|endoftext|>",
201
  "errors": "replace",
202
  "extra_special_tokens": {},
203
  "model_max_length": 131072,
204
- "pad_token": "<|endoftext|>",
205
  "split_special_tokens": false,
206
  "tokenizer_class": "Qwen2Tokenizer",
207
  "unk_token": null
 
195
  "<|video_pad|>"
196
  ],
197
  "bos_token": null,
198
+ "chat_template": "{%- if tools %}\n {{- '<|im_start|>system\\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] }}\n {%- else %}\n {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }}\n {%- endif %}\n {{- \"\\n\\n# Tools\\n\\nYou may call one or more functions to assist with the user query.\\n\\nYou are provided with function signatures within <tools></tools> XML tags:\\n<tools>\" }}\n {%- for tool in tools %}\n {{- \"\\n\" }}\n {{- tool | tojson }}\n {%- endfor %}\n {{- \"\\n</tools>\\n\\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\\n<tool_call>\\n{\\\"name\\\": <function-name>, \\\"arguments\\\": <args-json-object>}\\n</tool_call><|im_end|>\\n\" }}\n{%- else %}\n {%- if messages[0]['role'] == 'system' %}\n {{- '<|im_start|>system\\n' + messages[0]['content'] + '<|im_end|>\\n' }}\n {%- else %}\n {{- '<|im_start|>system\\nYou are Qwen, created by Alibaba Cloud. 
You are a helpful assistant.<|im_end|>\\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and not message.tool_calls) %}\n {{- '<|im_start|>' + message.role + '\\n' + message.content + '<|im_end|>' + '\\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role }}\n {%- if message.content %}\n {{- '\\n' + message.content }}\n {%- endif %}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '\\n<tool_call>\\n{\"name\": \"' }}\n {{- tool_call.name }}\n {{- '\", \"arguments\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- '}\\n</tool_call>' }}\n {%- endfor %}\n {{- '<|im_end|>\\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != \"tool\") %}\n {{- '<|im_start|>user' }}\n {%- endif %}\n {{- '\\n<tool_response>\\n' }}\n {{- message.content }}\n {{- '\\n</tool_response>' }}\n {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n {{- '<|im_end|>\\n' }}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\\n' }}\n{%- endif %}\n",
199
  "clean_up_tokenization_spaces": false,
200
+ "eos_token": "<|im_end|>",
201
  "errors": "replace",
202
  "extra_special_tokens": {},
203
  "model_max_length": 131072,
204
+ "pad_token": "<|im_end|>",
205
  "split_special_tokens": false,
206
  "tokenizer_class": "Qwen2Tokenizer",
207
  "unk_token": null
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "total_flos": 0.0,
3
- "train_loss": 9.05303086676834,
4
- "train_runtime": 99277.474,
5
  "train_samples": 16610,
6
- "train_samples_per_second": 0.218,
7
- "train_steps_per_second": 0.027
8
  }
 
1
  {
2
  "total_flos": 0.0,
3
+ "train_loss": 1.4448112659087413,
4
+ "train_runtime": 91860.5158,
5
  "train_samples": 16610,
6
+ "train_samples_per_second": 0.235,
7
+ "train_steps_per_second": 0.029
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f311f0d076b6ff826d0428e10fb588767bf2c8f02c04ed19ff6db52a7decaa6
3
- size 6008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c61a9db7fca493e3e063521152d4de1a0e5c8a089eb36a2528d0b0d1d0294e9
3
+ size 5944