bluuluu committed on
Commit
66b72f8
·
verified ·
1 Parent(s): a53113b

End of training

Browse files
Files changed (3) hide show
  1. README.md +3 -1
  2. all_results.json +5 -0
  3. eval_results.json +4 -4
README.md CHANGED
@@ -1,14 +1,16 @@
1
  ---
 
2
  library_name: transformers
3
  model_name: Qwen2.5-1.5B-Open-R1-Distill
4
  tags:
5
  - generated_from_trainer
 
6
  licence: license
7
  ---
8
 
9
  # Model Card for Qwen2.5-1.5B-Open-R1-Distill
10
 
11
- This model is a fine-tuned version of [None](https://huggingface.co/None).
12
  It has been trained using [TRL](https://github.com/huggingface/trl).
13
 
14
  ## Quick start
 
1
  ---
2
+ datasets: HuggingFaceH4/Bespoke-Stratos-17k
3
  library_name: transformers
4
  model_name: Qwen2.5-1.5B-Open-R1-Distill
5
  tags:
6
  - generated_from_trainer
7
+ - open-r1
8
  licence: license
9
  ---
10
 
11
  # Model Card for Qwen2.5-1.5B-Open-R1-Distill
12
 
13
+ This model is a fine-tuned version of [None](https://huggingface.co/None) on the [HuggingFaceH4/Bespoke-Stratos-17k](https://huggingface.co/datasets/HuggingFaceH4/Bespoke-Stratos-17k) dataset.
14
  It has been trained using [TRL](https://github.com/huggingface/trl).
15
 
16
  ## Quick start
all_results.json CHANGED
@@ -1,4 +1,9 @@
1
  {
 
 
 
 
 
2
  "total_flos": 0.0,
3
  "train_loss": 0.8600422314672648,
4
  "train_runtime": 45916.2025,
 
1
  {
2
+ "eval_loss": 0.8818749785423279,
3
+ "eval_runtime": 22.8006,
4
+ "eval_samples": 100,
5
+ "eval_samples_per_second": 4.386,
6
+ "eval_steps_per_second": 0.57,
7
  "total_flos": 0.0,
8
  "train_loss": 0.8600422314672648,
9
  "train_runtime": 45916.2025,
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "eval_loss": 0.9327651262283325,
3
- "eval_runtime": 8.8796,
4
  "eval_samples": 100,
5
- "eval_samples_per_second": 7.433,
6
- "eval_steps_per_second": 0.563
7
  }
 
1
  {
2
+ "eval_loss": 0.8818749785423279,
3
+ "eval_runtime": 22.8006,
4
  "eval_samples": 100,
5
+ "eval_samples_per_second": 4.386,
6
+ "eval_steps_per_second": 0.57
7
  }