neginr committed on
Commit
abdead8
·
verified ·
1 Parent(s): 8832da6

End of training

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. all_results.json +3 -3
  3. train_results.json +3 -3
  4. trainer_state.json +3 -3
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # OpenR1-Math-Raw-all-correct-5k
18
 
19
- This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct) on an unknown dataset.
20
 
21
  ## Model description
22
 
 
16
 
17
  # OpenR1-Math-Raw-all-correct-5k
18
 
19
+ This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct) on the neginr/OpenR1-Math-Raw-all-correct-5k dataset.
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 6.955414012738854,
3
  "total_flos": 3.947982283988664e+17,
4
  "train_loss": 0.0,
5
- "train_runtime": 2.5246,
6
- "train_samples_per_second": 13863.535,
7
- "train_steps_per_second": 144.181
8
  }
 
2
  "epoch": 6.955414012738854,
3
  "total_flos": 3.947982283988664e+17,
4
  "train_loss": 0.0,
5
+ "train_runtime": 2.6671,
6
+ "train_samples_per_second": 13122.755,
7
+ "train_steps_per_second": 136.477
8
  }
train_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 6.955414012738854,
3
  "total_flos": 3.947982283988664e+17,
4
  "train_loss": 0.0,
5
- "train_runtime": 2.5246,
6
- "train_samples_per_second": 13863.535,
7
- "train_steps_per_second": 144.181
8
  }
 
2
  "epoch": 6.955414012738854,
3
  "total_flos": 3.947982283988664e+17,
4
  "train_loss": 0.0,
5
+ "train_runtime": 2.6671,
6
+ "train_samples_per_second": 13122.755,
7
+ "train_steps_per_second": 136.477
8
  }
trainer_state.json CHANGED
@@ -2561,9 +2561,9 @@
2561
  "step": 364,
2562
  "total_flos": 3.947982283988664e+17,
2563
  "train_loss": 0.0,
2564
- "train_runtime": 2.5246,
2565
- "train_samples_per_second": 13863.535,
2566
- "train_steps_per_second": 144.181
2567
  }
2568
  ],
2569
  "logging_steps": 1,
 
2561
  "step": 364,
2562
  "total_flos": 3.947982283988664e+17,
2563
  "train_loss": 0.0,
2564
+ "train_runtime": 2.6671,
2565
+ "train_samples_per_second": 13122.755,
2566
+ "train_steps_per_second": 136.477
2567
  }
2568
  ],
2569
  "logging_steps": 1,