ryanmarten committed on
Commit
c32cb39
·
verified ·
1 Parent(s): 5b37add

End of training

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. all_results.json +3 -3
  3. train_results.json +3 -3
  4. trainer_state.json +3 -3
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # e1_science_longest_r1
18
 
19
- This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct) on an unknown dataset.
20
 
21
  ## Model description
22
 
 
16
 
17
  # e1_science_longest_r1
18
 
19
+ This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct) on the mlfoundations-dev/e1_science_longest_r1 dataset.
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 4.9869587897756915,
3
  "total_flos": 2.8011398523411825e+18,
4
  "train_loss": 0.0,
5
- "train_runtime": 5.0033,
6
- "train_samples_per_second": 30641.958,
7
- "train_steps_per_second": 238.844
8
  }
 
2
  "epoch": 4.9869587897756915,
3
  "total_flos": 2.8011398523411825e+18,
4
  "train_loss": 0.0,
5
+ "train_runtime": 3.7901,
6
+ "train_samples_per_second": 40449.714,
7
+ "train_steps_per_second": 315.292
8
  }
train_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 4.9869587897756915,
3
  "total_flos": 2.8011398523411825e+18,
4
  "train_loss": 0.0,
5
- "train_runtime": 5.0033,
6
- "train_samples_per_second": 30641.958,
7
- "train_steps_per_second": 238.844
8
  }
 
2
  "epoch": 4.9869587897756915,
3
  "total_flos": 2.8011398523411825e+18,
4
  "train_loss": 0.0,
5
+ "train_runtime": 3.7901,
6
+ "train_samples_per_second": 40449.714,
7
+ "train_steps_per_second": 315.292
8
  }
trainer_state.json CHANGED
@@ -8378,9 +8378,9 @@
8378
  "step": 1195,
8379
  "total_flos": 2.8011398523411825e+18,
8380
  "train_loss": 0.0,
8381
- "train_runtime": 5.0033,
8382
- "train_samples_per_second": 30641.958,
8383
- "train_steps_per_second": 238.844
8384
  }
8385
  ],
8386
  "logging_steps": 1,
 
8378
  "step": 1195,
8379
  "total_flos": 2.8011398523411825e+18,
8380
  "train_loss": 0.0,
8381
+ "train_runtime": 3.7901,
8382
+ "train_samples_per_second": 40449.714,
8383
+ "train_steps_per_second": 315.292
8384
  }
8385
  ],
8386
  "logging_steps": 1,