neginr committed on
Commit
2735db1
·
verified ·
1 Parent(s): 743f304

End of training

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. all_results.json +3 -3
  3. train_results.json +3 -3
  4. trainer_state.json +3 -3
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # r1_annotated_finqa
18
 
19
- This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct) on an unknown dataset.
20
 
21
  ## Model description
22
 
 
16
 
17
  # r1_annotated_finqa
18
 
19
+ This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct) on the mlfoundations-dev/r1_annotated_finqa dataset.
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 6.955414012738854,
3
  "total_flos": 1.6645198251751014e+17,
4
  "train_loss": 0.0,
5
- "train_runtime": 5.2904,
6
- "train_samples_per_second": 6615.788,
7
- "train_steps_per_second": 68.804
8
  }
 
2
  "epoch": 6.955414012738854,
3
  "total_flos": 1.6645198251751014e+17,
4
  "train_loss": 0.0,
5
+ "train_runtime": 2.7097,
6
+ "train_samples_per_second": 12916.486,
7
+ "train_steps_per_second": 134.331
8
  }
train_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 6.955414012738854,
3
  "total_flos": 1.6645198251751014e+17,
4
  "train_loss": 0.0,
5
- "train_runtime": 5.2904,
6
- "train_samples_per_second": 6615.788,
7
- "train_steps_per_second": 68.804
8
  }
 
2
  "epoch": 6.955414012738854,
3
  "total_flos": 1.6645198251751014e+17,
4
  "train_loss": 0.0,
5
+ "train_runtime": 2.7097,
6
+ "train_samples_per_second": 12916.486,
7
+ "train_steps_per_second": 134.331
8
  }
trainer_state.json CHANGED
@@ -2561,9 +2561,9 @@
2561
  "step": 364,
2562
  "total_flos": 1.6645198251751014e+17,
2563
  "train_loss": 0.0,
2564
- "train_runtime": 5.2904,
2565
- "train_samples_per_second": 6615.788,
2566
- "train_steps_per_second": 68.804
2567
  }
2568
  ],
2569
  "logging_steps": 1,
 
2561
  "step": 364,
2562
  "total_flos": 1.6645198251751014e+17,
2563
  "train_loss": 0.0,
2564
+ "train_runtime": 2.7097,
2565
+ "train_samples_per_second": 12916.486,
2566
+ "train_steps_per_second": 134.331
2567
  }
2568
  ],
2569
  "logging_steps": 1,