bluuluu committed on
Commit
f6d76d0
·
verified ·
1 Parent(s): f4dbd47

Model save

Browse files
Files changed (4) hide show
  1. README.md +3 -3
  2. all_results.json +4 -4
  3. train_results.json +4 -4
  4. trainer_state.json +0 -0
README.md CHANGED
@@ -24,17 +24,17 @@ print(output["generated_text"])
24
 
25
  ## Training procedure
26
 
27
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/2741919970-hustvl/huggingface/runs/kmc58nu5)
28
 
29
 
30
  This model was trained with SFT.
31
 
32
  ### Framework versions
33
 
34
- - TRL: 0.15.0.dev0
35
  - Transformers: 4.49.0.dev0
36
  - Pytorch: 2.5.1
37
- - Datasets: 3.2.0
38
  - Tokenizers: 0.21.0
39
 
40
  ## Citations
 
24
 
25
  ## Training procedure
26
 
27
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/2741919970-hustvl/huggingface/runs/4c8t09gs)
28
 
29
 
30
  This model was trained with SFT.
31
 
32
  ### Framework versions
33
 
34
+ - TRL: 0.16.0.dev0
35
  - Transformers: 4.49.0.dev0
36
  - Pytorch: 2.5.1
37
+ - Datasets: 3.3.0
38
  - Tokenizers: 0.21.0
39
 
40
  ## Citations
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "total_flos": 0.0,
3
- "train_loss": 0.984842965855427,
4
- "train_runtime": 39952.7795,
5
  "train_samples": 16610,
6
- "train_samples_per_second": 3.298,
7
- "train_steps_per_second": 0.103
8
  }
 
1
  {
2
  "total_flos": 0.0,
3
+ "train_loss": 0.9694986148756377,
4
+ "train_runtime": 60321.7593,
5
  "train_samples": 16610,
6
+ "train_samples_per_second": 1.456,
7
+ "train_steps_per_second": 0.023
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "total_flos": 0.0,
3
- "train_loss": 0.984842965855427,
4
- "train_runtime": 39952.7795,
5
  "train_samples": 16610,
6
- "train_samples_per_second": 3.298,
7
- "train_steps_per_second": 0.103
8
  }
 
1
  {
2
  "total_flos": 0.0,
3
+ "train_loss": 0.9694986148756377,
4
+ "train_runtime": 60321.7593,
5
  "train_samples": 16610,
6
+ "train_samples_per_second": 1.456,
7
+ "train_steps_per_second": 0.023
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff