ucmp137538 committed on
Commit
e9db77e
·
verified ·
1 Parent(s): 812315c

Model save

Browse files
README.md CHANGED
@@ -26,7 +26,7 @@ print(output["generated_text"])
26
 
27
  ## Training procedure
28
 
29
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/mingzeli/PreThink_MemAgent/runs/c5tij9g9)
30
 
31
 
32
  This model was trained with SFT.
 
26
 
27
  ## Training procedure
28
 
29
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/mingzeli/PreThink_MemAgent/runs/6pz32z57)
30
 
31
 
32
  This model was trained with SFT.
all_results.json CHANGED
@@ -1,8 +1,13 @@
1
  {
 
 
 
 
 
2
  "total_flos": 21958899171328.0,
3
- "train_loss": 0.744699491904332,
4
- "train_runtime": 317.873,
5
  "train_samples": 821,
6
- "train_samples_per_second": 7.748,
7
- "train_steps_per_second": 0.123
8
  }
 
1
  {
2
+ "eval_loss": 0.5437560081481934,
3
+ "eval_runtime": 2.2423,
4
+ "eval_samples": 92,
5
+ "eval_samples_per_second": 41.029,
6
+ "eval_steps_per_second": 5.352,
7
  "total_flos": 21958899171328.0,
8
+ "train_loss": 0.0,
9
+ "train_runtime": 1.4645,
10
  "train_samples": 821,
11
+ "train_samples_per_second": 1681.768,
12
+ "train_steps_per_second": 26.63
13
  }
eval_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "eval_loss": 0.5437560081481934,
3
+ "eval_runtime": 2.2423,
4
+ "eval_samples": 92,
5
+ "eval_samples_per_second": 41.029,
6
+ "eval_steps_per_second": 5.352
7
+ }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "total_flos": 21958899171328.0,
3
- "train_loss": 0.744699491904332,
4
- "train_runtime": 317.873,
5
  "train_samples": 821,
6
- "train_samples_per_second": 7.748,
7
- "train_steps_per_second": 0.123
8
  }
 
1
  {
2
  "total_flos": 21958899171328.0,
3
+ "train_loss": 0.0,
4
+ "train_runtime": 1.4645,
5
  "train_samples": 821,
6
+ "train_samples_per_second": 1681.768,
7
+ "train_steps_per_second": 26.63
8
  }
trainer_state.json CHANGED
@@ -352,10 +352,10 @@
352
  "epoch": 3.0,
353
  "step": 39,
354
  "total_flos": 21958899171328.0,
355
- "train_loss": 0.744699491904332,
356
- "train_runtime": 317.873,
357
- "train_samples_per_second": 7.748,
358
- "train_steps_per_second": 0.123
359
  }
360
  ],
361
  "logging_steps": 1,
 
352
  "epoch": 3.0,
353
  "step": 39,
354
  "total_flos": 21958899171328.0,
355
+ "train_loss": 0.0,
356
+ "train_runtime": 1.4645,
357
+ "train_samples_per_second": 1681.768,
358
+ "train_steps_per_second": 26.63
359
  }
360
  ],
361
  "logging_steps": 1,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9bd5b9b81772425f2ca2d35ad7d8a3b7ce1df0e42aa7fc718f442a5c6f551fe3
3
  size 7889
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7abbf6d93c48bb7a1e3846a182c4aed4be2d9d92eb50729f609e3a287e235b19
3
  size 7889