flyingbugs committed on
Commit
ed0bef3
·
verified ·
1 Parent(s): ad99498

Model save

Browse files
README.md CHANGED
@@ -27,7 +27,7 @@ print(output["generated_text"])
27
 
28
  ## Training procedure
29
 
30
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/jjh233/huggingface/runs/l9e79305)
31
 
32
 
33
  This model was trained with SFT.
 
27
 
28
  ## Training procedure
29
 
30
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/jjh233/huggingface/runs/21iwqcw5)
31
 
32
 
33
  This model was trained with SFT.
all_results.json CHANGED
@@ -5,9 +5,9 @@
5
  "eval_samples_per_second": 4.944,
6
  "eval_steps_per_second": 1.265,
7
  "total_flos": 65635690217472.0,
8
- "train_loss": 0.7333491018714284,
9
- "train_runtime": 2770.9424,
10
- "train_samples": 16610,
11
- "train_samples_per_second": 31.21,
12
- "train_steps_per_second": 0.244
13
  }
 
5
  "eval_samples_per_second": 4.944,
6
  "eval_steps_per_second": 1.265,
7
  "total_flos": 65635690217472.0,
8
+ "train_loss": 0.0,
9
+ "train_runtime": 0.9025,
10
+ "train_samples": 93733,
11
+ "train_samples_per_second": 38008.288,
12
+ "train_steps_per_second": 296.966
13
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "total_flos": 65635690217472.0,
3
- "train_loss": 0.7333491018714284,
4
- "train_runtime": 2770.9424,
5
- "train_samples": 16610,
6
- "train_samples_per_second": 31.21,
7
- "train_steps_per_second": 0.244
8
  }
 
1
  {
2
  "total_flos": 65635690217472.0,
3
+ "train_loss": 0.0,
4
+ "train_runtime": 0.9025,
5
+ "train_samples": 93733,
6
+ "train_samples_per_second": 38008.288,
7
+ "train_steps_per_second": 296.966
8
  }
trainer_state.json CHANGED
@@ -2197,14 +2197,14 @@
2197
  "epoch": 1.0,
2198
  "step": 676,
2199
  "total_flos": 65635690217472.0,
2200
- "train_loss": 0.7333491018714284,
2201
- "train_runtime": 2770.9424,
2202
- "train_samples_per_second": 31.21,
2203
- "train_steps_per_second": 0.244
2204
  }
2205
  ],
2206
  "logging_steps": 5,
2207
- "max_steps": 676,
2208
  "num_input_tokens_seen": 0,
2209
  "num_train_epochs": 1,
2210
  "save_steps": 100,
 
2197
  "epoch": 1.0,
2198
  "step": 676,
2199
  "total_flos": 65635690217472.0,
2200
+ "train_loss": 0.0,
2201
+ "train_runtime": 0.9025,
2202
+ "train_samples_per_second": 38008.288,
2203
+ "train_steps_per_second": 296.966
2204
  }
2205
  ],
2206
  "logging_steps": 5,
2207
+ "max_steps": 268,
2208
  "num_input_tokens_seen": 0,
2209
  "num_train_epochs": 1,
2210
  "save_steps": 100,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72587138b5bb06ff5f7542be9ffb8468fbbacb0edfdd36ce6dc92498595c3cdc
3
- size 7416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ffb7cda303708d9e1ceff69a1d310dcccc3fdd78818229bcf01013473d18deb
3
+ size 7480