sedrickkeh committed on
Commit
bd72f27
·
verified ·
1 Parent(s): 9fe6d04

End of training

Browse files
README.md CHANGED
@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the llamafactory/alpaca_en dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 1.6962
22
 
23
  ## Model description
24
 
@@ -55,7 +55,7 @@ The following hyperparameters were used during training:
55
 
56
  | Training Loss | Epoch | Step | Validation Loss |
57
  |:-------------:|:------:|:----:|:---------------:|
58
- | No log | 0.1304 | 3 | 1.6962 |
59
 
60
 
61
  ### Framework versions
 
18
 
19
  This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the llamafactory/alpaca_en dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 1.6997
22
 
23
  ## Model description
24
 
 
55
 
56
  | Training Loss | Epoch | Step | Validation Loss |
57
  |:-------------:|:------:|:----:|:---------------:|
58
+ | No log | 0.1304 | 3 | 1.6997 |
59
 
60
 
61
  ### Framework versions
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 0.13043478260869565,
3
- "eval_loss": 1.6962372064590454,
4
- "eval_runtime": 2.034,
5
- "eval_samples_per_second": 303.343,
6
- "eval_steps_per_second": 4.916,
7
  "total_flos": 3.355230384370483e+16,
8
- "train_loss": 1.4135243097941081,
9
- "train_runtime": 205.0072,
10
- "train_samples_per_second": 7.492,
11
- "train_steps_per_second": 0.015
12
  }
 
1
  {
2
  "epoch": 0.13043478260869565,
3
+ "eval_loss": 1.6996564865112305,
4
+ "eval_runtime": 3.7243,
5
+ "eval_samples_per_second": 165.668,
6
+ "eval_steps_per_second": 2.685,
7
  "total_flos": 3.355230384370483e+16,
8
+ "train_loss": 1.413604736328125,
9
+ "train_runtime": 209.8464,
10
+ "train_samples_per_second": 7.32,
11
+ "train_steps_per_second": 0.014
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 0.13043478260869565,
3
- "eval_loss": 1.6962372064590454,
4
- "eval_runtime": 2.034,
5
- "eval_samples_per_second": 303.343,
6
- "eval_steps_per_second": 4.916
7
  }
 
1
  {
2
  "epoch": 0.13043478260869565,
3
+ "eval_loss": 1.6996564865112305,
4
+ "eval_runtime": 3.7243,
5
+ "eval_samples_per_second": 165.668,
6
+ "eval_steps_per_second": 2.685
7
  }
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6356b35f5ddc42451822bcb670ad99661bb3e76e15db53bba6f14965ad048b7f
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39fd425c2691693d271bee5ea875bc2f1b6b1017f01e653ba8b6c3b62a4633de
3
  size 4943162336
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09aacd51de6cf9a6f572cfc6d491f846f2758f1e3912717e3d56ad6269b88e83
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:080f42ac9101b71fcd1daa06890b34c920bad36feefa58370a9541928028703f
3
  size 4999819336
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6afb6d8844dc79b7f84cda99eafc03a630519ddb355d2f2247bc2e630fa8df8f
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:763a774370b3520296b4b083d0c293822a3441d5ecb4ef6c50593e287848e06d
3
  size 4540516344
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 0.13043478260869565,
3
  "total_flos": 3.355230384370483e+16,
4
- "train_loss": 1.4135243097941081,
5
- "train_runtime": 205.0072,
6
- "train_samples_per_second": 7.492,
7
- "train_steps_per_second": 0.015
8
  }
 
1
  {
2
  "epoch": 0.13043478260869565,
3
  "total_flos": 3.355230384370483e+16,
4
+ "train_loss": 1.413604736328125,
5
+ "train_runtime": 209.8464,
6
+ "train_samples_per_second": 7.32,
7
+ "train_steps_per_second": 0.014
8
  }
trainer_state.json CHANGED
@@ -10,20 +10,20 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.13043478260869565,
13
- "eval_loss": 1.6962372064590454,
14
- "eval_runtime": 1.8584,
15
- "eval_samples_per_second": 332.013,
16
- "eval_steps_per_second": 5.381,
17
  "step": 3
18
  },
19
  {
20
  "epoch": 0.13043478260869565,
21
  "step": 3,
22
  "total_flos": 3.355230384370483e+16,
23
- "train_loss": 1.4135243097941081,
24
- "train_runtime": 205.0072,
25
- "train_samples_per_second": 7.492,
26
- "train_steps_per_second": 0.015
27
  }
28
  ],
29
  "logging_steps": 10,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.13043478260869565,
13
+ "eval_loss": 1.6996564865112305,
14
+ "eval_runtime": 3.6392,
15
+ "eval_samples_per_second": 169.54,
16
+ "eval_steps_per_second": 2.748,
17
  "step": 3
18
  },
19
  {
20
  "epoch": 0.13043478260869565,
21
  "step": 3,
22
  "total_flos": 3.355230384370483e+16,
23
+ "train_loss": 1.413604736328125,
24
+ "train_runtime": 209.8464,
25
+ "train_samples_per_second": 7.32,
26
+ "train_steps_per_second": 0.014
27
  }
28
  ],
29
  "logging_steps": 10,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1520851757f31b8d05568c82a835c28b9e7b60b51902c9ec0f37649ce556cf29
3
  size 6520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82eb5f4ba327bda293928b93e3ee0739a8a789c729db7c85c739cc28b0b3adaa
3
  size 6520
training_eval_loss.png CHANGED