End of training

Files changed (10) hide show

README.md CHANGED Viewed

@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the llamafactory/alpaca_en dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.6962
 ## Model description
@@ -55,7 +55,7 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch  | Step | Validation Loss |
 |:-------------:|:------:|:----:|:---------------:|
-| No log        | 0.1304 | 3    | 1.6962          |
 ### Framework versions

 This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the llamafactory/alpaca_en dataset.
 It achieves the following results on the evaluation set:
+- Loss: 1.6997
 ## Model description
 | Training Loss | Epoch  | Step | Validation Loss |
 |:-------------:|:------:|:----:|:---------------:|
+| No log        | 0.1304 | 3    | 1.6997          |
 ### Framework versions

all_results.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
     "epoch": 0.13043478260869565,
-    "eval_loss": 1.6962372064590454,
-    "eval_runtime": 2.034,
-    "eval_samples_per_second": 303.343,
-    "eval_steps_per_second": 4.916,
     "total_flos": 3.355230384370483e+16,
-    "train_loss": 1.4135243097941081,
-    "train_runtime": 205.0072,
-    "train_samples_per_second": 7.492,
-    "train_steps_per_second": 0.015
 }

 {
     "epoch": 0.13043478260869565,
+    "eval_loss": 1.6996564865112305,
+    "eval_runtime": 3.7243,
+    "eval_samples_per_second": 165.668,
+    "eval_steps_per_second": 2.685,
     "total_flos": 3.355230384370483e+16,
+    "train_loss": 1.413604736328125,
+    "train_runtime": 209.8464,
+    "train_samples_per_second": 7.32,
+    "train_steps_per_second": 0.014
 }

eval_results.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
     "epoch": 0.13043478260869565,
-    "eval_loss": 1.6962372064590454,
-    "eval_runtime": 2.034,
-    "eval_samples_per_second": 303.343,
-    "eval_steps_per_second": 4.916
 }

 {
     "epoch": 0.13043478260869565,
+    "eval_loss": 1.6996564865112305,
+    "eval_runtime": 3.7243,
+    "eval_samples_per_second": 165.668,
+    "eval_steps_per_second": 2.685
 }

model-00001-of-00003.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6356b35f5ddc42451822bcb670ad99661bb3e76e15db53bba6f14965ad048b7f
 size 4943162336

 version https://git-lfs.github.com/spec/v1
+oid sha256:39fd425c2691693d271bee5ea875bc2f1b6b1017f01e653ba8b6c3b62a4633de
 size 4943162336

model-00002-of-00003.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:09aacd51de6cf9a6f572cfc6d491f846f2758f1e3912717e3d56ad6269b88e83
 size 4999819336

 version https://git-lfs.github.com/spec/v1
+oid sha256:080f42ac9101b71fcd1daa06890b34c920bad36feefa58370a9541928028703f
 size 4999819336

model-00003-of-00003.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6afb6d8844dc79b7f84cda99eafc03a630519ddb355d2f2247bc2e630fa8df8f
 size 4540516344

 version https://git-lfs.github.com/spec/v1
+oid sha256:763a774370b3520296b4b083d0c293822a3441d5ecb4ef6c50593e287848e06d
 size 4540516344

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 0.13043478260869565,
     "total_flos": 3.355230384370483e+16,
-    "train_loss": 1.4135243097941081,
-    "train_runtime": 205.0072,
-    "train_samples_per_second": 7.492,
-    "train_steps_per_second": 0.015
 }

 {
     "epoch": 0.13043478260869565,
     "total_flos": 3.355230384370483e+16,
+    "train_loss": 1.413604736328125,
+    "train_runtime": 209.8464,
+    "train_samples_per_second": 7.32,
+    "train_steps_per_second": 0.014
 }

trainer_state.json CHANGED Viewed

@@ -10,20 +10,20 @@
   "log_history": [
     {
       "epoch": 0.13043478260869565,
-      "eval_loss": 1.6962372064590454,
-      "eval_runtime": 1.8584,
-      "eval_samples_per_second": 332.013,
-      "eval_steps_per_second": 5.381,
       "step": 3
     },
     {
       "epoch": 0.13043478260869565,
       "step": 3,
       "total_flos": 3.355230384370483e+16,
-      "train_loss": 1.4135243097941081,
-      "train_runtime": 205.0072,
-      "train_samples_per_second": 7.492,
-      "train_steps_per_second": 0.015
     }
   ],
   "logging_steps": 10,

   "log_history": [
     {
       "epoch": 0.13043478260869565,
+      "eval_loss": 1.6996564865112305,
+      "eval_runtime": 3.6392,
+      "eval_samples_per_second": 169.54,
+      "eval_steps_per_second": 2.748,
       "step": 3
     },
     {
       "epoch": 0.13043478260869565,
       "step": 3,
       "total_flos": 3.355230384370483e+16,
+      "train_loss": 1.413604736328125,
+      "train_runtime": 209.8464,
+      "train_samples_per_second": 7.32,
+      "train_steps_per_second": 0.014
     }
   ],
   "logging_steps": 10,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1520851757f31b8d05568c82a835c28b9e7b60b51902c9ec0f37649ce556cf29
 size 6520

 version https://git-lfs.github.com/spec/v1
+oid sha256:82eb5f4ba327bda293928b93e3ee0739a8a789c729db7c85c739cc28b0b3adaa
 size 6520

training_eval_loss.png CHANGED Viewed