End of training

Files changed (4) hide show

README.md CHANGED Viewed

@@ -4,11 +4,23 @@ license: llama3.2
 base_model: meta-llama/Llama-3.2-1B
 tags:
 - generated_from_trainer
 metrics:
 - accuracy
 model-index:
 - name: test
-  results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,7 +28,7 @@ should probably proofread and complete it, then remove this comment. -->
 # test
-This model is a fine-tuned version of [meta-llama/Llama-3.2-1B](https://huggingface.co/meta-llama/Llama-3.2-1B) on an unknown dataset.
 It achieves the following results on the evaluation set:
 - Loss: 2.6568
 - Accuracy: 0.5230

 base_model: meta-llama/Llama-3.2-1B
 tags:
 - generated_from_trainer
+datasets:
+- LabHC/bias_in_bios
 metrics:
 - accuracy
 model-index:
 - name: test
+  results:
+  - task:
+      name: Causal Language Modeling
+      type: text-generation
+    dataset:
+      name: LabHC/bias_in_bios
+      type: LabHC/bias_in_bios
+    metrics:
+    - name: Accuracy
+      type: accuracy
+      value: 0.5230333635625984
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 # test
+This model is a fine-tuned version of [meta-llama/Llama-3.2-1B](https://huggingface.co/meta-llama/Llama-3.2-1B) on the LabHC/bias_in_bios dataset.
 It achieves the following results on the evaluation set:
 - Loss: 2.6568
 - Accuracy: 0.5230

all_results.json CHANGED Viewed

@@ -2,9 +2,10 @@
     "epoch": 1.0,
     "eval_accuracy": 0.5230333635625984,
     "eval_loss": 2.656813859939575,
-    "eval_runtime": 59.8639,
-    "eval_samples_per_second": 85.611,
-    "eval_steps_per_second": 10.708,
     "perplexity": 14.250811606566634,
     "total_flos": 1695049253388288.0,
     "train_loss": 2.6765631017550615,

     "epoch": 1.0,
     "eval_accuracy": 0.5230333635625984,
     "eval_loss": 2.656813859939575,
+    "eval_runtime": 59.9412,
+    "eval_samples": 5125,
+    "eval_samples_per_second": 85.5,
+    "eval_steps_per_second": 10.694,
     "perplexity": 14.250811606566634,
     "total_flos": 1695049253388288.0,
     "train_loss": 2.6765631017550615,

eval_results.json CHANGED Viewed

@@ -1,10 +1,10 @@
 {
     "epoch": 1.0,
-    "eval_accuracy": 0.5619722863264766,
-    "eval_loss": 2.4340596199035645,
-    "eval_runtime": 13.228,
-    "eval_samples": 1138,
-    "eval_samples_per_second": 86.03,
-    "eval_steps_per_second": 10.81,
-    "perplexity": 11.405088550670825
 }

 {
     "epoch": 1.0,
+    "eval_accuracy": 0.5230333635625984,
+    "eval_loss": 2.656813859939575,
+    "eval_runtime": 59.9412,
+    "eval_samples": 5125,
+    "eval_samples_per_second": 85.5,
+    "eval_steps_per_second": 10.694,
+    "perplexity": 14.250811606566634
 }

trainer_state.json CHANGED Viewed

@@ -26,6 +26,15 @@
       "train_runtime": 106.623,
       "train_samples_per_second": 5.318,
       "train_steps_per_second": 1.332
     }
   ],
   "logging_steps": 500,

       "train_runtime": 106.623,
       "train_samples_per_second": 5.318,
       "train_steps_per_second": 1.332
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.5230333635625984,
+      "eval_loss": 2.656813859939575,
+      "eval_runtime": 59.8639,
+      "eval_samples_per_second": 85.611,
+      "eval_steps_per_second": 10.708,
+      "step": 142
     }
   ],
   "logging_steps": 500,