IeBoytsov
/

ox-llms-sula-10-profiles-sft

+{
+    "entropy": 0.1506435771783193,
+    "epoch": 1.0,
+    "mean_token_accuracy": 0.9381802678108215,
+    "num_tokens": 24937449.0,
+    "total_flos": 1.3805074115628892e+18,
+    "train_loss": 0.1824477752374585,
+    "train_runtime": 6615.9277,
+    "train_samples": 35223,
+    "train_samples_per_second": 5.324,
+    "train_steps_per_second": 0.333
+}

train_results.json ADDED Viewed

+{
+    "entropy": 0.1506435771783193,
+    "epoch": 1.0,
+    "mean_token_accuracy": 0.9381802678108215,
+    "num_tokens": 24937449.0,
+    "total_flos": 1.3805074115628892e+18,
+    "train_loss": 0.1824477752374585,
+    "train_runtime": 6615.9277,
+    "train_samples": 35223,
+    "train_samples_per_second": 5.324,
+    "train_steps_per_second": 0.333
+}

trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff