Training update: run 436, 500 iters, cache_key=ci

Files changed (3)

README.md CHANGED

@@ -25,10 +25,10 @@ capabilities inspired by cognitive science and AGI research.
 ## Training Details
-- **Checkpoint ID**: ckpt_20260513_155809_12000_22deff1b_9470fbb7
-- **Training Iteration**: 12000
-- **Validation Loss**: 0.0003513691975240363
-- **Quality Score**: 1843200.7807372825
 ## Echo Self Features

 ## Training Details
+- **Checkpoint ID**: ckpt_20260513_212450_500_22deff1b_9470fbb7
+- **Training Iteration**: 500
+- **Validation Loss**: 7.496852426528931
+- **Quality Score**: 76800.67333019339
 ## Echo Self Features

pytorch_model.bin CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9acb930fbe51b80b57e70218078de1b5174ede81a0e65f9ef77a594e69aed4e5
 size 51464851

 version https://git-lfs.github.com/spec/v1
+oid sha256:d69e74bbf8b8ab5302e94a2db9c0ffbbce2e76816fea133d0829df99baed8027
 size 51464851

training_metadata.json CHANGED

@@ -1,11 +1,11 @@
 {
-  "checkpoint_id": "ckpt_20260513_155809_12000_22deff1b_9470fbb7",
-  "created_at": "2026-05-13T15:58:09.879130",
-  "iteration": 12000,
   "epoch": 0,
   "train_loss": 0.0,
-  "val_loss": 0.0003513691975240363,
-  "learning_rate": 0.0001322181943393505,
   "model_config": {
     "n_layer": 4,
     "n_head": 4,
@@ -36,20 +36,20 @@
     "block_size": 1024
   },
   "metrics": {
-    "val_loss": 0.0003513691975240363,
-    "connection_ratio": 1.0,
-    "tokens_processed": 24576000,
-    "training_speed_iters_per_sec": 0.07942402197792674
   },
   "tags": [
     "phase_adaptive_mastery",
-    "high_quality",
     "nanecho",
     "curriculum",
     "introspection"
   ],
   "parent_checkpoint": null,
-  "notes": "Training checkpoint at iteration 12000 (resumed from iteration 11500) | Phase: adaptive_mastery",
-  "file_size_mb": 253.3669786453247,
-  "quality_score": 1843200.7807372825
 }

 {
+  "checkpoint_id": "ckpt_20260513_212450_500_22deff1b_9470fbb7",
+  "created_at": "2026-05-13T21:24:50.756411",
+  "iteration": 500,
   "epoch": 0,
   "train_loss": 0.0,
+  "val_loss": 7.496852426528931,
+  "learning_rate": 1.3971999999999998e-05,
   "model_config": {
     "n_layer": 4,
     "n_head": 4,
     "block_size": 1024
   },
   "metrics": {
+    "val_loss": 7.496852426528931,
+    "connection_ratio": 0.3,
+    "tokens_processed": 1024000,
+    "training_speed_iters_per_sec": 0.08243751204598182
   },
   "tags": [
     "phase_adaptive_mastery",
+    "low_quality",
     "nanecho",
     "curriculum",
     "introspection"
   ],
   "parent_checkpoint": null,
+  "notes": "Training checkpoint at iteration 500 | Phase: adaptive_mastery",
+  "file_size_mb": 249.29015827178955,
+  "quality_score": 76800.67333019339
 }