Epoch 10 - Training started: 2025-11-15 19:24:39

Files changed (4) hide show

README.md CHANGED Viewed

@@ -6,7 +6,7 @@ NNUE (Efficiently Updatable Neural Network) chess evaluation model
 - **Model type**: NNUE Chess Evaluation
 - **Architecture**: HalfKP feature representation
-- **Uploaded**: 2025-11-15 19:17:53
 ## Architecture
@@ -28,9 +28,9 @@ Output Layer: 32 → 1 (centipawn evaluation)
 ## Training Information
-- **Epoch**: 64
-- **Training Loss**: 2944877.7457
-- **Validation Loss**: 2821792.7308
 ## Usage
@@ -61,8 +61,8 @@ model_config = checkpoint['model_config']
 ## Training Configuration
 - **batch_size**: 256
-- **learning_rate**: 0.001
-- **num_epochs**: 100
 - **optimizer**: adam
 - **loss_function**: mse
 - **hidden_size**: 256

 - **Model type**: NNUE Chess Evaluation
 - **Architecture**: HalfKP feature representation
+- **Uploaded**: 2025-11-15 19:27:29
 ## Architecture
 ## Training Information
+- **Epoch**: 10
+- **Training Loss**: 3120906.5251
+- **Validation Loss**: 2923721.9199
 ## Usage
 ## Training Configuration
 - **batch_size**: 256
+- **learning_rate**: 0.003
+- **num_epochs**: 50
 - **optimizer**: adam
 - **loss_function**: mse
 - **hidden_size**: 256

checkpoint_epoch_10.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:95ecaed5ba60bcbcd9b034d120d31efc0b7fd58dcafec3361a5167195a4623a3
-size 126054539

 version https://git-lfs.github.com/spec/v1
+oid sha256:fe4f79c0dd385b53af3bb7d104ae650b21bee0e676802c5eb2fe8323c07a98f4
+size 126054987

config.json CHANGED Viewed

@@ -10,9 +10,11 @@
     "train_data_path": "data/train.jsonl",
     "val_data_path": "data/val.jsonl",
     "batch_size": 256,
-    "learning_rate": 0.001,
-    "num_epochs": 100,
     "weight_decay": 1e-05,
     "hidden_size": 256,
     "hidden2_size": 32,
     "hidden3_size": 32,
@@ -29,6 +31,8 @@
     "scheduler": null,
     "scheduler_step_size": 30,
     "scheduler_gamma": 0.1,
     "loss_function": "mse",
     "log_every_n_batches": 100,
     "verbose": true,
@@ -43,7 +47,6 @@
     "download_positions_per_game": 10,
     "download_num_workers": 4,
     "download_batch_size": 100,
-    "download_output_format": "jsonl",
     "download_rated_only": true,
     "download_output_dir": "data",
     "download_mode": "streaming",

     "train_data_path": "data/train.jsonl",
     "val_data_path": "data/val.jsonl",
     "batch_size": 256,
+    "learning_rate": 0.003,
+    "num_epochs": 50,
     "weight_decay": 1e-05,
+    "max_grad_norm": 1.0,
+    "early_stopping_patience": 10,
     "hidden_size": 256,
     "hidden2_size": 32,
     "hidden3_size": 32,
     "scheduler": null,
     "scheduler_step_size": 30,
     "scheduler_gamma": 0.1,
+    "warmup_epochs": 5,
+    "warmup_start_lr": 1e-05,
     "loss_function": "mse",
     "log_every_n_batches": 100,
     "verbose": true,
     "download_positions_per_game": 10,
     "download_num_workers": 4,
     "download_batch_size": 100,
     "download_rated_only": true,
     "download_output_dir": "data",
     "download_mode": "streaming",

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cb969826c34dd87a0854234b70e304044a2af0ba8e7725a4fa2cc4fdeef7671c
-size 42017825

 version https://git-lfs.github.com/spec/v1
+oid sha256:d729af8233d872c00bd05b36bd5ee3d9b11a38b3d6d9abbeac94c7e0855d2bba
+size 42017953