ASzecsenyi
/

VQLM

ASzecsenyi committed on Jan 12

Commit

05e1aea

verified ·

1 Parent(s): 4656152

Upload gpt_ts_d1/meta_000034.json with huggingface_hub

Files changed (1) hide show

gpt_ts_d1/meta_000034.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "step": 34,
-  "val_bpb": 3.227674483606736,
   "model_config": {
     "run": "gpt_ts_d1",
     "device_type": "",
@@ -36,7 +36,7 @@
     "save_every": -1,
     "push_checkpoints_to_hub": true,
     "use_profiler": true,
-    "memory_history_max_entries": 100000,
     "model_tag": "gpt_ts_d1",
     "n_layer": 1,
     "n_head": 1,
@@ -79,7 +79,7 @@
     "save_every": -1,
     "push_checkpoints_to_hub": true,
     "use_profiler": true,
-    "memory_history_max_entries": 100000,
     "model_tag": "gpt_ts_d1"
   },
   "device_batch_size": 32,
@@ -89,8 +89,8 @@
     "rg_idx": 19
   },
   "loop_state": {
-    "min_val_bpb": 3.227674483606736,
-    "smooth_train_loss": 2.2645697647921272,
-    "total_training_time": 6.928574800491333
   }
 }

 {
   "step": 34,
+  "val_bpb": 3.2278985236288658,
   "model_config": {
     "run": "gpt_ts_d1",
     "device_type": "",
     "save_every": -1,
     "push_checkpoints_to_hub": true,
     "use_profiler": true,
+    "memory_history_max_entries": 10000,
     "model_tag": "gpt_ts_d1",
     "n_layer": 1,
     "n_head": 1,
     "save_every": -1,
     "push_checkpoints_to_hub": true,
     "use_profiler": true,
+    "memory_history_max_entries": 10000,
     "model_tag": "gpt_ts_d1"
   },
   "device_batch_size": 32,
     "rg_idx": 19
   },
   "loop_state": {
+    "min_val_bpb": 3.2278985236288658,
+    "smooth_train_loss": 2.2646813129219647,
+    "total_training_time": 4.694071292877197
   }
 }