Model save

Files changed (6) hide show

README.md CHANGED Viewed

@@ -33,7 +33,7 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
-- train_batch_size: 16
 - eval_batch_size: 8
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08

 The following hyperparameters were used during training:
 - learning_rate: 2e-05
+- train_batch_size: 100
 - eval_batch_size: 8
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08

all_results.json ADDED Viewed

+{
+    "epoch": 1.0,
+    "train_loss": 4.891794921875,
+    "train_runtime": 1355.1502,
+    "train_samples_per_second": 4.423,
+    "train_steps_per_second": 0.277
+}

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d13f58695578f83005a2af95b749ec34e9db21ffb9ad5f9dbced4621b10532e
 size 343875434

 version https://git-lfs.github.com/spec/v1
+oid sha256:e7e0f3be3d3196c2864f86f7dcc2f54fa5b548b1bd2ab6f07dd98ee54687d1b2
 size 343875434

train_results.json ADDED Viewed

+{
+    "epoch": 1.0,
+    "train_loss": 4.891794921875,
+    "train_runtime": 1355.1502,
+    "train_samples_per_second": 4.423,
+    "train_steps_per_second": 0.277
+}

trainer_state.json ADDED Viewed

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 3000,
+  "global_step": 375,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "step": 375,
+      "total_flos": 4.6531126963696435e+17,
+      "train_loss": 4.891794921875,
+      "train_runtime": 1355.1502,
+      "train_samples_per_second": 4.423,
+      "train_steps_per_second": 0.277
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 375,
+  "num_train_epochs": 1,
+  "save_steps": 3000,
+  "total_flos": 4.6531126963696435e+17,
+  "trial_name": null,
+  "trial_params": null
+}

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4054a98f7a29bff3d64b95d1fd586ecb89bff913f8d355a30e7fadd7d61bd3fb
 size 4472

 version https://git-lfs.github.com/spec/v1
+oid sha256:22590141c34c1c71972c41a35f0066b128b2b676917bdb1d1d2cc47f5fcd0edb
 size 4472