Training in progress, step 160
Browse files- config.json +2 -2
- model-00001-of-00014.safetensors +1 -1
- model-00002-of-00014.safetensors +1 -1
- model-00003-of-00014.safetensors +1 -1
- model-00004-of-00014.safetensors +1 -1
- model-00005-of-00014.safetensors +1 -1
- model-00006-of-00014.safetensors +1 -1
- model-00007-of-00014.safetensors +1 -1
- model-00008-of-00014.safetensors +1 -1
- model-00009-of-00014.safetensors +1 -1
- model-00010-of-00014.safetensors +1 -1
- model-00011-of-00014.safetensors +1 -1
- model-00012-of-00014.safetensors +1 -1
- model-00013-of-00014.safetensors +1 -1
- model-00014-of-00014.safetensors +1 -1
- trainer_log.jsonl +161 -323
- training_args.bin +1 -1
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "/
|
| 3 |
"architectures": [
|
| 4 |
"Qwen2ForCausalLM"
|
| 5 |
],
|
|
@@ -22,7 +22,7 @@
|
|
| 22 |
"sliding_window": null,
|
| 23 |
"tie_word_embeddings": false,
|
| 24 |
"torch_dtype": "bfloat16",
|
| 25 |
-
"transformers_version": "4.48.
|
| 26 |
"use_cache": false,
|
| 27 |
"use_sliding_window": false,
|
| 28 |
"vocab_size": 152064
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "saves/qwen2.5-32b/works_with_references/full/pretrain",
|
| 3 |
"architectures": [
|
| 4 |
"Qwen2ForCausalLM"
|
| 5 |
],
|
|
|
|
| 22 |
"sliding_window": null,
|
| 23 |
"tie_word_embeddings": false,
|
| 24 |
"torch_dtype": "bfloat16",
|
| 25 |
+
"transformers_version": "4.48.1",
|
| 26 |
"use_cache": false,
|
| 27 |
"use_sliding_window": false,
|
| 28 |
"vocab_size": 152064
|
model-00001-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4891730992
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:877072f5a264e787dc8592082e2fce6ea6e6e1c143552f92c6bf8c151ee5b013
|
| 3 |
size 4891730992
|
model-00002-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059352
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25f283172b327b0a445dc1693bc479bd5dd1aed7060b51ad4c07f064ea5df135
|
| 3 |
size 4876059352
|
model-00003-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059384
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41b29a951313e48eeb0f47b665e70ee8bedabefa26753a9c56ed2fce99e8e5ba
|
| 3 |
size 4876059384
|
model-00004-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:064cad34d8e82023deab3e79bce08571d3a247e67d5786591f50b8bd620e4732
|
| 3 |
size 4876059416
|
model-00005-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd24bd8575aec64aff272b25f913b3cc3157fa3bc01abd843f734cd5f1eb6bdc
|
| 3 |
size 4876059416
|
model-00006-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e16e4dc393145410b1ee9931c16ec7447ee7604982909717e0a9afecf706ec9
|
| 3 |
size 4876059416
|
model-00007-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d640e57b3eeabe4c58699e7447cdf19bc209735a28eacbcc847d5b4ecc41051f
|
| 3 |
size 4876059416
|
model-00008-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f89c9deb39bd117fb2f3d34a131c13c3125f85c6ddebeb10bc44e49c908afa37
|
| 3 |
size 4876059416
|
model-00009-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b550de694aaad02d9c9dc4fb59c626460e4c727178485e39159b9c4556e90e8f
|
| 3 |
size 4876059416
|
model-00010-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8d2189bba0cbb2c8e7d74d1c68dd59feab7efc046f87fa8d6bedd01a7485bb3
|
| 3 |
size 4876059416
|
model-00011-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ceb92299df4228cd515535bb1d235ecf9b7a3eed049276e9360eff7ac2cfb73
|
| 3 |
size 4876059416
|
model-00012-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:673bc76909801acd9a009e46f999baa8bde4a93a9dc3f9e9d4d8a4dcfaef500a
|
| 3 |
size 4876059416
|
model-00013-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7f6f5e398a5787483d79921c4aa5c06695feb6e86ab64feac0dc3d3d3218e53
|
| 3 |
size 4876059416
|
model-00014-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2123397800
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59bae169e109e7ef444903026f9bc3b6b47542d3fe11bdaad3afc5cc13e92bc6
|
| 3 |
size 2123397800
|
trainer_log.jsonl
CHANGED
|
@@ -1,323 +1,161 @@
|
|
| 1 |
-
{"current_steps": 1, "total_steps":
|
| 2 |
-
{"current_steps": 2, "total_steps":
|
| 3 |
-
{"current_steps": 3, "total_steps":
|
| 4 |
-
{"current_steps": 4, "total_steps":
|
| 5 |
-
{"current_steps": 5, "total_steps":
|
| 6 |
-
{"current_steps": 6, "total_steps":
|
| 7 |
-
{"current_steps": 7, "total_steps":
|
| 8 |
-
{"current_steps": 8, "total_steps":
|
| 9 |
-
{"current_steps": 9, "total_steps":
|
| 10 |
-
{"current_steps": 10, "total_steps":
|
| 11 |
-
{"current_steps": 11, "total_steps":
|
| 12 |
-
{"current_steps": 12, "total_steps":
|
| 13 |
-
{"current_steps": 13, "total_steps":
|
| 14 |
-
{"current_steps": 14, "total_steps":
|
| 15 |
-
{"current_steps": 15, "total_steps":
|
| 16 |
-
{"current_steps": 16, "total_steps":
|
| 17 |
-
{"current_steps": 17, "total_steps":
|
| 18 |
-
{"current_steps": 18, "total_steps":
|
| 19 |
-
{"current_steps": 19, "total_steps":
|
| 20 |
-
{"current_steps": 20, "total_steps":
|
| 21 |
-
{"current_steps": 21, "total_steps":
|
| 22 |
-
{"current_steps": 22, "total_steps":
|
| 23 |
-
{"current_steps": 23, "total_steps":
|
| 24 |
-
{"current_steps": 24, "total_steps":
|
| 25 |
-
{"current_steps": 25, "total_steps":
|
| 26 |
-
{"current_steps": 26, "total_steps":
|
| 27 |
-
{"current_steps": 27, "total_steps":
|
| 28 |
-
{"current_steps": 28, "total_steps":
|
| 29 |
-
{"current_steps": 29, "total_steps":
|
| 30 |
-
{"current_steps": 30, "total_steps":
|
| 31 |
-
{"current_steps": 31, "total_steps":
|
| 32 |
-
{"current_steps": 32, "total_steps":
|
| 33 |
-
{"current_steps": 33, "total_steps":
|
| 34 |
-
{"current_steps": 34, "total_steps":
|
| 35 |
-
{"current_steps": 35, "total_steps":
|
| 36 |
-
{"current_steps": 36, "total_steps":
|
| 37 |
-
{"current_steps": 37, "total_steps":
|
| 38 |
-
{"current_steps": 38, "total_steps":
|
| 39 |
-
{"current_steps": 39, "total_steps":
|
| 40 |
-
{"current_steps": 40, "total_steps":
|
| 41 |
-
{"current_steps": 41, "total_steps":
|
| 42 |
-
{"current_steps": 42, "total_steps":
|
| 43 |
-
{"current_steps": 43, "total_steps":
|
| 44 |
-
{"current_steps": 44, "total_steps":
|
| 45 |
-
{"current_steps": 45, "total_steps":
|
| 46 |
-
{"current_steps": 46, "total_steps":
|
| 47 |
-
{"current_steps": 47, "total_steps":
|
| 48 |
-
{"current_steps": 48, "total_steps":
|
| 49 |
-
{"current_steps": 49, "total_steps":
|
| 50 |
-
{"current_steps": 50, "total_steps":
|
| 51 |
-
{"current_steps": 51, "total_steps":
|
| 52 |
-
{"current_steps": 52, "total_steps":
|
| 53 |
-
{"current_steps": 53, "total_steps":
|
| 54 |
-
{"current_steps": 54, "total_steps":
|
| 55 |
-
{"current_steps": 55, "total_steps":
|
| 56 |
-
{"current_steps": 56, "total_steps":
|
| 57 |
-
{"current_steps": 57, "total_steps":
|
| 58 |
-
{"current_steps": 58, "total_steps":
|
| 59 |
-
{"current_steps": 59, "total_steps":
|
| 60 |
-
{"current_steps": 60, "total_steps":
|
| 61 |
-
{"current_steps": 61, "total_steps":
|
| 62 |
-
{"current_steps": 62, "total_steps":
|
| 63 |
-
{"current_steps": 63, "total_steps":
|
| 64 |
-
{"current_steps": 64, "total_steps":
|
| 65 |
-
{"current_steps": 65, "total_steps":
|
| 66 |
-
{"current_steps": 66, "total_steps":
|
| 67 |
-
{"current_steps": 67, "total_steps":
|
| 68 |
-
{"current_steps": 68, "total_steps":
|
| 69 |
-
{"current_steps": 69, "total_steps":
|
| 70 |
-
{"current_steps": 70, "total_steps":
|
| 71 |
-
{"current_steps": 71, "total_steps":
|
| 72 |
-
{"current_steps": 72, "total_steps":
|
| 73 |
-
{"current_steps": 73, "total_steps":
|
| 74 |
-
{"current_steps": 74, "total_steps":
|
| 75 |
-
{"current_steps": 75, "total_steps":
|
| 76 |
-
{"current_steps": 76, "total_steps":
|
| 77 |
-
{"current_steps": 77, "total_steps":
|
| 78 |
-
{"current_steps": 78, "total_steps":
|
| 79 |
-
{"current_steps": 79, "total_steps":
|
| 80 |
-
{"current_steps": 80, "total_steps":
|
| 81 |
-
{"current_steps": 81, "total_steps":
|
| 82 |
-
{"current_steps": 82, "total_steps":
|
| 83 |
-
{"current_steps": 83, "total_steps":
|
| 84 |
-
{"current_steps": 84, "total_steps":
|
| 85 |
-
{"current_steps": 85, "total_steps":
|
| 86 |
-
{"current_steps": 86, "total_steps":
|
| 87 |
-
{"current_steps": 87, "total_steps":
|
| 88 |
-
{"current_steps": 88, "total_steps":
|
| 89 |
-
{"current_steps": 89, "total_steps":
|
| 90 |
-
{"current_steps": 90, "total_steps":
|
| 91 |
-
{"current_steps": 91, "total_steps":
|
| 92 |
-
{"current_steps": 92, "total_steps":
|
| 93 |
-
{"current_steps": 93, "total_steps":
|
| 94 |
-
{"current_steps": 94, "total_steps":
|
| 95 |
-
{"current_steps": 95, "total_steps":
|
| 96 |
-
{"current_steps": 96, "total_steps":
|
| 97 |
-
{"current_steps": 97, "total_steps":
|
| 98 |
-
{"current_steps": 98, "total_steps":
|
| 99 |
-
{"current_steps": 99, "total_steps":
|
| 100 |
-
{"current_steps": 100, "total_steps":
|
| 101 |
-
{"current_steps": 101, "total_steps":
|
| 102 |
-
{"current_steps": 102, "total_steps":
|
| 103 |
-
{"current_steps": 103, "total_steps":
|
| 104 |
-
{"current_steps": 104, "total_steps":
|
| 105 |
-
{"current_steps": 105, "total_steps":
|
| 106 |
-
{"current_steps": 106, "total_steps":
|
| 107 |
-
{"current_steps": 107, "total_steps":
|
| 108 |
-
{"current_steps": 108, "total_steps":
|
| 109 |
-
{"current_steps": 109, "total_steps":
|
| 110 |
-
{"current_steps": 110, "total_steps":
|
| 111 |
-
{"current_steps": 111, "total_steps":
|
| 112 |
-
{"current_steps": 112, "total_steps":
|
| 113 |
-
{"current_steps": 113, "total_steps":
|
| 114 |
-
{"current_steps": 114, "total_steps":
|
| 115 |
-
{"current_steps": 115, "total_steps":
|
| 116 |
-
{"current_steps": 116, "total_steps":
|
| 117 |
-
{"current_steps": 117, "total_steps":
|
| 118 |
-
{"current_steps": 118, "total_steps":
|
| 119 |
-
{"current_steps": 119, "total_steps":
|
| 120 |
-
{"current_steps": 120, "total_steps":
|
| 121 |
-
{"current_steps": 121, "total_steps":
|
| 122 |
-
{"current_steps": 122, "total_steps":
|
| 123 |
-
{"current_steps": 123, "total_steps":
|
| 124 |
-
{"current_steps": 124, "total_steps":
|
| 125 |
-
{"current_steps": 125, "total_steps":
|
| 126 |
-
{"current_steps": 126, "total_steps":
|
| 127 |
-
{"current_steps": 127, "total_steps":
|
| 128 |
-
{"current_steps": 128, "total_steps":
|
| 129 |
-
{"current_steps": 129, "total_steps":
|
| 130 |
-
{"current_steps": 130, "total_steps":
|
| 131 |
-
{"current_steps": 131, "total_steps":
|
| 132 |
-
{"current_steps": 132, "total_steps":
|
| 133 |
-
{"current_steps": 133, "total_steps":
|
| 134 |
-
{"current_steps": 134, "total_steps":
|
| 135 |
-
{"current_steps": 135, "total_steps":
|
| 136 |
-
{"current_steps": 136, "total_steps":
|
| 137 |
-
{"current_steps": 137, "total_steps":
|
| 138 |
-
{"current_steps": 138, "total_steps":
|
| 139 |
-
{"current_steps": 139, "total_steps":
|
| 140 |
-
{"current_steps": 140, "total_steps":
|
| 141 |
-
{"current_steps": 141, "total_steps":
|
| 142 |
-
{"current_steps": 142, "total_steps":
|
| 143 |
-
{"current_steps": 143, "total_steps":
|
| 144 |
-
{"current_steps": 144, "total_steps":
|
| 145 |
-
{"current_steps": 145, "total_steps":
|
| 146 |
-
{"current_steps": 146, "total_steps":
|
| 147 |
-
{"current_steps": 147, "total_steps":
|
| 148 |
-
{"current_steps": 148, "total_steps":
|
| 149 |
-
{"current_steps": 149, "total_steps":
|
| 150 |
-
{"current_steps": 150, "total_steps":
|
| 151 |
-
{"current_steps": 151, "total_steps":
|
| 152 |
-
{"current_steps": 152, "total_steps":
|
| 153 |
-
{"current_steps": 153, "total_steps":
|
| 154 |
-
{"current_steps": 154, "total_steps":
|
| 155 |
-
{"current_steps": 155, "total_steps":
|
| 156 |
-
{"current_steps": 156, "total_steps":
|
| 157 |
-
{"current_steps": 157, "total_steps":
|
| 158 |
-
{"current_steps": 158, "total_steps":
|
| 159 |
-
{"current_steps": 159, "total_steps":
|
| 160 |
-
{"current_steps": 160, "total_steps":
|
| 161 |
-
{"current_steps":
|
| 162 |
-
{"current_steps": 162, "total_steps": 322, "loss": 1.9052, "lr": 1.7515463919937416e-05, "epoch": 1.0061776061776062, "percentage": 50.31, "elapsed_time": "9:29:38", "remaining_time": "9:22:36"}
|
| 163 |
-
{"current_steps": 163, "total_steps": 322, "loss": 0.8504, "lr": 1.735456917471084e-05, "epoch": 1.0123552123552124, "percentage": 50.62, "elapsed_time": "9:33:08", "remaining_time": "9:19:04"}
|
| 164 |
-
{"current_steps": 164, "total_steps": 322, "loss": 0.8583, "lr": 1.7193396194819332e-05, "epoch": 1.0185328185328186, "percentage": 50.93, "elapsed_time": "9:36:35", "remaining_time": "9:15:30"}
|
| 165 |
-
{"current_steps": 165, "total_steps": 322, "loss": 0.8515, "lr": 1.703196402574712e-05, "epoch": 1.0247104247104246, "percentage": 51.24, "elapsed_time": "9:40:06", "remaining_time": "9:11:59"}
|
| 166 |
-
{"current_steps": 166, "total_steps": 322, "loss": 0.8551, "lr": 1.6870291743606273e-05, "epoch": 1.0308880308880308, "percentage": 51.55, "elapsed_time": "9:43:36", "remaining_time": "9:08:26"}
|
| 167 |
-
{"current_steps": 167, "total_steps": 322, "loss": 0.8667, "lr": 1.6708398452882552e-05, "epoch": 1.037065637065637, "percentage": 51.86, "elapsed_time": "9:47:02", "remaining_time": "9:04:51"}
|
| 168 |
-
{"current_steps": 168, "total_steps": 322, "loss": 0.8531, "lr": 1.654630328417784e-05, "epoch": 1.0432432432432432, "percentage": 52.17, "elapsed_time": "9:50:27", "remaining_time": "9:01:14"}
|
| 169 |
-
{"current_steps": 169, "total_steps": 322, "loss": 0.8642, "lr": 1.638402539194953e-05, "epoch": 1.0494208494208495, "percentage": 52.48, "elapsed_time": "9:53:52", "remaining_time": "8:57:38"}
|
| 170 |
-
{"current_steps": 170, "total_steps": 322, "loss": 0.8718, "lr": 1.6221583952247098e-05, "epoch": 1.0555984555984557, "percentage": 52.8, "elapsed_time": "9:57:17", "remaining_time": "8:54:02"}
|
| 171 |
-
{"current_steps": 171, "total_steps": 322, "loss": 0.8623, "lr": 1.605899816044608e-05, "epoch": 1.0617760617760619, "percentage": 53.11, "elapsed_time": "10:00:41", "remaining_time": "8:50:26"}
|
| 172 |
-
{"current_steps": 172, "total_steps": 322, "loss": 0.8547, "lr": 1.589628722897982e-05, "epoch": 1.0679536679536679, "percentage": 53.42, "elapsed_time": "10:04:07", "remaining_time": "8:46:51"}
|
| 173 |
-
{"current_steps": 173, "total_steps": 322, "loss": 0.8752, "lr": 1.5733470385069142e-05, "epoch": 1.074131274131274, "percentage": 53.73, "elapsed_time": "10:07:36", "remaining_time": "8:43:18"}
|
| 174 |
-
{"current_steps": 174, "total_steps": 322, "loss": 0.8529, "lr": 1.5570566868450345e-05, "epoch": 1.0803088803088803, "percentage": 54.04, "elapsed_time": "10:11:04", "remaining_time": "8:39:45"}
|
| 175 |
-
{"current_steps": 175, "total_steps": 322, "loss": 0.8453, "lr": 1.540759592910167e-05, "epoch": 1.0864864864864865, "percentage": 54.35, "elapsed_time": "10:14:35", "remaining_time": "8:36:15"}
|
| 176 |
-
{"current_steps": 176, "total_steps": 322, "loss": 0.8521, "lr": 1.5244576824968541e-05, "epoch": 1.0926640926640927, "percentage": 54.66, "elapsed_time": "10:18:03", "remaining_time": "8:32:42"}
|
| 177 |
-
{"current_steps": 177, "total_steps": 322, "loss": 0.8573, "lr": 1.5081528819687952e-05, "epoch": 1.098841698841699, "percentage": 54.97, "elapsed_time": "10:21:29", "remaining_time": "8:29:08"}
|
| 178 |
-
{"current_steps": 178, "total_steps": 322, "loss": 0.8694, "lr": 1.4918471180312052e-05, "epoch": 1.1050193050193051, "percentage": 55.28, "elapsed_time": "10:24:54", "remaining_time": "8:25:32"}
|
| 179 |
-
{"current_steps": 179, "total_steps": 322, "loss": 0.8429, "lr": 1.4755423175031461e-05, "epoch": 1.111196911196911, "percentage": 55.59, "elapsed_time": "10:28:20", "remaining_time": "8:21:58"}
|
| 180 |
-
{"current_steps": 180, "total_steps": 322, "loss": 0.8474, "lr": 1.4592404070898337e-05, "epoch": 1.1173745173745173, "percentage": 55.9, "elapsed_time": "10:31:48", "remaining_time": "8:18:25"}
|
| 181 |
-
{"current_steps": 181, "total_steps": 322, "loss": 0.8643, "lr": 1.4429433131549661e-05, "epoch": 1.1235521235521235, "percentage": 56.21, "elapsed_time": "10:35:17", "remaining_time": "8:14:53"}
|
| 182 |
-
{"current_steps": 182, "total_steps": 322, "loss": 0.847, "lr": 1.4266529614930862e-05, "epoch": 1.1297297297297297, "percentage": 56.52, "elapsed_time": "10:38:46", "remaining_time": "8:11:22"}
|
| 183 |
-
{"current_steps": 183, "total_steps": 322, "loss": 0.8416, "lr": 1.4103712771020188e-05, "epoch": 1.135907335907336, "percentage": 56.83, "elapsed_time": "10:42:14", "remaining_time": "8:07:49"}
|
| 184 |
-
{"current_steps": 184, "total_steps": 322, "loss": 0.8808, "lr": 1.3941001839553921e-05, "epoch": 1.1420849420849422, "percentage": 57.14, "elapsed_time": "10:45:40", "remaining_time": "8:04:15"}
|
| 185 |
-
{"current_steps": 185, "total_steps": 322, "loss": 0.8422, "lr": 1.3778416047752906e-05, "epoch": 1.1482625482625481, "percentage": 57.45, "elapsed_time": "10:49:05", "remaining_time": "8:00:40"}
|
| 186 |
-
{"current_steps": 186, "total_steps": 322, "loss": 0.8537, "lr": 1.3615974608050472e-05, "epoch": 1.1544401544401544, "percentage": 57.76, "elapsed_time": "10:52:32", "remaining_time": "7:57:07"}
|
| 187 |
-
{"current_steps": 187, "total_steps": 322, "loss": 0.853, "lr": 1.3453696715822165e-05, "epoch": 1.1606177606177606, "percentage": 58.07, "elapsed_time": "10:55:57", "remaining_time": "7:53:33"}
|
| 188 |
-
{"current_steps": 188, "total_steps": 322, "loss": 0.8552, "lr": 1.329160154711745e-05, "epoch": 1.1667953667953668, "percentage": 58.39, "elapsed_time": "10:59:28", "remaining_time": "7:50:02"}
|
| 189 |
-
{"current_steps": 189, "total_steps": 322, "loss": 0.8346, "lr": 1.3129708256393725e-05, "epoch": 1.172972972972973, "percentage": 58.7, "elapsed_time": "11:02:57", "remaining_time": "7:46:31"}
|
| 190 |
-
{"current_steps": 190, "total_steps": 322, "loss": 0.8561, "lr": 1.2968035974252882e-05, "epoch": 1.1791505791505792, "percentage": 59.01, "elapsed_time": "11:06:25", "remaining_time": "7:42:59"}
|
| 191 |
-
{"current_steps": 191, "total_steps": 322, "loss": 0.8518, "lr": 1.2806603805180668e-05, "epoch": 1.1853281853281854, "percentage": 59.32, "elapsed_time": "11:09:51", "remaining_time": "7:39:26"}
|
| 192 |
-
{"current_steps": 192, "total_steps": 322, "loss": 0.8588, "lr": 1.2645430825289166e-05, "epoch": 1.1915057915057914, "percentage": 59.63, "elapsed_time": "11:13:20", "remaining_time": "7:35:54"}
|
| 193 |
-
{"current_steps": 193, "total_steps": 322, "loss": 0.839, "lr": 1.2484536080062583e-05, "epoch": 1.1976833976833976, "percentage": 59.94, "elapsed_time": "11:16:51", "remaining_time": "7:32:24"}
|
| 194 |
-
{"current_steps": 194, "total_steps": 322, "loss": 0.8534, "lr": 1.2323938582106725e-05, "epoch": 1.2038610038610038, "percentage": 60.25, "elapsed_time": "11:20:17", "remaining_time": "7:28:50"}
|
| 195 |
-
{"current_steps": 195, "total_steps": 322, "loss": 0.8586, "lr": 1.2163657308902256e-05, "epoch": 1.21003861003861, "percentage": 60.56, "elapsed_time": "11:23:41", "remaining_time": "7:25:16"}
|
| 196 |
-
{"current_steps": 196, "total_steps": 322, "loss": 0.8394, "lr": 1.2003711200562243e-05, "epoch": 1.2162162162162162, "percentage": 60.87, "elapsed_time": "11:27:06", "remaining_time": "7:21:42"}
|
| 197 |
-
{"current_steps": 197, "total_steps": 322, "loss": 0.8434, "lr": 1.1844119157593962e-05, "epoch": 1.2223938223938224, "percentage": 61.18, "elapsed_time": "11:30:31", "remaining_time": "7:18:09"}
|
| 198 |
-
{"current_steps": 198, "total_steps": 322, "loss": 0.8568, "lr": 1.1684900038665532e-05, "epoch": 1.2285714285714286, "percentage": 61.49, "elapsed_time": "11:34:00", "remaining_time": "7:14:37"}
|
| 199 |
-
{"current_steps": 199, "total_steps": 322, "loss": 0.8499, "lr": 1.1526072658377371e-05, "epoch": 1.2347490347490346, "percentage": 61.8, "elapsed_time": "11:37:29", "remaining_time": "7:11:06"}
|
| 200 |
-
{"current_steps": 200, "total_steps": 322, "loss": 0.8376, "lr": 1.1367655785038958e-05, "epoch": 1.2409266409266408, "percentage": 62.11, "elapsed_time": "11:41:00", "remaining_time": "7:07:36"}
|
| 201 |
-
{"current_steps": 201, "total_steps": 322, "loss": 0.8401, "lr": 1.120966813845098e-05, "epoch": 1.247104247104247, "percentage": 62.42, "elapsed_time": "11:51:53", "remaining_time": "7:08:33"}
|
| 202 |
-
{"current_steps": 202, "total_steps": 322, "loss": 0.8486, "lr": 1.1052128387693282e-05, "epoch": 1.2532818532818533, "percentage": 62.73, "elapsed_time": "11:55:22", "remaining_time": "7:04:58"}
|
| 203 |
-
{"current_steps": 203, "total_steps": 322, "loss": 0.8427, "lr": 1.0895055148918758e-05, "epoch": 1.2594594594594595, "percentage": 63.04, "elapsed_time": "11:58:50", "remaining_time": "7:01:23"}
|
| 204 |
-
{"current_steps": 204, "total_steps": 322, "loss": 0.84, "lr": 1.0738466983153535e-05, "epoch": 1.2656370656370657, "percentage": 63.35, "elapsed_time": "12:02:16", "remaining_time": "6:57:47"}
|
| 205 |
-
{"current_steps": 205, "total_steps": 322, "loss": 0.8361, "lr": 1.0582382394103629e-05, "epoch": 1.271814671814672, "percentage": 63.66, "elapsed_time": "12:05:42", "remaining_time": "6:54:10"}
|
| 206 |
-
{"current_steps": 206, "total_steps": 322, "loss": 0.851, "lr": 1.042681982596845e-05, "epoch": 1.2779922779922779, "percentage": 63.98, "elapsed_time": "12:09:07", "remaining_time": "6:50:34"}
|
| 207 |
-
{"current_steps": 207, "total_steps": 322, "loss": 0.8335, "lr": 1.0271797661261216e-05, "epoch": 1.284169884169884, "percentage": 64.29, "elapsed_time": "12:12:33", "remaining_time": "6:46:58"}
|
| 208 |
-
{"current_steps": 208, "total_steps": 322, "loss": 0.8413, "lr": 1.0117334218636795e-05, "epoch": 1.2903474903474903, "percentage": 64.6, "elapsed_time": "12:15:59", "remaining_time": "6:43:22"}
|
| 209 |
-
{"current_steps": 209, "total_steps": 322, "loss": 0.8418, "lr": 9.963447750726985e-06, "epoch": 1.2965250965250965, "percentage": 64.91, "elapsed_time": "12:19:25", "remaining_time": "6:39:47"}
|
| 210 |
-
{"current_steps": 210, "total_steps": 322, "loss": 0.8436, "lr": 9.810156441983667e-06, "epoch": 1.3027027027027027, "percentage": 65.22, "elapsed_time": "12:22:50", "remaining_time": "6:36:11"}
|
| 211 |
-
{"current_steps": 211, "total_steps": 322, "loss": 0.8382, "lr": 9.657478406529946e-06, "epoch": 1.308880308880309, "percentage": 65.53, "elapsed_time": "12:26:19", "remaining_time": "6:32:37"}
|
| 212 |
-
{"current_steps": 212, "total_steps": 322, "loss": 0.8519, "lr": 9.505431686019694e-06, "epoch": 1.3150579150579151, "percentage": 65.84, "elapsed_time": "12:29:47", "remaining_time": "6:29:02"}
|
| 213 |
-
{"current_steps": 213, "total_steps": 322, "loss": 0.8502, "lr": 9.354034247505557e-06, "epoch": 1.3212355212355211, "percentage": 66.15, "elapsed_time": "12:33:17", "remaining_time": "6:25:29"}
|
| 214 |
-
{"current_steps": 214, "total_steps": 322, "loss": 0.8172, "lr": 9.203303981315849e-06, "epoch": 1.3274131274131273, "percentage": 66.46, "elapsed_time": "12:36:46", "remaining_time": "6:21:55"}
|
| 215 |
-
{"current_steps": 215, "total_steps": 322, "loss": 0.8285, "lr": 9.053258698940485e-06, "epoch": 1.3335907335907335, "percentage": 66.77, "elapsed_time": "12:40:13", "remaining_time": "6:18:20"}
|
| 216 |
-
{"current_steps": 216, "total_steps": 322, "loss": 0.8411, "lr": 8.903916130926232e-06, "epoch": 1.3397683397683398, "percentage": 67.08, "elapsed_time": "12:43:42", "remaining_time": "6:14:47"}
|
| 217 |
-
{"current_steps": 217, "total_steps": 322, "loss": 0.8405, "lr": 8.755293924781524e-06, "epoch": 1.345945945945946, "percentage": 67.39, "elapsed_time": "12:47:14", "remaining_time": "6:11:14"}
|
| 218 |
-
{"current_steps": 218, "total_steps": 322, "loss": 0.8398, "lr": 8.607409642891091e-06, "epoch": 1.3521235521235522, "percentage": 67.7, "elapsed_time": "12:50:40", "remaining_time": "6:07:39"}
|
| 219 |
-
{"current_steps": 219, "total_steps": 322, "loss": 0.8214, "lr": 8.460280760440664e-06, "epoch": 1.3583011583011584, "percentage": 68.01, "elapsed_time": "12:54:09", "remaining_time": "6:04:06"}
|
| 220 |
-
{"current_steps": 220, "total_steps": 322, "loss": 0.8489, "lr": 8.313924663351927e-06, "epoch": 1.3644787644787644, "percentage": 68.32, "elapsed_time": "12:57:34", "remaining_time": "6:00:30"}
|
| 221 |
-
{"current_steps": 221, "total_steps": 322, "loss": 0.8297, "lr": 8.168358646228115e-06, "epoch": 1.3706563706563706, "percentage": 68.63, "elapsed_time": "13:01:00", "remaining_time": "5:56:55"}
|
| 222 |
-
{"current_steps": 222, "total_steps": 322, "loss": 0.8128, "lr": 8.023599910310287e-06, "epoch": 1.3768339768339768, "percentage": 68.94, "elapsed_time": "13:04:24", "remaining_time": "5:53:20"}
|
| 223 |
-
{"current_steps": 223, "total_steps": 322, "loss": 0.832, "lr": 7.879665561444752e-06, "epoch": 1.383011583011583, "percentage": 69.25, "elapsed_time": "13:07:52", "remaining_time": "5:49:46"}
|
| 224 |
-
{"current_steps": 224, "total_steps": 322, "loss": 0.8262, "lr": 7.73657260806164e-06, "epoch": 1.3891891891891892, "percentage": 69.57, "elapsed_time": "13:11:20", "remaining_time": "5:46:12"}
|
| 225 |
-
{"current_steps": 225, "total_steps": 322, "loss": 0.8375, "lr": 7.594337959165108e-06, "epoch": 1.3953667953667954, "percentage": 69.88, "elapsed_time": "13:14:45", "remaining_time": "5:42:37"}
|
| 226 |
-
{"current_steps": 226, "total_steps": 322, "loss": 0.8464, "lr": 7.452978422335191e-06, "epoch": 1.4015444015444016, "percentage": 70.19, "elapsed_time": "13:18:12", "remaining_time": "5:39:03"}
|
| 227 |
-
{"current_steps": 227, "total_steps": 322, "loss": 0.8301, "lr": 7.312510701741718e-06, "epoch": 1.4077220077220076, "percentage": 70.5, "elapsed_time": "13:21:36", "remaining_time": "5:35:28"}
|
| 228 |
-
{"current_steps": 228, "total_steps": 322, "loss": 0.8282, "lr": 7.172951396170404e-06, "epoch": 1.4138996138996138, "percentage": 70.81, "elapsed_time": "13:25:01", "remaining_time": "5:31:53"}
|
| 229 |
-
{"current_steps": 229, "total_steps": 322, "loss": 0.8406, "lr": 7.0343169970614e-06, "epoch": 1.42007722007722, "percentage": 71.12, "elapsed_time": "13:28:28", "remaining_time": "5:28:20"}
|
| 230 |
-
{"current_steps": 230, "total_steps": 322, "loss": 0.8262, "lr": 6.896623886560529e-06, "epoch": 1.4262548262548262, "percentage": 71.43, "elapsed_time": "13:31:55", "remaining_time": "5:24:46"}
|
| 231 |
-
{"current_steps": 231, "total_steps": 322, "loss": 0.8454, "lr": 6.759888335583458e-06, "epoch": 1.4324324324324325, "percentage": 71.74, "elapsed_time": "13:35:21", "remaining_time": "5:21:11"}
|
| 232 |
-
{"current_steps": 232, "total_steps": 322, "loss": 0.8284, "lr": 6.624126501892971e-06, "epoch": 1.4386100386100387, "percentage": 72.05, "elapsed_time": "13:38:45", "remaining_time": "5:17:37"}
|
| 233 |
-
{"current_steps": 233, "total_steps": 322, "loss": 0.8314, "lr": 6.489354428189684e-06, "epoch": 1.4447876447876449, "percentage": 72.36, "elapsed_time": "13:42:13", "remaining_time": "5:14:04"}
|
| 234 |
-
{"current_steps": 234, "total_steps": 322, "loss": 0.8281, "lr": 6.355588040216249e-06, "epoch": 1.4509652509652509, "percentage": 72.67, "elapsed_time": "13:45:39", "remaining_time": "5:10:30"}
|
| 235 |
-
{"current_steps": 235, "total_steps": 322, "loss": 0.8294, "lr": 6.222843144875494e-06, "epoch": 1.457142857142857, "percentage": 72.98, "elapsed_time": "13:49:04", "remaining_time": "5:06:56"}
|
| 236 |
-
{"current_steps": 236, "total_steps": 322, "loss": 0.8207, "lr": 6.091135428362536e-06, "epoch": 1.4633204633204633, "percentage": 73.29, "elapsed_time": "13:52:29", "remaining_time": "5:03:22"}
|
| 237 |
-
{"current_steps": 237, "total_steps": 322, "loss": 0.8243, "lr": 5.960480454311155e-06, "epoch": 1.4694980694980695, "percentage": 73.6, "elapsed_time": "13:55:57", "remaining_time": "4:59:49"}
|
| 238 |
-
{"current_steps": 238, "total_steps": 322, "loss": 0.817, "lr": 5.830893661954708e-06, "epoch": 1.4756756756756757, "percentage": 73.91, "elapsed_time": "13:59:22", "remaining_time": "4:56:15"}
|
| 239 |
-
{"current_steps": 239, "total_steps": 322, "loss": 0.8307, "lr": 5.702390364301677e-06, "epoch": 1.481853281853282, "percentage": 74.22, "elapsed_time": "14:02:47", "remaining_time": "4:52:41"}
|
| 240 |
-
{"current_steps": 240, "total_steps": 322, "loss": 0.8327, "lr": 5.574985746326181e-06, "epoch": 1.4880308880308881, "percentage": 74.53, "elapsed_time": "14:06:12", "remaining_time": "4:49:07"}
|
| 241 |
-
{"current_steps": 241, "total_steps": 322, "loss": 0.828, "lr": 5.448694863173572e-06, "epoch": 1.494208494208494, "percentage": 74.84, "elapsed_time": "14:09:40", "remaining_time": "4:45:34"}
|
| 242 |
-
{"current_steps": 242, "total_steps": 322, "loss": 0.8289, "lr": 5.3235326383814324e-06, "epoch": 1.5003861003861005, "percentage": 75.16, "elapsed_time": "14:13:08", "remaining_time": "4:42:01"}
|
| 243 |
-
{"current_steps": 243, "total_steps": 322, "loss": 0.8271, "lr": 5.19951386211607e-06, "epoch": 1.5065637065637065, "percentage": 75.47, "elapsed_time": "14:16:33", "remaining_time": "4:38:28"}
|
| 244 |
-
{"current_steps": 244, "total_steps": 322, "loss": 0.8246, "lr": 5.076653189424804e-06, "epoch": 1.5127413127413127, "percentage": 75.78, "elapsed_time": "14:19:57", "remaining_time": "4:34:54"}
|
| 245 |
-
{"current_steps": 245, "total_steps": 322, "loss": 0.8338, "lr": 4.954965138504187e-06, "epoch": 1.518918918918919, "percentage": 76.09, "elapsed_time": "14:23:25", "remaining_time": "4:31:21"}
|
| 246 |
-
{"current_steps": 246, "total_steps": 322, "loss": 0.8344, "lr": 4.834464088984452e-06, "epoch": 1.525096525096525, "percentage": 76.4, "elapsed_time": "14:26:52", "remaining_time": "4:27:49"}
|
| 247 |
-
{"current_steps": 247, "total_steps": 322, "loss": 0.8219, "lr": 4.7151642802302695e-06, "epoch": 1.5312741312741314, "percentage": 76.71, "elapsed_time": "14:30:19", "remaining_time": "4:24:16"}
|
| 248 |
-
{"current_steps": 248, "total_steps": 322, "loss": 0.8073, "lr": 4.597079809658136e-06, "epoch": 1.5374517374517374, "percentage": 77.02, "elapsed_time": "14:33:44", "remaining_time": "4:20:42"}
|
| 249 |
-
{"current_steps": 249, "total_steps": 322, "loss": 0.8256, "lr": 4.480224631070493e-06, "epoch": 1.5436293436293438, "percentage": 77.33, "elapsed_time": "14:37:09", "remaining_time": "4:17:09"}
|
| 250 |
-
{"current_steps": 250, "total_steps": 322, "loss": 0.8119, "lr": 4.364612553006847e-06, "epoch": 1.5498069498069498, "percentage": 77.64, "elapsed_time": "14:40:35", "remaining_time": "4:13:36"}
|
| 251 |
-
{"current_steps": 251, "total_steps": 322, "loss": 0.8455, "lr": 4.250257237112023e-06, "epoch": 1.555984555984556, "percentage": 77.95, "elapsed_time": "14:44:03", "remaining_time": "4:10:04"}
|
| 252 |
-
{"current_steps": 252, "total_steps": 322, "loss": 0.8231, "lr": 4.137172196521823e-06, "epoch": 1.5621621621621622, "percentage": 78.26, "elapsed_time": "14:47:31", "remaining_time": "4:06:31"}
|
| 253 |
-
{"current_steps": 253, "total_steps": 322, "loss": 0.8271, "lr": 4.0253707942661845e-06, "epoch": 1.5683397683397682, "percentage": 78.57, "elapsed_time": "14:51:01", "remaining_time": "4:03:00"}
|
| 254 |
-
{"current_steps": 254, "total_steps": 322, "loss": 0.8276, "lr": 3.914866241690115e-06, "epoch": 1.5745173745173746, "percentage": 78.88, "elapsed_time": "14:54:28", "remaining_time": "3:59:28"}
|
| 255 |
-
{"current_steps": 255, "total_steps": 322, "loss": 0.8394, "lr": 3.8056715968925094e-06, "epoch": 1.5806949806949806, "percentage": 79.19, "elapsed_time": "14:57:55", "remaining_time": "3:55:55"}
|
| 256 |
-
{"current_steps": 256, "total_steps": 322, "loss": 0.8383, "lr": 3.697799763183127e-06, "epoch": 1.586872586872587, "percentage": 79.5, "elapsed_time": "15:01:22", "remaining_time": "3:52:23"}
|
| 257 |
-
{"current_steps": 257, "total_steps": 322, "loss": 0.8372, "lr": 3.5912634875578267e-06, "epoch": 1.593050193050193, "percentage": 79.81, "elapsed_time": "15:04:52", "remaining_time": "3:48:51"}
|
| 258 |
-
{"current_steps": 258, "total_steps": 322, "loss": 0.8194, "lr": 3.4860753591922604e-06, "epoch": 1.5992277992277992, "percentage": 80.12, "elapsed_time": "15:08:17", "remaining_time": "3:45:18"}
|
| 259 |
-
{"current_steps": 259, "total_steps": 322, "loss": 0.8526, "lr": 3.3822478079542774e-06, "epoch": 1.6054054054054054, "percentage": 80.43, "elapsed_time": "15:11:42", "remaining_time": "3:41:46"}
|
| 260 |
-
{"current_steps": 260, "total_steps": 322, "loss": 0.8137, "lr": 3.2797931029350614e-06, "epoch": 1.6115830115830114, "percentage": 80.75, "elapsed_time": "15:15:09", "remaining_time": "3:38:13"}
|
| 261 |
-
{"current_steps": 261, "total_steps": 322, "loss": 0.8174, "lr": 3.178723350999362e-06, "epoch": 1.6177606177606179, "percentage": 81.06, "elapsed_time": "15:18:40", "remaining_time": "3:34:42"}
|
| 262 |
-
{"current_steps": 262, "total_steps": 322, "loss": 0.8307, "lr": 3.0790504953548115e-06, "epoch": 1.6239382239382238, "percentage": 81.37, "elapsed_time": "15:22:07", "remaining_time": "3:31:10"}
|
| 263 |
-
{"current_steps": 263, "total_steps": 322, "loss": 0.8281, "lr": 2.980786314140658e-06, "epoch": 1.6301158301158303, "percentage": 81.68, "elapsed_time": "15:25:32", "remaining_time": "3:27:37"}
|
| 264 |
-
{"current_steps": 264, "total_steps": 322, "loss": 0.8431, "lr": 2.8839424190359386e-06, "epoch": 1.6362934362934363, "percentage": 81.99, "elapsed_time": "15:28:59", "remaining_time": "3:24:05"}
|
| 265 |
-
{"current_steps": 265, "total_steps": 322, "loss": 0.8268, "lr": 2.788530253887371e-06, "epoch": 1.6424710424710425, "percentage": 82.3, "elapsed_time": "15:32:24", "remaining_time": "3:20:33"}
|
| 266 |
-
{"current_steps": 266, "total_steps": 322, "loss": 0.8086, "lr": 2.6945610933570297e-06, "epoch": 1.6486486486486487, "percentage": 82.61, "elapsed_time": "15:35:55", "remaining_time": "3:17:02"}
|
| 267 |
-
{"current_steps": 267, "total_steps": 322, "loss": 0.8345, "lr": 2.6020460415900786e-06, "epoch": 1.6548262548262547, "percentage": 82.92, "elapsed_time": "15:39:19", "remaining_time": "3:13:29"}
|
| 268 |
-
{"current_steps": 268, "total_steps": 322, "loss": 0.829, "lr": 2.510996030902581e-06, "epoch": 1.661003861003861, "percentage": 83.23, "elapsed_time": "15:42:47", "remaining_time": "3:09:57"}
|
| 269 |
-
{"current_steps": 269, "total_steps": 322, "loss": 0.8322, "lr": 2.4214218204896776e-06, "epoch": 1.667181467181467, "percentage": 83.54, "elapsed_time": "15:46:14", "remaining_time": "3:06:26"}
|
| 270 |
-
{"current_steps": 270, "total_steps": 322, "loss": 0.8307, "lr": 2.333333995154178e-06, "epoch": 1.6733590733590735, "percentage": 83.85, "elapsed_time": "15:49:39", "remaining_time": "3:02:53"}
|
| 271 |
-
{"current_steps": 271, "total_steps": 322, "loss": 0.8241, "lr": 2.2467429640557903e-06, "epoch": 1.6795366795366795, "percentage": 84.16, "elapsed_time": "15:53:04", "remaining_time": "2:59:21"}
|
| 272 |
-
{"current_steps": 272, "total_steps": 322, "loss": 0.8308, "lr": 2.161658959481065e-06, "epoch": 1.6857142857142857, "percentage": 84.47, "elapsed_time": "15:56:31", "remaining_time": "2:55:49"}
|
| 273 |
-
{"current_steps": 273, "total_steps": 322, "loss": 0.8202, "lr": 2.0780920356343015e-06, "epoch": 1.691891891891892, "percentage": 84.78, "elapsed_time": "15:59:56", "remaining_time": "2:52:17"}
|
| 274 |
-
{"current_steps": 274, "total_steps": 322, "loss": 0.8226, "lr": 1.9960520674494354e-06, "epoch": 1.698069498069498, "percentage": 85.09, "elapsed_time": "16:03:24", "remaining_time": "2:48:46"}
|
| 275 |
-
{"current_steps": 275, "total_steps": 322, "loss": 0.8259, "lr": 1.915548749423157e-06, "epoch": 1.7042471042471043, "percentage": 85.4, "elapsed_time": "16:06:49", "remaining_time": "2:45:14"}
|
| 276 |
-
{"current_steps": 276, "total_steps": 322, "loss": 0.842, "lr": 1.8365915944693102e-06, "epoch": 1.7104247104247103, "percentage": 85.71, "elapsed_time": "16:10:16", "remaining_time": "2:41:42"}
|
| 277 |
-
{"current_steps": 277, "total_steps": 322, "loss": 0.8068, "lr": 1.759189932794798e-06, "epoch": 1.7166023166023165, "percentage": 86.02, "elapsed_time": "16:13:42", "remaining_time": "2:38:11"}
|
| 278 |
-
{"current_steps": 278, "total_steps": 322, "loss": 0.8414, "lr": 1.6833529107970236e-06, "epoch": 1.7227799227799228, "percentage": 86.34, "elapsed_time": "16:17:08", "remaining_time": "2:34:39"}
|
| 279 |
-
{"current_steps": 279, "total_steps": 322, "loss": 0.8305, "lr": 1.6090894899831017e-06, "epoch": 1.728957528957529, "percentage": 86.65, "elapsed_time": "16:20:39", "remaining_time": "2:31:08"}
|
| 280 |
-
{"current_steps": 280, "total_steps": 322, "loss": 0.8345, "lr": 1.5364084459108874e-06, "epoch": 1.7351351351351352, "percentage": 86.96, "elapsed_time": "16:24:06", "remaining_time": "2:27:36"}
|
| 281 |
-
{"current_steps": 281, "total_steps": 322, "loss": 0.813, "lr": 1.4653183671519749e-06, "epoch": 1.7413127413127412, "percentage": 87.27, "elapsed_time": "16:27:34", "remaining_time": "2:24:05"}
|
| 282 |
-
{"current_steps": 282, "total_steps": 322, "loss": 0.8154, "lr": 1.395827654276825e-06, "epoch": 1.7474903474903476, "percentage": 87.58, "elapsed_time": "16:31:01", "remaining_time": "2:20:34"}
|
| 283 |
-
{"current_steps": 283, "total_steps": 322, "loss": 0.8256, "lr": 1.3279445188620614e-06, "epoch": 1.7536679536679536, "percentage": 87.89, "elapsed_time": "16:34:27", "remaining_time": "2:17:02"}
|
| 284 |
-
{"current_steps": 284, "total_steps": 322, "loss": 0.8265, "lr": 1.26167698252015e-06, "epoch": 1.7598455598455598, "percentage": 88.2, "elapsed_time": "16:37:56", "remaining_time": "2:13:31"}
|
| 285 |
-
{"current_steps": 285, "total_steps": 322, "loss": 0.834, "lr": 1.1970328759514893e-06, "epoch": 1.766023166023166, "percentage": 88.51, "elapsed_time": "16:41:25", "remaining_time": "2:10:00"}
|
| 286 |
-
{"current_steps": 286, "total_steps": 322, "loss": 0.8226, "lr": 1.1340198380190725e-06, "epoch": 1.7722007722007722, "percentage": 88.82, "elapsed_time": "16:44:55", "remaining_time": "2:06:29"}
|
| 287 |
-
{"current_steps": 287, "total_steps": 322, "loss": 0.8255, "lr": 1.0726453148458115e-06, "epoch": 1.7783783783783784, "percentage": 89.13, "elapsed_time": "16:48:21", "remaining_time": "2:02:58"}
|
| 288 |
-
{"current_steps": 288, "total_steps": 322, "loss": 0.8183, "lr": 1.0129165589346644e-06, "epoch": 1.7845559845559844, "percentage": 89.44, "elapsed_time": "16:51:48", "remaining_time": "1:59:26"}
|
| 289 |
-
{"current_steps": 289, "total_steps": 322, "loss": 0.8041, "lr": 9.548406283115969e-07, "epoch": 1.7907335907335908, "percentage": 89.75, "elapsed_time": "16:55:13", "remaining_time": "1:55:55"}
|
| 290 |
-
{"current_steps": 290, "total_steps": 322, "loss": 0.8229, "lr": 8.984243856915763e-07, "epoch": 1.7969111969111968, "percentage": 90.06, "elapsed_time": "16:58:42", "remaining_time": "1:52:24"}
|
| 291 |
-
{"current_steps": 291, "total_steps": 322, "loss": 0.8121, "lr": 8.436744976675875e-07, "epoch": 1.803088803088803, "percentage": 90.37, "elapsed_time": "17:02:10", "remaining_time": "1:48:53"}
|
| 292 |
-
{"current_steps": 292, "total_steps": 322, "loss": 0.794, "lr": 7.905974339228861e-07, "epoch": 1.8092664092664092, "percentage": 90.68, "elapsed_time": "17:05:38", "remaining_time": "1:45:22"}
|
| 293 |
-
{"current_steps": 293, "total_steps": 322, "loss": 0.8121, "lr": 7.391994664664625e-07, "epoch": 1.8154440154440155, "percentage": 90.99, "elapsed_time": "17:09:09", "remaining_time": "1:41:51"}
|
| 294 |
-
{"current_steps": 294, "total_steps": 322, "loss": 0.8169, "lr": 6.894866688919133e-07, "epoch": 1.8216216216216217, "percentage": 91.3, "elapsed_time": "17:12:36", "remaining_time": "1:38:20"}
|
| 295 |
-
{"current_steps": 295, "total_steps": 322, "loss": 0.8202, "lr": 6.41464915659723e-07, "epoch": 1.8277992277992277, "percentage": 91.61, "elapsed_time": "17:15:59", "remaining_time": "1:34:49"}
|
| 296 |
-
{"current_steps": 296, "total_steps": 322, "loss": 0.809, "lr": 5.951398814030951e-07, "epoch": 1.833976833976834, "percentage": 91.93, "elapsed_time": "17:19:24", "remaining_time": "1:31:17"}
|
| 297 |
-
{"current_steps": 297, "total_steps": 322, "loss": 0.829, "lr": 5.505170402573911e-07, "epoch": 1.84015444015444, "percentage": 92.24, "elapsed_time": "17:22:52", "remaining_time": "1:27:47"}
|
| 298 |
-
{"current_steps": 298, "total_steps": 322, "loss": 0.8155, "lr": 5.076016652132703e-07, "epoch": 1.8463320463320463, "percentage": 92.55, "elapsed_time": "17:26:21", "remaining_time": "1:24:16"}
|
| 299 |
-
{"current_steps": 299, "total_steps": 322, "loss": 0.8328, "lr": 4.6639882749357264e-07, "epoch": 1.8525096525096525, "percentage": 92.86, "elapsed_time": "17:29:49", "remaining_time": "1:20:45"}
|
| 300 |
-
{"current_steps": 300, "total_steps": 322, "loss": 0.8211, "lr": 4.2691339595408995e-07, "epoch": 1.8586872586872587, "percentage": 93.17, "elapsed_time": "17:33:17", "remaining_time": "1:17:14"}
|
| 301 |
-
{"current_steps": 301, "total_steps": 322, "loss": 0.8136, "lr": 3.891500365081996e-07, "epoch": 1.864864864864865, "percentage": 93.48, "elapsed_time": "17:44:10", "remaining_time": "1:14:14"}
|
| 302 |
-
{"current_steps": 302, "total_steps": 322, "loss": 0.8128, "lr": 3.53113211575512e-07, "epoch": 1.871042471042471, "percentage": 93.79, "elapsed_time": "17:47:40", "remaining_time": "1:10:42"}
|
| 303 |
-
{"current_steps": 303, "total_steps": 322, "loss": 0.8199, "lr": 3.188071795545561e-07, "epoch": 1.8772200772200773, "percentage": 94.1, "elapsed_time": "17:51:09", "remaining_time": "1:07:10"}
|
| 304 |
-
{"current_steps": 304, "total_steps": 322, "loss": 0.8232, "lr": 2.8623599431957137e-07, "epoch": 1.8833976833976833, "percentage": 94.41, "elapsed_time": "17:54:36", "remaining_time": "1:03:37"}
|
| 305 |
-
{"current_steps": 305, "total_steps": 322, "loss": 0.8266, "lr": 2.5540350474147324e-07, "epoch": 1.8895752895752895, "percentage": 94.72, "elapsed_time": "17:58:05", "remaining_time": "1:00:05"}
|
| 306 |
-
{"current_steps": 306, "total_steps": 322, "loss": 0.8275, "lr": 2.2631335423303312e-07, "epoch": 1.8957528957528957, "percentage": 95.03, "elapsed_time": "18:01:36", "remaining_time": "0:56:33"}
|
| 307 |
-
{"current_steps": 307, "total_steps": 322, "loss": 0.8141, "lr": 1.989689803183531e-07, "epoch": 1.901930501930502, "percentage": 95.34, "elapsed_time": "18:05:05", "remaining_time": "0:53:01"}
|
| 308 |
-
{"current_steps": 308, "total_steps": 322, "loss": 0.839, "lr": 1.7337361422664567e-07, "epoch": 1.9081081081081082, "percentage": 95.65, "elapsed_time": "18:08:33", "remaining_time": "0:49:28"}
|
| 309 |
-
{"current_steps": 309, "total_steps": 322, "loss": 0.8289, "lr": 1.4953028051042428e-07, "epoch": 1.9142857142857141, "percentage": 95.96, "elapsed_time": "18:12:00", "remaining_time": "0:45:56"}
|
| 310 |
-
{"current_steps": 310, "total_steps": 322, "loss": 0.8209, "lr": 1.2744179668808588e-07, "epoch": 1.9204633204633206, "percentage": 96.27, "elapsed_time": "18:15:38", "remaining_time": "0:42:24"}
|
| 311 |
-
{"current_steps": 311, "total_steps": 322, "loss": 0.8281, "lr": 1.0711077291097548e-07, "epoch": 1.9266409266409266, "percentage": 96.58, "elapsed_time": "18:19:04", "remaining_time": "0:38:52"}
|
| 312 |
-
{"current_steps": 312, "total_steps": 322, "loss": 0.8144, "lr": 8.853961165494472e-08, "epoch": 1.9328185328185328, "percentage": 96.89, "elapsed_time": "18:22:35", "remaining_time": "0:35:20"}
|
| 313 |
-
{"current_steps": 313, "total_steps": 322, "loss": 0.8205, "lr": 7.173050743646382e-08, "epoch": 1.938996138996139, "percentage": 97.2, "elapsed_time": "18:26:00", "remaining_time": "0:31:48"}
|
| 314 |
-
{"current_steps": 314, "total_steps": 322, "loss": 0.8063, "lr": 5.668544655329067e-08, "epoch": 1.9451737451737452, "percentage": 97.52, "elapsed_time": "18:29:24", "remaining_time": "0:28:15"}
|
| 315 |
-
{"current_steps": 315, "total_steps": 322, "loss": 0.8186, "lr": 4.3406206849763707e-08, "epoch": 1.9513513513513514, "percentage": 97.83, "elapsed_time": "18:32:50", "remaining_time": "0:24:43"}
|
| 316 |
-
{"current_steps": 316, "total_steps": 322, "loss": 0.8371, "lr": 3.189435750671321e-08, "epoch": 1.9575289575289574, "percentage": 98.14, "elapsed_time": "18:36:16", "remaining_time": "0:21:11"}
|
| 317 |
-
{"current_steps": 317, "total_steps": 322, "loss": 0.8223, "lr": 2.2151258856032974e-08, "epoch": 1.9637065637065638, "percentage": 98.45, "elapsed_time": "18:39:44", "remaining_time": "0:17:39"}
|
| 318 |
-
{"current_steps": 318, "total_steps": 322, "loss": 0.8275, "lr": 1.417806221993223e-08, "epoch": 1.9698841698841698, "percentage": 98.76, "elapsed_time": "18:43:12", "remaining_time": "0:14:07"}
|
| 319 |
-
{"current_steps": 319, "total_steps": 322, "loss": 0.8302, "lr": 7.975709774892815e-09, "epoch": 1.976061776061776, "percentage": 99.07, "elapsed_time": "18:46:43", "remaining_time": "0:10:35"}
|
| 320 |
-
{"current_steps": 320, "total_steps": 322, "loss": 0.8215, "lr": 3.544934440323222e-09, "epoch": 1.9822393822393822, "percentage": 99.38, "elapsed_time": "18:50:10", "remaining_time": "0:07:03"}
|
| 321 |
-
{"current_steps": 321, "total_steps": 322, "loss": 0.827, "lr": 8.862597919612192e-10, "epoch": 1.9884169884169884, "percentage": 99.69, "elapsed_time": "18:53:40", "remaining_time": "0:03:31"}
|
| 322 |
-
{"current_steps": 322, "total_steps": 322, "loss": 0.8302, "lr": 0.0, "epoch": 1.9945945945945946, "percentage": 100.0, "elapsed_time": "18:57:08", "remaining_time": "0:00:00"}
|
| 323 |
-
{"current_steps": 322, "total_steps": 322, "epoch": 1.9945945945945946, "percentage": 100.0, "elapsed_time": "19:04:26", "remaining_time": "0:00:00"}
|
|
|
|
| 1 |
+
{"current_steps": 1, "total_steps": 160, "loss": 1.097, "lr": 1.25e-06, "epoch": 0.01237432327919567, "percentage": 0.62, "elapsed_time": "0:07:00", "remaining_time": "18:33:53"}
|
| 2 |
+
{"current_steps": 2, "total_steps": 160, "loss": 1.0897, "lr": 2.5e-06, "epoch": 0.02474864655839134, "percentage": 1.25, "elapsed_time": "0:13:44", "remaining_time": "18:05:33"}
|
| 3 |
+
{"current_steps": 3, "total_steps": 160, "loss": 1.1065, "lr": 3.7500000000000005e-06, "epoch": 0.037122969837587005, "percentage": 1.88, "elapsed_time": "0:20:16", "remaining_time": "17:41:13"}
|
| 4 |
+
{"current_steps": 4, "total_steps": 160, "loss": 1.1059, "lr": 5e-06, "epoch": 0.04949729311678268, "percentage": 2.5, "elapsed_time": "0:26:50", "remaining_time": "17:26:38"}
|
| 5 |
+
{"current_steps": 5, "total_steps": 160, "loss": 1.1144, "lr": 6.25e-06, "epoch": 0.061871616395978345, "percentage": 3.12, "elapsed_time": "0:33:22", "remaining_time": "17:14:48"}
|
| 6 |
+
{"current_steps": 6, "total_steps": 160, "loss": 1.1001, "lr": 7.500000000000001e-06, "epoch": 0.07424593967517401, "percentage": 3.75, "elapsed_time": "0:39:57", "remaining_time": "17:05:24"}
|
| 7 |
+
{"current_steps": 7, "total_steps": 160, "loss": 1.0976, "lr": 8.750000000000001e-06, "epoch": 0.08662026295436968, "percentage": 4.38, "elapsed_time": "0:46:28", "remaining_time": "16:55:53"}
|
| 8 |
+
{"current_steps": 8, "total_steps": 160, "loss": 1.1055, "lr": 1e-05, "epoch": 0.09899458623356536, "percentage": 5.0, "elapsed_time": "0:53:02", "remaining_time": "16:47:41"}
|
| 9 |
+
{"current_steps": 9, "total_steps": 160, "loss": 1.1013, "lr": 1.125e-05, "epoch": 0.11136890951276102, "percentage": 5.62, "elapsed_time": "0:59:38", "remaining_time": "16:40:40"}
|
| 10 |
+
{"current_steps": 10, "total_steps": 160, "loss": 1.0971, "lr": 1.25e-05, "epoch": 0.12374323279195669, "percentage": 6.25, "elapsed_time": "1:06:12", "remaining_time": "16:33:08"}
|
| 11 |
+
{"current_steps": 11, "total_steps": 160, "loss": 1.0972, "lr": 1.375e-05, "epoch": 0.13611755607115236, "percentage": 6.88, "elapsed_time": "1:12:49", "remaining_time": "16:26:22"}
|
| 12 |
+
{"current_steps": 12, "total_steps": 160, "loss": 1.0934, "lr": 1.5000000000000002e-05, "epoch": 0.14849187935034802, "percentage": 7.5, "elapsed_time": "1:19:22", "remaining_time": "16:18:53"}
|
| 13 |
+
{"current_steps": 13, "total_steps": 160, "loss": 1.1053, "lr": 1.6250000000000002e-05, "epoch": 0.1608662026295437, "percentage": 8.12, "elapsed_time": "1:25:54", "remaining_time": "16:11:29"}
|
| 14 |
+
{"current_steps": 14, "total_steps": 160, "loss": 1.1018, "lr": 1.7500000000000002e-05, "epoch": 0.17324052590873937, "percentage": 8.75, "elapsed_time": "1:32:30", "remaining_time": "16:04:40"}
|
| 15 |
+
{"current_steps": 15, "total_steps": 160, "loss": 1.0898, "lr": 1.8750000000000002e-05, "epoch": 0.18561484918793503, "percentage": 9.38, "elapsed_time": "1:39:03", "remaining_time": "15:57:30"}
|
| 16 |
+
{"current_steps": 16, "total_steps": 160, "loss": 1.0954, "lr": 2e-05, "epoch": 0.19798917246713071, "percentage": 10.0, "elapsed_time": "1:45:34", "remaining_time": "15:50:11"}
|
| 17 |
+
{"current_steps": 17, "total_steps": 160, "loss": 1.0887, "lr": 1.999762027079909e-05, "epoch": 0.21036349574632637, "percentage": 10.62, "elapsed_time": "1:52:08", "remaining_time": "15:43:14"}
|
| 18 |
+
{"current_steps": 18, "total_steps": 160, "loss": 1.0951, "lr": 1.999048221581858e-05, "epoch": 0.22273781902552203, "percentage": 11.25, "elapsed_time": "1:58:38", "remaining_time": "15:35:55"}
|
| 19 |
+
{"current_steps": 19, "total_steps": 160, "loss": 1.0872, "lr": 1.9978589232386036e-05, "epoch": 0.23511214230471772, "percentage": 11.88, "elapsed_time": "2:05:08", "remaining_time": "15:28:41"}
|
| 20 |
+
{"current_steps": 20, "total_steps": 160, "loss": 1.0849, "lr": 1.9961946980917457e-05, "epoch": 0.24748646558391338, "percentage": 12.5, "elapsed_time": "2:11:43", "remaining_time": "15:22:04"}
|
| 21 |
+
{"current_steps": 21, "total_steps": 160, "loss": 1.091, "lr": 1.9940563382223196e-05, "epoch": 0.25986078886310904, "percentage": 13.12, "elapsed_time": "2:18:16", "remaining_time": "15:15:17"}
|
| 22 |
+
{"current_steps": 22, "total_steps": 160, "loss": 1.0975, "lr": 1.9914448613738107e-05, "epoch": 0.2722351121423047, "percentage": 13.75, "elapsed_time": "2:24:46", "remaining_time": "15:08:08"}
|
| 23 |
+
{"current_steps": 23, "total_steps": 160, "loss": 1.0882, "lr": 1.988361510467761e-05, "epoch": 0.2846094354215004, "percentage": 14.37, "elapsed_time": "2:31:19", "remaining_time": "15:01:24"}
|
| 24 |
+
{"current_steps": 24, "total_steps": 160, "loss": 1.0874, "lr": 1.9848077530122083e-05, "epoch": 0.29698375870069604, "percentage": 15.0, "elapsed_time": "2:37:55", "remaining_time": "14:54:54"}
|
| 25 |
+
{"current_steps": 25, "total_steps": 160, "loss": 1.0813, "lr": 1.9807852804032306e-05, "epoch": 0.30935808197989173, "percentage": 15.62, "elapsed_time": "2:44:31", "remaining_time": "14:48:26"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 160, "loss": 1.0889, "lr": 1.9762960071199334e-05, "epoch": 0.3217324052590874, "percentage": 16.25, "elapsed_time": "2:51:05", "remaining_time": "14:41:48"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 160, "loss": 1.0728, "lr": 1.9713420698132614e-05, "epoch": 0.33410672853828305, "percentage": 16.88, "elapsed_time": "2:57:37", "remaining_time": "14:34:56"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 160, "loss": 1.0798, "lr": 1.9659258262890683e-05, "epoch": 0.34648105181747874, "percentage": 17.5, "elapsed_time": "3:04:09", "remaining_time": "14:28:11"}
|
| 29 |
+
{"current_steps": 29, "total_steps": 160, "loss": 1.0805, "lr": 1.960049854385929e-05, "epoch": 0.3588553750966744, "percentage": 18.12, "elapsed_time": "3:10:45", "remaining_time": "14:21:40"}
|
| 30 |
+
{"current_steps": 30, "total_steps": 160, "loss": 1.0761, "lr": 1.953716950748227e-05, "epoch": 0.37122969837587005, "percentage": 18.75, "elapsed_time": "3:17:21", "remaining_time": "14:15:12"}
|
| 31 |
+
{"current_steps": 31, "total_steps": 160, "loss": 1.0889, "lr": 1.946930129495106e-05, "epoch": 0.38360402165506574, "percentage": 19.38, "elapsed_time": "3:23:56", "remaining_time": "14:08:38"}
|
| 32 |
+
{"current_steps": 32, "total_steps": 160, "loss": 1.0831, "lr": 1.9396926207859085e-05, "epoch": 0.39597834493426143, "percentage": 20.0, "elapsed_time": "3:30:31", "remaining_time": "14:02:05"}
|
| 33 |
+
{"current_steps": 33, "total_steps": 160, "loss": 1.0624, "lr": 1.932007869282799e-05, "epoch": 0.40835266821345706, "percentage": 20.62, "elapsed_time": "3:37:06", "remaining_time": "13:55:33"}
|
| 34 |
+
{"current_steps": 34, "total_steps": 160, "loss": 1.0742, "lr": 1.9238795325112867e-05, "epoch": 0.42072699149265275, "percentage": 21.25, "elapsed_time": "3:43:37", "remaining_time": "13:48:43"}
|
| 35 |
+
{"current_steps": 35, "total_steps": 160, "loss": 1.0683, "lr": 1.9153114791194475e-05, "epoch": 0.43310131477184843, "percentage": 21.88, "elapsed_time": "3:50:11", "remaining_time": "13:42:08"}
|
| 36 |
+
{"current_steps": 36, "total_steps": 160, "loss": 1.0793, "lr": 1.9063077870366504e-05, "epoch": 0.44547563805104406, "percentage": 22.5, "elapsed_time": "3:56:45", "remaining_time": "13:35:28"}
|
| 37 |
+
{"current_steps": 37, "total_steps": 160, "loss": 1.0764, "lr": 1.8968727415326885e-05, "epoch": 0.45784996133023975, "percentage": 23.12, "elapsed_time": "4:03:14", "remaining_time": "13:28:36"}
|
| 38 |
+
{"current_steps": 38, "total_steps": 160, "loss": 1.0586, "lr": 1.887010833178222e-05, "epoch": 0.47022428460943544, "percentage": 23.75, "elapsed_time": "4:09:45", "remaining_time": "13:21:51"}
|
| 39 |
+
{"current_steps": 39, "total_steps": 160, "loss": 1.0676, "lr": 1.876726755707508e-05, "epoch": 0.48259860788863107, "percentage": 24.38, "elapsed_time": "4:16:16", "remaining_time": "13:15:06"}
|
| 40 |
+
{"current_steps": 40, "total_steps": 160, "loss": 1.0653, "lr": 1.866025403784439e-05, "epoch": 0.49497293116782676, "percentage": 25.0, "elapsed_time": "4:22:52", "remaining_time": "13:08:37"}
|
| 41 |
+
{"current_steps": 41, "total_steps": 160, "loss": 1.0617, "lr": 1.854911870672947e-05, "epoch": 0.5073472544470224, "percentage": 25.62, "elapsed_time": "4:29:23", "remaining_time": "13:01:53"}
|
| 42 |
+
{"current_steps": 42, "total_steps": 160, "loss": 1.0661, "lr": 1.843391445812886e-05, "epoch": 0.5197215777262181, "percentage": 26.25, "elapsed_time": "4:35:54", "remaining_time": "12:55:11"}
|
| 43 |
+
{"current_steps": 43, "total_steps": 160, "loss": 1.0652, "lr": 1.8314696123025456e-05, "epoch": 0.5320959010054138, "percentage": 26.88, "elapsed_time": "4:42:26", "remaining_time": "12:48:31"}
|
| 44 |
+
{"current_steps": 44, "total_steps": 160, "loss": 1.0713, "lr": 1.819152044288992e-05, "epoch": 0.5444702242846094, "percentage": 27.5, "elapsed_time": "4:48:58", "remaining_time": "12:41:50"}
|
| 45 |
+
{"current_steps": 45, "total_steps": 160, "loss": 1.0591, "lr": 1.806444604267483e-05, "epoch": 0.5568445475638051, "percentage": 28.12, "elapsed_time": "4:55:28", "remaining_time": "12:35:06"}
|
| 46 |
+
{"current_steps": 46, "total_steps": 160, "loss": 1.0472, "lr": 1.7933533402912354e-05, "epoch": 0.5692188708430008, "percentage": 28.75, "elapsed_time": "5:02:03", "remaining_time": "12:28:34"}
|
| 47 |
+
{"current_steps": 47, "total_steps": 160, "loss": 1.0621, "lr": 1.7798844830928818e-05, "epoch": 0.5815931941221965, "percentage": 29.38, "elapsed_time": "5:08:37", "remaining_time": "12:21:59"}
|
| 48 |
+
{"current_steps": 48, "total_steps": 160, "loss": 1.0467, "lr": 1.766044443118978e-05, "epoch": 0.5939675174013921, "percentage": 30.0, "elapsed_time": "5:15:10", "remaining_time": "12:15:24"}
|
| 49 |
+
{"current_steps": 49, "total_steps": 160, "loss": 1.0654, "lr": 1.7518398074789776e-05, "epoch": 0.6063418406805878, "percentage": 30.63, "elapsed_time": "5:21:46", "remaining_time": "12:08:55"}
|
| 50 |
+
{"current_steps": 50, "total_steps": 160, "loss": 1.0477, "lr": 1.737277336810124e-05, "epoch": 0.6187161639597835, "percentage": 31.25, "elapsed_time": "5:28:16", "remaining_time": "12:02:11"}
|
| 51 |
+
{"current_steps": 51, "total_steps": 160, "loss": 1.0619, "lr": 1.7223639620597556e-05, "epoch": 0.6310904872389791, "percentage": 31.87, "elapsed_time": "5:34:50", "remaining_time": "11:55:39"}
|
| 52 |
+
{"current_steps": 52, "total_steps": 160, "loss": 1.0471, "lr": 1.7071067811865477e-05, "epoch": 0.6434648105181748, "percentage": 32.5, "elapsed_time": "5:41:21", "remaining_time": "11:48:58"}
|
| 53 |
+
{"current_steps": 53, "total_steps": 160, "loss": 1.0534, "lr": 1.6915130557822698e-05, "epoch": 0.6558391337973705, "percentage": 33.12, "elapsed_time": "5:47:54", "remaining_time": "11:42:23"}
|
| 54 |
+
{"current_steps": 54, "total_steps": 160, "loss": 1.0618, "lr": 1.6755902076156606e-05, "epoch": 0.6682134570765661, "percentage": 33.75, "elapsed_time": "5:54:26", "remaining_time": "11:35:46"}
|
| 55 |
+
{"current_steps": 55, "total_steps": 160, "loss": 1.0612, "lr": 1.659345815100069e-05, "epoch": 0.6805877803557618, "percentage": 34.38, "elapsed_time": "6:01:00", "remaining_time": "11:29:12"}
|
| 56 |
+
{"current_steps": 56, "total_steps": 160, "loss": 1.0495, "lr": 1.6427876096865394e-05, "epoch": 0.6929621036349575, "percentage": 35.0, "elapsed_time": "6:07:34", "remaining_time": "11:22:38"}
|
| 57 |
+
{"current_steps": 57, "total_steps": 160, "loss": 1.0646, "lr": 1.6259234721840595e-05, "epoch": 0.7053364269141531, "percentage": 35.62, "elapsed_time": "6:14:10", "remaining_time": "11:16:09"}
|
| 58 |
+
{"current_steps": 58, "total_steps": 160, "loss": 1.0578, "lr": 1.608761429008721e-05, "epoch": 0.7177107501933488, "percentage": 36.25, "elapsed_time": "6:20:43", "remaining_time": "11:09:33"}
|
| 59 |
+
{"current_steps": 59, "total_steps": 160, "loss": 1.045, "lr": 1.5913096483635827e-05, "epoch": 0.7300850734725445, "percentage": 36.88, "elapsed_time": "6:27:14", "remaining_time": "11:02:55"}
|
| 60 |
+
{"current_steps": 60, "total_steps": 160, "loss": 1.051, "lr": 1.573576436351046e-05, "epoch": 0.7424593967517401, "percentage": 37.5, "elapsed_time": "6:33:46", "remaining_time": "10:56:17"}
|
| 61 |
+
{"current_steps": 61, "total_steps": 160, "loss": 1.0533, "lr": 1.5555702330196024e-05, "epoch": 0.7548337200309359, "percentage": 38.12, "elapsed_time": "6:40:20", "remaining_time": "10:49:44"}
|
| 62 |
+
{"current_steps": 62, "total_steps": 160, "loss": 1.0595, "lr": 1.5372996083468242e-05, "epoch": 0.7672080433101315, "percentage": 38.75, "elapsed_time": "6:46:50", "remaining_time": "10:43:04"}
|
| 63 |
+
{"current_steps": 63, "total_steps": 160, "loss": 1.0503, "lr": 1.5187732581605217e-05, "epoch": 0.7795823665893271, "percentage": 39.38, "elapsed_time": "6:53:24", "remaining_time": "10:36:31"}
|
| 64 |
+
{"current_steps": 64, "total_steps": 160, "loss": 1.0328, "lr": 1.5000000000000002e-05, "epoch": 0.7919566898685229, "percentage": 40.0, "elapsed_time": "6:59:59", "remaining_time": "10:29:59"}
|
| 65 |
+
{"current_steps": 65, "total_steps": 160, "loss": 1.0479, "lr": 1.4809887689193878e-05, "epoch": 0.8043310131477185, "percentage": 40.62, "elapsed_time": "7:06:33", "remaining_time": "10:23:25"}
|
| 66 |
+
{"current_steps": 66, "total_steps": 160, "loss": 1.0514, "lr": 1.4617486132350343e-05, "epoch": 0.8167053364269141, "percentage": 41.25, "elapsed_time": "7:13:07", "remaining_time": "10:16:52"}
|
| 67 |
+
{"current_steps": 67, "total_steps": 160, "loss": 1.0387, "lr": 1.4422886902190014e-05, "epoch": 0.8290796597061099, "percentage": 41.88, "elapsed_time": "7:19:39", "remaining_time": "10:10:16"}
|
| 68 |
+
{"current_steps": 68, "total_steps": 160, "loss": 1.0399, "lr": 1.4226182617406996e-05, "epoch": 0.8414539829853055, "percentage": 42.5, "elapsed_time": "7:26:12", "remaining_time": "10:03:42"}
|
| 69 |
+
{"current_steps": 69, "total_steps": 160, "loss": 1.0403, "lr": 1.4027466898587375e-05, "epoch": 0.8538283062645011, "percentage": 43.12, "elapsed_time": "7:32:45", "remaining_time": "9:57:06"}
|
| 70 |
+
{"current_steps": 70, "total_steps": 160, "loss": 1.0378, "lr": 1.3826834323650899e-05, "epoch": 0.8662026295436969, "percentage": 43.75, "elapsed_time": "7:39:15", "remaining_time": "9:50:28"}
|
| 71 |
+
{"current_steps": 71, "total_steps": 160, "loss": 1.045, "lr": 1.3624380382837017e-05, "epoch": 0.8785769528228925, "percentage": 44.38, "elapsed_time": "7:45:44", "remaining_time": "9:43:49"}
|
| 72 |
+
{"current_steps": 72, "total_steps": 160, "loss": 1.0344, "lr": 1.342020143325669e-05, "epoch": 0.8909512761020881, "percentage": 45.0, "elapsed_time": "7:52:12", "remaining_time": "9:37:08"}
|
| 73 |
+
{"current_steps": 73, "total_steps": 160, "loss": 1.0428, "lr": 1.3214394653031616e-05, "epoch": 0.9033255993812839, "percentage": 45.62, "elapsed_time": "7:58:43", "remaining_time": "9:30:32"}
|
| 74 |
+
{"current_steps": 74, "total_steps": 160, "loss": 1.043, "lr": 1.300705799504273e-05, "epoch": 0.9156999226604795, "percentage": 46.25, "elapsed_time": "8:05:12", "remaining_time": "9:23:53"}
|
| 75 |
+
{"current_steps": 75, "total_steps": 160, "loss": 1.0453, "lr": 1.2798290140309924e-05, "epoch": 0.9280742459396751, "percentage": 46.88, "elapsed_time": "8:11:45", "remaining_time": "9:17:19"}
|
| 76 |
+
{"current_steps": 76, "total_steps": 160, "loss": 1.0341, "lr": 1.2588190451025209e-05, "epoch": 0.9404485692188709, "percentage": 47.5, "elapsed_time": "8:18:15", "remaining_time": "9:10:42"}
|
| 77 |
+
{"current_steps": 77, "total_steps": 160, "loss": 1.0462, "lr": 1.2376858923261732e-05, "epoch": 0.9528228924980665, "percentage": 48.12, "elapsed_time": "8:24:46", "remaining_time": "9:04:06"}
|
| 78 |
+
{"current_steps": 78, "total_steps": 160, "loss": 1.0446, "lr": 1.2164396139381029e-05, "epoch": 0.9651972157772621, "percentage": 48.75, "elapsed_time": "8:31:15", "remaining_time": "8:57:28"}
|
| 79 |
+
{"current_steps": 79, "total_steps": 160, "loss": 1.045, "lr": 1.1950903220161286e-05, "epoch": 0.9775715390564579, "percentage": 49.38, "elapsed_time": "8:37:47", "remaining_time": "8:50:53"}
|
| 80 |
+
{"current_steps": 80, "total_steps": 160, "loss": 1.0377, "lr": 1.1736481776669307e-05, "epoch": 0.9899458623356535, "percentage": 50.0, "elapsed_time": "8:44:20", "remaining_time": "8:44:20"}
|
| 81 |
+
{"current_steps": 81, "total_steps": 160, "loss": 2.0242, "lr": 1.1521233861899168e-05, "epoch": 1.0123743232791957, "percentage": 50.62, "elapsed_time": "8:55:08", "remaining_time": "8:41:55"}
|
| 82 |
+
{"current_steps": 82, "total_steps": 160, "loss": 0.9894, "lr": 1.130526192220052e-05, "epoch": 1.0247486465583913, "percentage": 51.25, "elapsed_time": "9:01:38", "remaining_time": "8:35:13"}
|
| 83 |
+
{"current_steps": 83, "total_steps": 160, "loss": 0.9824, "lr": 1.1088668748519646e-05, "epoch": 1.037122969837587, "percentage": 51.88, "elapsed_time": "9:08:08", "remaining_time": "8:28:31"}
|
| 84 |
+
{"current_steps": 84, "total_steps": 160, "loss": 0.971, "lr": 1.0871557427476585e-05, "epoch": 1.0494972931167827, "percentage": 52.5, "elapsed_time": "9:14:37", "remaining_time": "8:21:47"}
|
| 85 |
+
{"current_steps": 85, "total_steps": 160, "loss": 0.9799, "lr": 1.0654031292301432e-05, "epoch": 1.0618716163959783, "percentage": 53.12, "elapsed_time": "9:21:13", "remaining_time": "8:15:11"}
|
| 86 |
+
{"current_steps": 86, "total_steps": 160, "loss": 0.975, "lr": 1.0436193873653362e-05, "epoch": 1.074245939675174, "percentage": 53.75, "elapsed_time": "9:27:50", "remaining_time": "8:08:36"}
|
| 87 |
+
{"current_steps": 87, "total_steps": 160, "loss": 0.9633, "lr": 1.0218148850345613e-05, "epoch": 1.0866202629543698, "percentage": 54.37, "elapsed_time": "9:34:21", "remaining_time": "8:01:56"}
|
| 88 |
+
{"current_steps": 88, "total_steps": 160, "loss": 0.9802, "lr": 1e-05, "epoch": 1.0989945862335653, "percentage": 55.0, "elapsed_time": "9:40:51", "remaining_time": "7:55:14"}
|
| 89 |
+
{"current_steps": 89, "total_steps": 160, "loss": 0.9617, "lr": 9.78185114965439e-06, "epoch": 1.111368909512761, "percentage": 55.62, "elapsed_time": "9:47:21", "remaining_time": "7:48:33"}
|
| 90 |
+
{"current_steps": 90, "total_steps": 160, "loss": 0.9729, "lr": 9.563806126346643e-06, "epoch": 1.1237432327919568, "percentage": 56.25, "elapsed_time": "9:53:51", "remaining_time": "7:41:53"}
|
| 91 |
+
{"current_steps": 91, "total_steps": 160, "loss": 0.9787, "lr": 9.34596870769857e-06, "epoch": 1.1361175560711523, "percentage": 56.88, "elapsed_time": "10:00:21", "remaining_time": "7:35:13"}
|
| 92 |
+
{"current_steps": 92, "total_steps": 160, "loss": 0.9715, "lr": 9.128442572523418e-06, "epoch": 1.148491879350348, "percentage": 57.5, "elapsed_time": "10:06:59", "remaining_time": "7:28:38"}
|
| 93 |
+
{"current_steps": 93, "total_steps": 160, "loss": 0.973, "lr": 8.911331251480357e-06, "epoch": 1.1608662026295438, "percentage": 58.13, "elapsed_time": "10:13:30", "remaining_time": "7:21:59"}
|
| 94 |
+
{"current_steps": 94, "total_steps": 160, "loss": 0.9718, "lr": 8.694738077799487e-06, "epoch": 1.1732405259087393, "percentage": 58.75, "elapsed_time": "10:20:04", "remaining_time": "7:15:22"}
|
| 95 |
+
{"current_steps": 95, "total_steps": 160, "loss": 0.9653, "lr": 8.478766138100834e-06, "epoch": 1.185614849187935, "percentage": 59.38, "elapsed_time": "10:26:35", "remaining_time": "7:08:43"}
|
| 96 |
+
{"current_steps": 96, "total_steps": 160, "loss": 0.9696, "lr": 8.263518223330698e-06, "epoch": 1.1979891724671308, "percentage": 60.0, "elapsed_time": "10:33:07", "remaining_time": "7:02:04"}
|
| 97 |
+
{"current_steps": 97, "total_steps": 160, "loss": 0.9661, "lr": 8.04909677983872e-06, "epoch": 1.2103634957463263, "percentage": 60.62, "elapsed_time": "10:39:38", "remaining_time": "6:55:26"}
|
| 98 |
+
{"current_steps": 98, "total_steps": 160, "loss": 0.972, "lr": 7.835603860618973e-06, "epoch": 1.222737819025522, "percentage": 61.25, "elapsed_time": "10:46:10", "remaining_time": "6:48:48"}
|
| 99 |
+
{"current_steps": 99, "total_steps": 160, "loss": 0.971, "lr": 7.623141076738271e-06, "epoch": 1.2351121423047178, "percentage": 61.88, "elapsed_time": "10:52:41", "remaining_time": "6:42:09"}
|
| 100 |
+
{"current_steps": 100, "total_steps": 160, "loss": 0.9619, "lr": 7.411809548974792e-06, "epoch": 1.2474864655839133, "percentage": 62.5, "elapsed_time": "10:59:10", "remaining_time": "6:35:30"}
|
| 101 |
+
{"current_steps": 101, "total_steps": 160, "loss": 0.958, "lr": 7.201709859690081e-06, "epoch": 1.259860788863109, "percentage": 63.12, "elapsed_time": "11:12:16", "remaining_time": "6:32:42"}
|
| 102 |
+
{"current_steps": 102, "total_steps": 160, "loss": 0.9727, "lr": 6.992942004957271e-06, "epoch": 1.2722351121423048, "percentage": 63.75, "elapsed_time": "11:18:49", "remaining_time": "6:26:00"}
|
| 103 |
+
{"current_steps": 103, "total_steps": 160, "loss": 0.9639, "lr": 6.785605346968387e-06, "epoch": 1.2846094354215003, "percentage": 64.38, "elapsed_time": "11:25:22", "remaining_time": "6:19:16"}
|
| 104 |
+
{"current_steps": 104, "total_steps": 160, "loss": 0.9648, "lr": 6.579798566743314e-06, "epoch": 1.296983758700696, "percentage": 65.0, "elapsed_time": "11:31:52", "remaining_time": "6:12:32"}
|
| 105 |
+
{"current_steps": 105, "total_steps": 160, "loss": 0.9695, "lr": 6.375619617162985e-06, "epoch": 1.3093580819798918, "percentage": 65.62, "elapsed_time": "11:38:23", "remaining_time": "6:05:49"}
|
| 106 |
+
{"current_steps": 106, "total_steps": 160, "loss": 0.9505, "lr": 6.173165676349103e-06, "epoch": 1.3217324052590875, "percentage": 66.25, "elapsed_time": "11:44:52", "remaining_time": "5:59:05"}
|
| 107 |
+
{"current_steps": 107, "total_steps": 160, "loss": 0.9694, "lr": 5.97253310141263e-06, "epoch": 1.334106728538283, "percentage": 66.88, "elapsed_time": "11:51:22", "remaining_time": "5:52:21"}
|
| 108 |
+
{"current_steps": 108, "total_steps": 160, "loss": 0.9609, "lr": 5.773817382593008e-06, "epoch": 1.3464810518174788, "percentage": 67.5, "elapsed_time": "11:57:52", "remaining_time": "5:45:38"}
|
| 109 |
+
{"current_steps": 109, "total_steps": 160, "loss": 0.962, "lr": 5.5771130978099896e-06, "epoch": 1.3588553750966743, "percentage": 68.12, "elapsed_time": "12:04:23", "remaining_time": "5:38:56"}
|
| 110 |
+
{"current_steps": 110, "total_steps": 160, "loss": 0.9764, "lr": 5.382513867649663e-06, "epoch": 1.37122969837587, "percentage": 68.75, "elapsed_time": "12:10:52", "remaining_time": "5:32:13"}
|
| 111 |
+
{"current_steps": 111, "total_steps": 160, "loss": 0.9574, "lr": 5.190112310806126e-06, "epoch": 1.3836040216550658, "percentage": 69.38, "elapsed_time": "12:17:22", "remaining_time": "5:25:30"}
|
| 112 |
+
{"current_steps": 112, "total_steps": 160, "loss": 0.968, "lr": 5.000000000000003e-06, "epoch": 1.3959783449342615, "percentage": 70.0, "elapsed_time": "12:23:52", "remaining_time": "5:18:48"}
|
| 113 |
+
{"current_steps": 113, "total_steps": 160, "loss": 0.9563, "lr": 4.812267418394784e-06, "epoch": 1.408352668213457, "percentage": 70.62, "elapsed_time": "12:30:25", "remaining_time": "5:12:07"}
|
| 114 |
+
{"current_steps": 114, "total_steps": 160, "loss": 0.9594, "lr": 4.627003916531761e-06, "epoch": 1.4207269914926528, "percentage": 71.25, "elapsed_time": "12:36:58", "remaining_time": "5:05:26"}
|
| 115 |
+
{"current_steps": 115, "total_steps": 160, "loss": 0.951, "lr": 4.444297669803981e-06, "epoch": 1.4331013147718483, "percentage": 71.88, "elapsed_time": "12:43:31", "remaining_time": "4:58:46"}
|
| 116 |
+
{"current_steps": 116, "total_steps": 160, "loss": 0.9445, "lr": 4.264235636489542e-06, "epoch": 1.445475638051044, "percentage": 72.5, "elapsed_time": "12:50:00", "remaining_time": "4:52:04"}
|
| 117 |
+
{"current_steps": 117, "total_steps": 160, "loss": 0.9681, "lr": 4.086903516364179e-06, "epoch": 1.4578499613302398, "percentage": 73.12, "elapsed_time": "12:56:31", "remaining_time": "4:45:23"}
|
| 118 |
+
{"current_steps": 118, "total_steps": 160, "loss": 0.9654, "lr": 3.912385709912794e-06, "epoch": 1.4702242846094355, "percentage": 73.75, "elapsed_time": "13:03:00", "remaining_time": "4:38:41"}
|
| 119 |
+
{"current_steps": 119, "total_steps": 160, "loss": 0.9589, "lr": 3.7407652781594094e-06, "epoch": 1.482598607888631, "percentage": 74.38, "elapsed_time": "13:09:31", "remaining_time": "4:32:01"}
|
| 120 |
+
{"current_steps": 120, "total_steps": 160, "loss": 0.9614, "lr": 3.5721239031346067e-06, "epoch": 1.4949729311678268, "percentage": 75.0, "elapsed_time": "13:16:01", "remaining_time": "4:25:20"}
|
| 121 |
+
{"current_steps": 121, "total_steps": 160, "loss": 0.9687, "lr": 3.4065418489993118e-06, "epoch": 1.5073472544470223, "percentage": 75.62, "elapsed_time": "13:22:32", "remaining_time": "4:18:40"}
|
| 122 |
+
{"current_steps": 122, "total_steps": 160, "loss": 0.9556, "lr": 3.2440979238433977e-06, "epoch": 1.519721577726218, "percentage": 76.25, "elapsed_time": "13:29:08", "remaining_time": "4:12:01"}
|
| 123 |
+
{"current_steps": 123, "total_steps": 160, "loss": 0.9579, "lr": 3.0848694421773075e-06, "epoch": 1.5320959010054138, "percentage": 76.88, "elapsed_time": "13:35:39", "remaining_time": "4:05:21"}
|
| 124 |
+
{"current_steps": 124, "total_steps": 160, "loss": 0.9647, "lr": 2.9289321881345257e-06, "epoch": 1.5444702242846096, "percentage": 77.5, "elapsed_time": "13:42:08", "remaining_time": "3:58:41"}
|
| 125 |
+
{"current_steps": 125, "total_steps": 160, "loss": 0.9512, "lr": 2.776360379402445e-06, "epoch": 1.556844547563805, "percentage": 78.12, "elapsed_time": "13:48:45", "remaining_time": "3:52:03"}
|
| 126 |
+
{"current_steps": 126, "total_steps": 160, "loss": 0.9643, "lr": 2.6272266318987606e-06, "epoch": 1.5692188708430008, "percentage": 78.75, "elapsed_time": "13:55:18", "remaining_time": "3:45:24"}
|
| 127 |
+
{"current_steps": 127, "total_steps": 160, "loss": 0.9416, "lr": 2.4816019252102274e-06, "epoch": 1.5815931941221963, "percentage": 79.38, "elapsed_time": "14:01:55", "remaining_time": "3:38:46"}
|
| 128 |
+
{"current_steps": 128, "total_steps": 160, "loss": 0.9655, "lr": 2.339555568810221e-06, "epoch": 1.593967517401392, "percentage": 80.0, "elapsed_time": "14:08:29", "remaining_time": "3:32:07"}
|
| 129 |
+
{"current_steps": 129, "total_steps": 160, "loss": 0.9618, "lr": 2.201155169071184e-06, "epoch": 1.6063418406805878, "percentage": 80.62, "elapsed_time": "14:14:59", "remaining_time": "3:25:27"}
|
| 130 |
+
{"current_steps": 130, "total_steps": 160, "loss": 0.9559, "lr": 2.0664665970876496e-06, "epoch": 1.6187161639597836, "percentage": 81.25, "elapsed_time": "14:21:31", "remaining_time": "3:18:48"}
|
| 131 |
+
{"current_steps": 131, "total_steps": 160, "loss": 0.9561, "lr": 1.9355539573251737e-06, "epoch": 1.631090487238979, "percentage": 81.88, "elapsed_time": "14:28:08", "remaining_time": "3:12:11"}
|
| 132 |
+
{"current_steps": 132, "total_steps": 160, "loss": 0.9613, "lr": 1.808479557110081e-06, "epoch": 1.6434648105181748, "percentage": 82.5, "elapsed_time": "14:34:43", "remaining_time": "3:05:32"}
|
| 133 |
+
{"current_steps": 133, "total_steps": 160, "loss": 0.9633, "lr": 1.6853038769745466e-06, "epoch": 1.6558391337973704, "percentage": 83.12, "elapsed_time": "14:41:19", "remaining_time": "2:58:54"}
|
| 134 |
+
{"current_steps": 134, "total_steps": 160, "loss": 0.9524, "lr": 1.566085541871145e-06, "epoch": 1.668213457076566, "percentage": 83.75, "elapsed_time": "14:47:51", "remaining_time": "2:52:16"}
|
| 135 |
+
{"current_steps": 135, "total_steps": 160, "loss": 0.9564, "lr": 1.4508812932705364e-06, "epoch": 1.6805877803557618, "percentage": 84.38, "elapsed_time": "14:54:21", "remaining_time": "2:45:37"}
|
| 136 |
+
{"current_steps": 136, "total_steps": 160, "loss": 0.9581, "lr": 1.339745962155613e-06, "epoch": 1.6929621036349576, "percentage": 85.0, "elapsed_time": "15:00:52", "remaining_time": "2:38:58"}
|
| 137 |
+
{"current_steps": 137, "total_steps": 160, "loss": 0.9515, "lr": 1.2327324429249232e-06, "epoch": 1.705336426914153, "percentage": 85.62, "elapsed_time": "15:07:27", "remaining_time": "2:32:20"}
|
| 138 |
+
{"current_steps": 138, "total_steps": 160, "loss": 0.965, "lr": 1.129891668217783e-06, "epoch": 1.7177107501933488, "percentage": 86.25, "elapsed_time": "15:14:01", "remaining_time": "2:25:42"}
|
| 139 |
+
{"current_steps": 139, "total_steps": 160, "loss": 0.9627, "lr": 1.0312725846731174e-06, "epoch": 1.7300850734725444, "percentage": 86.88, "elapsed_time": "15:20:34", "remaining_time": "2:19:04"}
|
| 140 |
+
{"current_steps": 140, "total_steps": 160, "loss": 0.9638, "lr": 9.369221296335007e-07, "epoch": 1.74245939675174, "percentage": 87.5, "elapsed_time": "15:27:08", "remaining_time": "2:12:26"}
|
| 141 |
+
{"current_steps": 141, "total_steps": 160, "loss": 0.9511, "lr": 8.468852088055291e-07, "epoch": 1.7548337200309359, "percentage": 88.12, "elapsed_time": "15:33:40", "remaining_time": "2:05:48"}
|
| 142 |
+
{"current_steps": 142, "total_steps": 160, "loss": 0.9513, "lr": 7.612046748871327e-07, "epoch": 1.7672080433101316, "percentage": 88.75, "elapsed_time": "15:40:12", "remaining_time": "1:59:10"}
|
| 143 |
+
{"current_steps": 143, "total_steps": 160, "loss": 0.9522, "lr": 6.799213071720156e-07, "epoch": 1.7795823665893271, "percentage": 89.38, "elapsed_time": "15:46:41", "remaining_time": "1:52:32"}
|
| 144 |
+
{"current_steps": 144, "total_steps": 160, "loss": 0.9581, "lr": 6.030737921409169e-07, "epoch": 1.7919566898685229, "percentage": 90.0, "elapsed_time": "15:53:14", "remaining_time": "1:45:54"}
|
| 145 |
+
{"current_steps": 145, "total_steps": 160, "loss": 0.9579, "lr": 5.306987050489442e-07, "epoch": 1.8043310131477184, "percentage": 90.62, "elapsed_time": "15:59:45", "remaining_time": "1:39:17"}
|
| 146 |
+
{"current_steps": 146, "total_steps": 160, "loss": 0.9709, "lr": 4.628304925177318e-07, "epoch": 1.8167053364269141, "percentage": 91.25, "elapsed_time": "16:06:14", "remaining_time": "1:32:39"}
|
| 147 |
+
{"current_steps": 147, "total_steps": 160, "loss": 0.9512, "lr": 3.99501456140714e-07, "epoch": 1.8290796597061099, "percentage": 91.88, "elapsed_time": "16:12:45", "remaining_time": "1:26:01"}
|
| 148 |
+
{"current_steps": 148, "total_steps": 160, "loss": 0.9525, "lr": 3.4074173710931804e-07, "epoch": 1.8414539829853056, "percentage": 92.5, "elapsed_time": "16:19:15", "remaining_time": "1:19:23"}
|
| 149 |
+
{"current_steps": 149, "total_steps": 160, "loss": 0.9463, "lr": 2.865793018673857e-07, "epoch": 1.8538283062645011, "percentage": 93.12, "elapsed_time": "16:25:52", "remaining_time": "1:12:46"}
|
| 150 |
+
{"current_steps": 150, "total_steps": 160, "loss": 0.9469, "lr": 2.370399288006664e-07, "epoch": 1.8662026295436969, "percentage": 93.75, "elapsed_time": "16:32:24", "remaining_time": "1:06:09"}
|
| 151 |
+
{"current_steps": 151, "total_steps": 160, "loss": 0.961, "lr": 1.921471959676957e-07, "epoch": 1.8785769528228924, "percentage": 94.38, "elapsed_time": "16:38:59", "remaining_time": "0:59:32"}
|
| 152 |
+
{"current_steps": 152, "total_steps": 160, "loss": 0.9465, "lr": 1.519224698779198e-07, "epoch": 1.8909512761020881, "percentage": 95.0, "elapsed_time": "16:45:33", "remaining_time": "0:52:55"}
|
| 153 |
+
{"current_steps": 153, "total_steps": 160, "loss": 0.9539, "lr": 1.1638489532239339e-07, "epoch": 1.9033255993812839, "percentage": 95.62, "elapsed_time": "16:52:04", "remaining_time": "0:46:18"}
|
| 154 |
+
{"current_steps": 154, "total_steps": 160, "loss": 0.9512, "lr": 8.555138626189619e-08, "epoch": 1.9156999226604796, "percentage": 96.25, "elapsed_time": "16:58:35", "remaining_time": "0:39:41"}
|
| 155 |
+
{"current_steps": 155, "total_steps": 160, "loss": 0.9656, "lr": 5.943661777680354e-08, "epoch": 1.9280742459396751, "percentage": 96.88, "elapsed_time": "17:05:07", "remaining_time": "0:33:04"}
|
| 156 |
+
{"current_steps": 156, "total_steps": 160, "loss": 0.9528, "lr": 3.805301908254455e-08, "epoch": 1.9404485692188709, "percentage": 97.5, "elapsed_time": "17:11:39", "remaining_time": "0:26:27"}
|
| 157 |
+
{"current_steps": 157, "total_steps": 160, "loss": 0.9609, "lr": 2.1410767613965212e-08, "epoch": 1.9528228924980664, "percentage": 98.12, "elapsed_time": "17:18:14", "remaining_time": "0:19:50"}
|
| 158 |
+
{"current_steps": 158, "total_steps": 160, "loss": 0.962, "lr": 9.517784181422018e-09, "epoch": 1.9651972157772621, "percentage": 98.75, "elapsed_time": "17:24:45", "remaining_time": "0:13:13"}
|
| 159 |
+
{"current_steps": 159, "total_steps": 160, "loss": 0.9612, "lr": 2.379729200908676e-09, "epoch": 1.9775715390564579, "percentage": 99.38, "elapsed_time": "17:31:16", "remaining_time": "0:06:36"}
|
| 160 |
+
{"current_steps": 160, "total_steps": 160, "loss": 0.9597, "lr": 0.0, "epoch": 1.9899458623356536, "percentage": 100.0, "elapsed_time": "17:37:46", "remaining_time": "0:00:00"}
|
| 161 |
+
{"current_steps": 160, "total_steps": 160, "epoch": 1.9899458623356536, "percentage": 100.0, "elapsed_time": "17:45:01", "remaining_time": "0:00:00"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7736
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05f1aa67890e57a74ebaa46fadabcff22deb3bb50e42f0179e1a1cfadaa403fd
|
| 3 |
size 7736
|