Training in progress, step 500
Browse files- config.json +2 -2
- model.safetensors +2 -2
- runs/Oct07_00-31-56_fba93fe4b606/events.out.tfevents.1728261117.fba93fe4b606.339.1 +3 -0
- runs/Oct07_01-55-45_fba93fe4b606/events.out.tfevents.1728266148.fba93fe4b606.14368.1 +3 -0
- runs/Oct07_01-56-58_fba93fe4b606/events.out.tfevents.1728266219.fba93fe4b606.14368.2 +3 -0
- runs/Oct07_01-57-07_fba93fe4b606/events.out.tfevents.1728266228.fba93fe4b606.14368.3 +3 -0
- runs/Oct07_01-57-14_fba93fe4b606/events.out.tfevents.1728266236.fba93fe4b606.14368.4 +3 -0
- training_args.bin +1 -1
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "google/long-t5-
|
| 3 |
"architectures": [
|
| 4 |
"LongT5ForConditionalGeneration"
|
| 5 |
],
|
|
@@ -9,7 +9,7 @@
|
|
| 9 |
"decoder_start_token_id": 0,
|
| 10 |
"dense_act_fn": "gelu_new",
|
| 11 |
"dropout_rate": 0.1,
|
| 12 |
-
"encoder_attention_type": "
|
| 13 |
"eos_token_id": 1,
|
| 14 |
"feed_forward_proj": "gated-gelu",
|
| 15 |
"global_block_size": 16,
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "google/long-t5-tglobal-base",
|
| 3 |
"architectures": [
|
| 4 |
"LongT5ForConditionalGeneration"
|
| 5 |
],
|
|
|
|
| 9 |
"decoder_start_token_id": 0,
|
| 10 |
"dense_act_fn": "gelu_new",
|
| 11 |
"dropout_rate": 0.1,
|
| 12 |
+
"encoder_attention_type": "transient-global",
|
| 13 |
"eos_token_id": 1,
|
| 14 |
"feed_forward_proj": "gated-gelu",
|
| 15 |
"global_block_size": 16,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5262ebc1956a5e5e53b4a46ffdb877dee40648cb4599bb18c1b98aef9b7da640
|
| 3 |
+
size 1187780840
|
runs/Oct07_00-31-56_fba93fe4b606/events.out.tfevents.1728261117.fba93fe4b606.339.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d2abf10f25a5a144af8812b9ca50f1dc655983e50dca45576063779df14969a
|
| 3 |
+
size 5304
|
runs/Oct07_01-55-45_fba93fe4b606/events.out.tfevents.1728266148.fba93fe4b606.14368.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc7e3030b8cc8e81f9f4f4aba05ba4f6a1bb42b80f809bfddbb4acb15fda50c0
|
| 3 |
+
size 5304
|
runs/Oct07_01-56-58_fba93fe4b606/events.out.tfevents.1728266219.fba93fe4b606.14368.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:73042c17c5528d83eba7481580b0a5a9c0bcc7b4c253c5f48f0f40feb0b875e2
|
| 3 |
+
size 5304
|
runs/Oct07_01-57-07_fba93fe4b606/events.out.tfevents.1728266228.fba93fe4b606.14368.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e81fd8938ba4ee70da027080ddf8fa3979a874f4f74b28950c72d40d258de9c
|
| 3 |
+
size 5304
|
runs/Oct07_01-57-14_fba93fe4b606/events.out.tfevents.1728266236.fba93fe4b606.14368.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:24a6e13ce229e07045565220c08df0c1956fd74f8c8e892eacdbe0fc2597e832
|
| 3 |
+
size 6040
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5304
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7322e553a407a45ed3734bcdc3c3fc6859d445261f6e68e9c1cd41cd5691c007
|
| 3 |
size 5304
|