Training in progress, step 500
Browse files
config.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "
|
| 3 |
"architectures": [
|
| 4 |
-
"
|
| 5 |
],
|
| 6 |
"classifier_dropout": 0.0,
|
| 7 |
"d_ff": 1024,
|
|
@@ -16,7 +16,7 @@
|
|
| 16 |
"is_encoder_decoder": true,
|
| 17 |
"is_gated_act": true,
|
| 18 |
"layer_norm_epsilon": 1e-06,
|
| 19 |
-
"model_type": "
|
| 20 |
"num_decoder_layers": 8,
|
| 21 |
"num_heads": 6,
|
| 22 |
"num_layers": 8,
|
|
@@ -28,5 +28,5 @@
|
|
| 28 |
"torch_dtype": "float32",
|
| 29 |
"transformers_version": "4.38.2",
|
| 30 |
"use_cache": true,
|
| 31 |
-
"vocab_size":
|
| 32 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "frt5-base",
|
| 3 |
"architectures": [
|
| 4 |
+
"T5ForConditionalGeneration"
|
| 5 |
],
|
| 6 |
"classifier_dropout": 0.0,
|
| 7 |
"d_ff": 1024,
|
|
|
|
| 16 |
"is_encoder_decoder": true,
|
| 17 |
"is_gated_act": true,
|
| 18 |
"layer_norm_epsilon": 1e-06,
|
| 19 |
+
"model_type": "t5",
|
| 20 |
"num_decoder_layers": 8,
|
| 21 |
"num_heads": 6,
|
| 22 |
"num_layers": 8,
|
|
|
|
| 28 |
"torch_dtype": "float32",
|
| 29 |
"transformers_version": "4.38.2",
|
| 30 |
"use_cache": true,
|
| 31 |
+
"vocab_size": 10666
|
| 32 |
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:463198ac43bc776ec376aa9a0124ab220e44e70a7bb8a4e26a9ab10acd905ce6
|
| 3 |
+
size 219958696
|
runs/Mar16_22-20-15_5d4177ac2335/events.out.tfevents.1710627615.5d4177ac2335.11191.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90062438be22a724a8f33efa767340e752286c58c721db858b24caad12ddb026
|
| 3 |
+
size 4840
|
runs/Mar16_22-20-56_5d4177ac2335/events.out.tfevents.1710627657.5d4177ac2335.11191.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eac35e5d08fedd26e7d3054144d98a0b5d0651270ddff2c69ba7a8099d34badd
|
| 3 |
+
size 5053
|
spiece.model
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:353d57e9d6e540b17f88d54025ea29a774aa4cfa953381fdeb0dd1e4dd7c2859
|
| 3 |
+
size 426213
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5048
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3918e19caec8a47fc0af352020526af4be5783331f1e127eb09fdc9ae45e74a3
|
| 3 |
size 5048
|