Training in progress, step 100
Browse files- .gitignore +1 -0
- config.json +27 -0
- pytorch_model.bin +3 -0
- runs/Apr06_21-43-46_jupyter/events.out.tfevents.1712440020.jupyter.1095181.0 +3 -0
- runs/Apr06_21-49-15_jupyter/events.out.tfevents.1712440167.jupyter.1095655.0 +3 -0
- runs/Apr06_22-21-37_jupyter/events.out.tfevents.1712442120.jupyter.1096218.0 +3 -0
- runs/Apr06_22-23-31_jupyter/events.out.tfevents.1712442221.jupyter.1096677.0 +3 -0
- runs/Apr06_22-25-43_jupyter/events.out.tfevents.1712442471.jupyter.1097115.0 +3 -0
- runs/Apr06_22-29-12_jupyter/events.out.tfevents.1712442560.jupyter.1098082.0 +3 -0
- runs/Apr06_22-57-17_jupyter/events.out.tfevents.1712444248.jupyter.1098636.0 +3 -0
- runs/Apr06_22-59-26_jupyter/events.out.tfevents.1712444398.jupyter.1099087.0 +3 -0
- runs/Apr06_23-01-01_jupyter/events.out.tfevents.1712444493.jupyter.1099525.0 +3 -0
- runs/Apr06_23-02-53_jupyter/events.out.tfevents.1712444580.jupyter.1099963.0 +3 -0
- runs/Apr07_06-41-28_jupyter/events.out.tfevents.1712472176.jupyter.1213479.0 +3 -0
- runs/Apr07_07-09-05_jupyter/events.out.tfevents.1712473787.jupyter.1215769.0 +3 -0
- runs/Apr07_07-14-08_jupyter/events.out.tfevents.1712474072.jupyter.1216486.0 +3 -0
- runs/Apr07_07-15-22_jupyter/events.out.tfevents.1712474149.jupyter.1216486.1 +3 -0
- training_args.bin +3 -0
.gitignore
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
checkpoint-*/
|
config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_name_or_path": "roberta-base",
|
| 3 |
+
"architectures": [
|
| 4 |
+
"RobertaForMaskedLM"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"classifier_dropout": null,
|
| 9 |
+
"eos_token_id": 2,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 768,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 3072,
|
| 15 |
+
"layer_norm_eps": 1e-05,
|
| 16 |
+
"max_position_embeddings": 514,
|
| 17 |
+
"model_type": "roberta",
|
| 18 |
+
"num_attention_heads": 12,
|
| 19 |
+
"num_hidden_layers": 12,
|
| 20 |
+
"pad_token_id": 1,
|
| 21 |
+
"position_embedding_type": "absolute",
|
| 22 |
+
"torch_dtype": "float32",
|
| 23 |
+
"transformers_version": "4.30.2",
|
| 24 |
+
"type_vocab_size": 1,
|
| 25 |
+
"use_cache": true,
|
| 26 |
+
"vocab_size": 50265
|
| 27 |
+
}
|
pytorch_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9bedff8a96f5b0c1dc56fbc266f1a73af8af1efcdbbe9c63954271cceadacfb0
|
| 3 |
+
size 498861675
|
runs/Apr06_21-43-46_jupyter/events.out.tfevents.1712440020.jupyter.1095181.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1df1292ea3a23800ec4bb39342d61796ca9a5e0781c7ba8d396ea4e37e599a4b
|
| 3 |
+
size 249
|
runs/Apr06_21-49-15_jupyter/events.out.tfevents.1712440167.jupyter.1095655.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fbed67aca18b7b54a4a2e60021a442b27227f2e1c14c15c5a02225fc955a090d
|
| 3 |
+
size 4020
|
runs/Apr06_22-21-37_jupyter/events.out.tfevents.1712442120.jupyter.1096218.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c14a5dacb4f23d374bf7f074c5ae3bcdab6e985c5151634c7596dfbd996a1a38
|
| 3 |
+
size 40
|
runs/Apr06_22-23-31_jupyter/events.out.tfevents.1712442221.jupyter.1096677.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac1e5282f6cac753b4263a4c4b7ade1a92eac2bdc717a3d2e89ca86079e62f4e
|
| 3 |
+
size 40
|
runs/Apr06_22-25-43_jupyter/events.out.tfevents.1712442471.jupyter.1097115.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae61c22a6ed0a4f24ad79c05c698c61a0b79b670fb0fbe43c9d2ac2bda9092e0
|
| 3 |
+
size 249
|
runs/Apr06_22-29-12_jupyter/events.out.tfevents.1712442560.jupyter.1098082.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8421d01418815ade49d98a6d218556679e01ecd2e286bbaececa98a20b7fa88b
|
| 3 |
+
size 4136
|
runs/Apr06_22-57-17_jupyter/events.out.tfevents.1712444248.jupyter.1098636.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4cdf6e8af85ac5f07fac9e3c74ea9c3a8ec14ac6fa896846c0f87381e38cdb0b
|
| 3 |
+
size 40
|
runs/Apr06_22-59-26_jupyter/events.out.tfevents.1712444398.jupyter.1099087.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d877975042db3dbc0375ca7adf98a02b9580432630547db31275ca19ee451526
|
| 3 |
+
size 40
|
runs/Apr06_23-01-01_jupyter/events.out.tfevents.1712444493.jupyter.1099525.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cf8a3b39e40136382ebc46e6182ec78a78cd654122c7039d7abec1acf96a973
|
| 3 |
+
size 40
|
runs/Apr06_23-02-53_jupyter/events.out.tfevents.1712444580.jupyter.1099963.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:928f0a13309b95ab77c4fbd9e362b3d9e92a8f11ccec54a8f27d85015afb3b40
|
| 3 |
+
size 4019
|
runs/Apr07_06-41-28_jupyter/events.out.tfevents.1712472176.jupyter.1213479.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af163002d477c22c311c12191eb9ae7b873187c9c5602bf7f725ebcd98d60370
|
| 3 |
+
size 4019
|
runs/Apr07_07-09-05_jupyter/events.out.tfevents.1712473787.jupyter.1215769.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4436c20bc2806997a7f1a4b0a65040762e7ab3ea2790b04dbb20138af96a85b4
|
| 3 |
+
size 40
|
runs/Apr07_07-14-08_jupyter/events.out.tfevents.1712474072.jupyter.1216486.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c25d7e7dff5806302d8fdc4a91a5506549e02e950913c95bfd428878244d04dc
|
| 3 |
+
size 249
|
runs/Apr07_07-15-22_jupyter/events.out.tfevents.1712474149.jupyter.1216486.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af395f94782271a65189a0ef49eceb14cf84b029e5281ee3f3ef8eb696cefba1
|
| 3 |
+
size 6886
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31e01243357afc8f1679c48f2f1789489e459ae3b42e8e0b0c3d864f0a5f8026
|
| 3 |
+
size 3951
|