Training in progress, step 500
Browse files- .gitattributes +1 -0
- config.json +66 -0
- model.safetensors +3 -0
- runs/Apr06_11-20-31_gp01/events.out.tfevents.1743938436.gp01.4008839.0 +3 -0
- runs/Apr06_12-55-42_gp01/events.out.tfevents.1743944147.gp01.4048216.0 +3 -0
- runs/Apr07_10-00-55_gp01/events.out.tfevents.1744020060.gp01.313777.0 +3 -0
- runs/Apr07_10-18-52_gp01/events.out.tfevents.1744021136.gp01.318140.0 +3 -0
- runs/Apr07_10-24-08_gp01/events.out.tfevents.1744021453.gp01.320760.0 +3 -0
- runs/Apr07_10-36-39_gp01/events.out.tfevents.1744022204.gp01.326123.0 +3 -0
- runs/Apr07_10-42-40_gp01/events.out.tfevents.1744022565.gp01.328824.0 +3 -0
- runs/Apr07_12-13-53_gp01/events.out.tfevents.1744028038.gp01.381148.0 +3 -0
- runs/Apr07_20-38-06_gp01/events.out.tfevents.1744058290.gp01.491979.0 +3 -0
- runs/Apr07_20-43-05_gp01/events.out.tfevents.1744058589.gp01.494154.0 +3 -0
- runs/Apr07_20-55-42_gp01/events.out.tfevents.1744059346.gp01.500835.0 +3 -0
- runs/Apr12_10-29-06_gp01/events.out.tfevents.1744453751.gp01.3472498.0 +3 -0
- runs/Apr12_10-33-44_gp01/events.out.tfevents.1744454029.gp01.3478016.0 +3 -0
- runs/Apr12_10-52-43_gp01/events.out.tfevents.1744455168.gp01.3495757.0 +3 -0
- runs/Apr12_13-12-32_gp01/events.out.tfevents.1744463556.gp01.3633647.0 +3 -0
- runs/Apr12_13-18-11_gp01/events.out.tfevents.1744463896.gp01.3636918.0 +3 -0
- runs/Apr21_10-18-25_gp01/events.out.tfevents.1745230712.gp01.2087389.0 +3 -0
- runs/Apr21_10-31-04_gp01/events.out.tfevents.1745231470.gp01.2095885.0 +3 -0
- runs/Apr21_12-21-30_gp01/events.out.tfevents.1745238097.gp01.2141558.0 +3 -0
- runs/Apr21_12-32-12_gp01/events.out.tfevents.1745238738.gp01.2147951.0 +3 -0
- runs/Apr21_12-37-41_gp01/events.out.tfevents.1745239067.gp01.2150943.0 +3 -0
- special_tokens_map.json +51 -0
- tokenizer.json +3 -0
- tokenizer_config.json +55 -0
- training_args.bin +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
|
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"XLMRobertaLoRA"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"auto_map": {
|
| 7 |
+
"AutoConfig": "jinaai/xlm-roberta-flash-implementation--configuration_xlm_roberta.XLMRobertaFlashConfig",
|
| 8 |
+
"AutoModel": "jinaai/xlm-roberta-flash-implementation--modeling_lora.XLMRobertaLoRA",
|
| 9 |
+
"AutoModelForMaskedLM": "jinaai/xlm-roberta-flash-implementation--modeling_xlm_roberta.XLMRobertaForMaskedLM",
|
| 10 |
+
"AutoModelForPreTraining": "jinaai/xlm-roberta-flash-implementation--modeling_xlm_roberta.XLMRobertaForPreTraining"
|
| 11 |
+
},
|
| 12 |
+
"bos_token_id": 0,
|
| 13 |
+
"classifier_dropout": null,
|
| 14 |
+
"emb_pooler": null,
|
| 15 |
+
"eos_token_id": 2,
|
| 16 |
+
"hidden_act": "gelu",
|
| 17 |
+
"hidden_dropout_prob": 0.1,
|
| 18 |
+
"hidden_size": 1024,
|
| 19 |
+
"initializer_range": 0.02,
|
| 20 |
+
"intermediate_size": 4096,
|
| 21 |
+
"layer_norm_eps": 1e-05,
|
| 22 |
+
"load_trained_adapters": true,
|
| 23 |
+
"lora_adaptations": [
|
| 24 |
+
"hadith_retrieval.query",
|
| 25 |
+
"hadith_retrieval.passage",
|
| 26 |
+
"separation",
|
| 27 |
+
"classification",
|
| 28 |
+
"text-matching"
|
| 29 |
+
],
|
| 30 |
+
"lora_alpha": 1,
|
| 31 |
+
"lora_dropout_p": 0.0,
|
| 32 |
+
"lora_main_params_trainable": false,
|
| 33 |
+
"lora_rank": 4,
|
| 34 |
+
"matryoshka_dimensions": [
|
| 35 |
+
32,
|
| 36 |
+
64,
|
| 37 |
+
128,
|
| 38 |
+
256,
|
| 39 |
+
512,
|
| 40 |
+
768,
|
| 41 |
+
1024
|
| 42 |
+
],
|
| 43 |
+
"max_position_embeddings": 8194,
|
| 44 |
+
"model_type": "xlm-roberta",
|
| 45 |
+
"num_attention_heads": 16,
|
| 46 |
+
"num_hidden_layers": 24,
|
| 47 |
+
"output_past": true,
|
| 48 |
+
"pad_token_id": 1,
|
| 49 |
+
"position_embedding_type": "rotary",
|
| 50 |
+
"rotary_emb_base": 20000.0,
|
| 51 |
+
"task_instructions": {
|
| 52 |
+
"classification": "",
|
| 53 |
+
"hadith_retrieval.passage": "Represent the hadith for retrieval: ",
|
| 54 |
+
"hadith_retrieval.query": "Represent the query for retrieving related hadiths: ",
|
| 55 |
+
"separation": "",
|
| 56 |
+
"text-matching": ""
|
| 57 |
+
},
|
| 58 |
+
"torch_dtype": "bfloat16",
|
| 59 |
+
"transformers_version": "4.50.3",
|
| 60 |
+
"truncate_dim": null,
|
| 61 |
+
"type_vocab_size": 1,
|
| 62 |
+
"use_cache": true,
|
| 63 |
+
"use_flash_attn": true,
|
| 64 |
+
"use_reentrant": false,
|
| 65 |
+
"vocab_size": 250002
|
| 66 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee6d5757440d99428055d93ab30fe871e38a64f3f9fcf0344302b92040b3d6fc
|
| 3 |
+
size 1144685320
|
runs/Apr06_11-20-31_gp01/events.out.tfevents.1743938436.gp01.4008839.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd3bc49a88e4e8df4a15a2ab4a5483003c00e28f2071c02066838043423ecb84
|
| 3 |
+
size 4423
|
runs/Apr06_12-55-42_gp01/events.out.tfevents.1743944147.gp01.4048216.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18bfd406021aa752f76bfb3d0abe142cb8ab0a7ecf9488d2e6efa4acc5ad20e0
|
| 3 |
+
size 4423
|
runs/Apr07_10-00-55_gp01/events.out.tfevents.1744020060.gp01.313777.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e81abd8250cad167df98021769d00021b19a99fb10270914f6697f7b99270b2c
|
| 3 |
+
size 4771
|
runs/Apr07_10-18-52_gp01/events.out.tfevents.1744021136.gp01.318140.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bb72618276e4093c43b96fcb04a30c95ed03d0b6bd067ff1adc9a6c8e1b052fb
|
| 3 |
+
size 4772
|
runs/Apr07_10-24-08_gp01/events.out.tfevents.1744021453.gp01.320760.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:85c782890440e4112f9b86274f6bae974b9d6f79adb4599621269b3220e88abc
|
| 3 |
+
size 4773
|
runs/Apr07_10-36-39_gp01/events.out.tfevents.1744022204.gp01.326123.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe47108707d18916b6ce30594338c3ca615f699f9ddb45a81fd5d3e0ed249c30
|
| 3 |
+
size 4424
|
runs/Apr07_10-42-40_gp01/events.out.tfevents.1744022565.gp01.328824.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f20dc7513c761344d076efbe00a8c8dedf7392415d33193b462f92f6d70c440
|
| 3 |
+
size 6534
|
runs/Apr07_12-13-53_gp01/events.out.tfevents.1744028038.gp01.381148.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7675eeab03688fd76abe778f44cbf8039b8f3b8568c59f9b639054ff901349c
|
| 3 |
+
size 6534
|
runs/Apr07_20-38-06_gp01/events.out.tfevents.1744058290.gp01.491979.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b1cf95b5e7cf99bec098a63c0d49263714e8b461dcaaaea576e0df62bf400b4
|
| 3 |
+
size 4424
|
runs/Apr07_20-43-05_gp01/events.out.tfevents.1744058589.gp01.494154.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22ad757a0eae378e7ff7fec4a998a47abe5fdd2eaac2e10ad7a56b6882b80c98
|
| 3 |
+
size 4636
|
runs/Apr07_20-55-42_gp01/events.out.tfevents.1744059346.gp01.500835.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e4c6bbf72059c0ec0d11eb02748a2fcace2998155d9b3bd8ebcc96307d6e5d84
|
| 3 |
+
size 14332
|
runs/Apr12_10-29-06_gp01/events.out.tfevents.1744453751.gp01.3472498.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27aa67fc107b585c462ea644e3eabcd8dcf5923426c3c7f5c5b84ea62b78cdd0
|
| 3 |
+
size 4877
|
runs/Apr12_10-33-44_gp01/events.out.tfevents.1744454029.gp01.3478016.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d842973a5c6c603d05f1cb781f7a2f43b88d632fbba0a9014cc978b60b00030b
|
| 3 |
+
size 4877
|
runs/Apr12_10-52-43_gp01/events.out.tfevents.1744455168.gp01.3495757.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4048e137f685d0cf125ca319158a9b5c253f1f71b91aef9259be89a261f95c8b
|
| 3 |
+
size 6343
|
runs/Apr12_13-12-32_gp01/events.out.tfevents.1744463556.gp01.3633647.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c12eb4f68f3bdb2ca70a2d3ba01a95200f2ce1342388df32cbe7b2b20d3058ee
|
| 3 |
+
size 4877
|
runs/Apr12_13-18-11_gp01/events.out.tfevents.1744463896.gp01.3636918.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e4cda083d26d05365b349c28e53a6136688c2fc625ad3dc6e404c7df8c4123f
|
| 3 |
+
size 31129
|
runs/Apr21_10-18-25_gp01/events.out.tfevents.1745230712.gp01.2087389.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee44c0696e1db5ca035c8dfc5e30d4dc7f1c8a27e8206bd951c916953cdd57b0
|
| 3 |
+
size 4876
|
runs/Apr21_10-31-04_gp01/events.out.tfevents.1745231470.gp01.2095885.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf7139866f90ec2841c6a05e1bb910a05652ffed755e27d0bae0b5fff9a1bd29
|
| 3 |
+
size 4876
|
runs/Apr21_12-21-30_gp01/events.out.tfevents.1745238097.gp01.2141558.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:afc61eceffafe2dadb522e241248774fd1977d914e88f2fab9ce8191555abd53
|
| 3 |
+
size 5132
|
runs/Apr21_12-32-12_gp01/events.out.tfevents.1745238738.gp01.2147951.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c32a78ca3afa9bfb5390be5d644ad184b024fc6742c5f5c382a9acd46a292c2d
|
| 3 |
+
size 4877
|
runs/Apr21_12-37-41_gp01/events.out.tfevents.1745239067.gp01.2150943.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:301740f6368aa8adec46214ae7a2cd554c5eafa0e08f3ae6c769869d0ac27561
|
| 3 |
+
size 5424
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"cls_token": {
|
| 10 |
+
"content": "<s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"eos_token": {
|
| 17 |
+
"content": "</s>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"mask_token": {
|
| 24 |
+
"content": "<mask>",
|
| 25 |
+
"lstrip": true,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"pad_token": {
|
| 31 |
+
"content": "<pad>",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
},
|
| 37 |
+
"sep_token": {
|
| 38 |
+
"content": "</s>",
|
| 39 |
+
"lstrip": false,
|
| 40 |
+
"normalized": false,
|
| 41 |
+
"rstrip": false,
|
| 42 |
+
"single_word": false
|
| 43 |
+
},
|
| 44 |
+
"unk_token": {
|
| 45 |
+
"content": "<unk>",
|
| 46 |
+
"lstrip": false,
|
| 47 |
+
"normalized": false,
|
| 48 |
+
"rstrip": false,
|
| 49 |
+
"single_word": false
|
| 50 |
+
}
|
| 51 |
+
}
|
tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e19cd8c08f528b481e909f73dbd1fd62b1e8b1117579ba205e477801237f9e0
|
| 3 |
+
size 17082988
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "<s>",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<pad>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "</s>",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "<unk>",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"250001": {
|
| 36 |
+
"content": "<mask>",
|
| 37 |
+
"lstrip": true,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"bos_token": "<s>",
|
| 45 |
+
"clean_up_tokenization_spaces": true,
|
| 46 |
+
"cls_token": "<s>",
|
| 47 |
+
"eos_token": "</s>",
|
| 48 |
+
"extra_special_tokens": {},
|
| 49 |
+
"mask_token": "<mask>",
|
| 50 |
+
"model_max_length": 8194,
|
| 51 |
+
"pad_token": "<pad>",
|
| 52 |
+
"sep_token": "</s>",
|
| 53 |
+
"tokenizer_class": "XLMRobertaTokenizerFast",
|
| 54 |
+
"unk_token": "<unk>"
|
| 55 |
+
}
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:efbec979f53d5e9c05d32c9cb9bf8ef20cbfd829f8b126b2a71d818a4e64138c
|
| 3 |
+
size 5816
|