diff --git a/.gitattributes b/.gitattributes
index 8aa863d30fd5de8ae287f94c801d09831b42fad8..9ad638b7f0eb54f86a3d3831f846e50144e8beb1 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -36,3 +36,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
arabic_corpus.csv filter=lfs diff=lfs merge=lfs -text
hindi_corpus.csv filter=lfs diff=lfs merge=lfs -text
russian_corpus.csv filter=lfs diff=lfs merge=lfs -text
+checkpoint-1000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-1500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-2000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-2500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-3000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-3500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-4000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-4500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-5000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-5500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-6000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+checkpoint-6500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
diff --git a/checkpoint-1000/config.json b/checkpoint-1000/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-1000/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-1000/optimizer.pt b/checkpoint-1000/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..6297b26b12de8d33ce73fb2094ab7e9664ed4aef
--- /dev/null
+++ b/checkpoint-1000/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:035111fdb4d604ca283c9b9144812f36070c5ffaed16acb0c6b9f06e9885d8ef
+size 2224498234
diff --git a/checkpoint-1000/pytorch_model.bin b/checkpoint-1000/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..48a6ef154958f7fd992f7ae9bb5fd69f061844e2
--- /dev/null
+++ b/checkpoint-1000/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e543d77fd926d39ab1d2f039fc0d394395d4ce30ff5d798aabd4d7839fb648e
+size 1112263858
diff --git a/checkpoint-1000/rng_state.pth b/checkpoint-1000/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..ca0f50de1a5b705770b30d6f2516dd13abf74e3d
--- /dev/null
+++ b/checkpoint-1000/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:beb31bbdf7d9c5b7925e77559815c830119baa2fca30f37fb6aaab50bb6d991e
+size 14244
diff --git a/checkpoint-1000/scaler.pt b/checkpoint-1000/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..d94c5393f9a0ea261b878365d01e00ce7e9a48f5
--- /dev/null
+++ b/checkpoint-1000/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8c5bcf736f1b79303746fdacc768ece77446afaa1877de8dda3da8348fbcc7d5
+size 988
diff --git a/checkpoint-1000/scheduler.pt b/checkpoint-1000/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..b827acba45350261c0d00d6f6dc874e6719a18ae
--- /dev/null
+++ b/checkpoint-1000/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9878794dee7a9fc2f1e2977e16568f0d445f879bd810524aafb5aa9662642230
+size 1064
diff --git a/checkpoint-1000/sentencepiece.bpe.model b/checkpoint-1000/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-1000/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-1000/special_tokens_map.json b/checkpoint-1000/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-1000/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-1000/tokenizer.json b/checkpoint-1000/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-1000/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-1000/tokenizer_config.json b/checkpoint-1000/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-1000/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-1000/trainer_state.json b/checkpoint-1000/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..583a2065823e4dd5b7eda0f61671e73056aae577
--- /dev/null
+++ b/checkpoint-1000/trainer_state.json
@@ -0,0 +1,15 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 0.30012004801920766,
+ "global_step": 1000,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 2289752745025152.0,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-1000/training_args.bin b/checkpoint-1000/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-1000/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-1500/config.json b/checkpoint-1500/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-1500/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-1500/optimizer.pt b/checkpoint-1500/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..d2d01d7b29144b0c990228f4a676a189c9a06e06
--- /dev/null
+++ b/checkpoint-1500/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8939341b8e960508664efe97d5c04b21d50d002d6e34a5255ccd9be656fa4583
+size 2224498234
diff --git a/checkpoint-1500/pytorch_model.bin b/checkpoint-1500/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3139d533845ac4e82c6082cc96e4cfb4d2f05c01
--- /dev/null
+++ b/checkpoint-1500/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0e3bea9b0c14ea4d6002d6b6b3fe155ebdf941aae1b2032500030036c92aa6f9
+size 1112263858
diff --git a/checkpoint-1500/rng_state.pth b/checkpoint-1500/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..44b87b5928f34680ca95cba2120b3185adf2d84f
--- /dev/null
+++ b/checkpoint-1500/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0e2e9972f20a1c6a3e1f3d986d339d5b18060252505bf307e90192b5ff67bee9
+size 14244
diff --git a/checkpoint-1500/scaler.pt b/checkpoint-1500/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..ee46283434e08199c2a86c70151e1c4e2fb928d0
--- /dev/null
+++ b/checkpoint-1500/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0617efbfbb7fc93b69f89ca8af67f24948e1b623a640583096a01c1e14d1a779
+size 988
diff --git a/checkpoint-1500/scheduler.pt b/checkpoint-1500/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..9f0fdb951bd1ecac6bdc19bc08fe7002549fd3be
--- /dev/null
+++ b/checkpoint-1500/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:947bcff8be39e16d93459c65045979b4f4e7391de422d205370ed75adf2cf818
+size 1064
diff --git a/checkpoint-1500/sentencepiece.bpe.model b/checkpoint-1500/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-1500/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-1500/special_tokens_map.json b/checkpoint-1500/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-1500/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-1500/tokenizer.json b/checkpoint-1500/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-1500/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-1500/tokenizer_config.json b/checkpoint-1500/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-1500/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-1500/trainer_state.json b/checkpoint-1500/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..d6db5d0cd099ca0cc48c46b6916254d8432131b9
--- /dev/null
+++ b/checkpoint-1500/trainer_state.json
@@ -0,0 +1,15 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 0.45018007202881155,
+ "global_step": 1500,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 3427344033968256.0,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-1500/training_args.bin b/checkpoint-1500/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-1500/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-2000/config.json b/checkpoint-2000/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-2000/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-2000/optimizer.pt b/checkpoint-2000/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..3aa7e74e789efe29445b985def6e34d4bfeab939
--- /dev/null
+++ b/checkpoint-2000/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e5c9506e4f39cdbc3af672d4d67543ed0aac71410a09676e08b4dd242997ec24
+size 2224498234
diff --git a/checkpoint-2000/pytorch_model.bin b/checkpoint-2000/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f776e5087d2c0cd18eb5122f21178c795d210e99
--- /dev/null
+++ b/checkpoint-2000/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9411f3ca927abef81eea2d70d8c9924b86ba017963d0dc3120a597df8b1d7523
+size 1112263858
diff --git a/checkpoint-2000/rng_state.pth b/checkpoint-2000/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..a1410bfc428b484074cff2189a5249635c4e58fb
--- /dev/null
+++ b/checkpoint-2000/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e66fbaebc79bf7c3a7d803385b9042c1ee2e1282975ecb6e28bdddf202c62b45
+size 14244
diff --git a/checkpoint-2000/scaler.pt b/checkpoint-2000/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..ea3614f9d51f0c0f07ac70cec8983eb426058f4f
--- /dev/null
+++ b/checkpoint-2000/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c494b3df6951b3dfb8d6d667cd822246eceb1361f5933fe08326cb830fde1b2c
+size 988
diff --git a/checkpoint-2000/scheduler.pt b/checkpoint-2000/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..375bf05f7258086d5b4bee24f2758c7f9aa74440
--- /dev/null
+++ b/checkpoint-2000/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4dcecb64fbe503a9351db23cde6507c02a6349d16bd78d72f1f281cb8a2eb4d6
+size 1064
diff --git a/checkpoint-2000/sentencepiece.bpe.model b/checkpoint-2000/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-2000/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-2000/special_tokens_map.json b/checkpoint-2000/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-2000/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-2000/tokenizer.json b/checkpoint-2000/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-2000/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-2000/tokenizer_config.json b/checkpoint-2000/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-2000/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-2000/trainer_state.json b/checkpoint-2000/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..441c14871e4be7e9792d8e2c633143dd25f4cb8c
--- /dev/null
+++ b/checkpoint-2000/trainer_state.json
@@ -0,0 +1,15 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 0.6002400960384153,
+ "global_step": 2000,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 4569868788082560.0,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-2000/training_args.bin b/checkpoint-2000/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-2000/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-2500/config.json b/checkpoint-2500/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-2500/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-2500/optimizer.pt b/checkpoint-2500/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..e2a1a46a5df264a3c2c7a5e84482cb37dcaae0a5
--- /dev/null
+++ b/checkpoint-2500/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b2f34072663e7d19b085d14a6f6f603f3593a02c04e5a7cf45021c74be20df72
+size 2224498234
diff --git a/checkpoint-2500/pytorch_model.bin b/checkpoint-2500/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ab2960e383f9aaec912e18139027eac87e2e1569
--- /dev/null
+++ b/checkpoint-2500/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f737b6e4f38cf9d48930ebd4c3aa7355c176d29ad78fc2b97870d070d9a8f15a
+size 1112263858
diff --git a/checkpoint-2500/rng_state.pth b/checkpoint-2500/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..aea92f92ba3895e0a8ad2f8c618d7dd22ad29525
--- /dev/null
+++ b/checkpoint-2500/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aaca9360678d07ba300097459dfbc25ecbad4780b3d504bd52723840f51b3895
+size 14244
diff --git a/checkpoint-2500/scaler.pt b/checkpoint-2500/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..155c6588094fa0e3c56029dea7908beef7aac6e3
--- /dev/null
+++ b/checkpoint-2500/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e327e2fc109e7cb11a5de71c5b47a658cf81d9ad28f6990f404bf0161361e673
+size 988
diff --git a/checkpoint-2500/scheduler.pt b/checkpoint-2500/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..a1937d1b0fb572f4789ab461a060adefe425ef73
--- /dev/null
+++ b/checkpoint-2500/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:de0a9d338f40108c37209c103e3542be6a7bb598a8dc5b0c8ee11bc6e244c010
+size 1064
diff --git a/checkpoint-2500/sentencepiece.bpe.model b/checkpoint-2500/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-2500/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-2500/special_tokens_map.json b/checkpoint-2500/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-2500/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-2500/tokenizer.json b/checkpoint-2500/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-2500/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-2500/tokenizer_config.json b/checkpoint-2500/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-2500/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-2500/trainer_state.json b/checkpoint-2500/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..6a144d377f5a294dbd8e3463b157fe71397a6a2a
--- /dev/null
+++ b/checkpoint-2500/trainer_state.json
@@ -0,0 +1,15 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 0.7503001200480192,
+ "global_step": 2500,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 5704763116065408.0,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-2500/training_args.bin b/checkpoint-2500/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-2500/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-3000/config.json b/checkpoint-3000/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-3000/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-3000/optimizer.pt b/checkpoint-3000/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..9e52ad11da68886e23f08e728dc376de5e213f4e
--- /dev/null
+++ b/checkpoint-3000/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7c343bbaa8ddbc24f6aa61b62b15d8f75feba7afb23c5b62149faf4a10dd9b8b
+size 2224498234
diff --git a/checkpoint-3000/pytorch_model.bin b/checkpoint-3000/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..52cb7730b9255bb9e06723b9b37e72f538eaecb1
--- /dev/null
+++ b/checkpoint-3000/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e46dffa55535486a8acab06cc84a1d925a48e4e491a28e806238c72f1809030c
+size 1112263858
diff --git a/checkpoint-3000/rng_state.pth b/checkpoint-3000/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..0944744b96abe8cf399ebdaa9cff47bdf6aaebe3
--- /dev/null
+++ b/checkpoint-3000/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ce3c9c7c1836a8854e95828187436ca984ce5618080c1de46f7781ae68338f56
+size 14244
diff --git a/checkpoint-3000/scaler.pt b/checkpoint-3000/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..64d3ff09bb87e9994d8e76e600ae76ac103bb3d8
--- /dev/null
+++ b/checkpoint-3000/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:70ab76333d06d884d5e443a2ad621fc4a5a7d6a50f51ad1cce2e0e2d30b5327b
+size 988
diff --git a/checkpoint-3000/scheduler.pt b/checkpoint-3000/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..32456e12dcf3b1de9989d94317382ad2bd52fc0b
--- /dev/null
+++ b/checkpoint-3000/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:300c998e2cc30e9e152e3c87f68429a387b1581d00cf57926b84ae58e39a0d51
+size 1064
diff --git a/checkpoint-3000/sentencepiece.bpe.model b/checkpoint-3000/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-3000/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-3000/special_tokens_map.json b/checkpoint-3000/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-3000/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-3000/tokenizer.json b/checkpoint-3000/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-3000/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-3000/tokenizer_config.json b/checkpoint-3000/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-3000/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-3000/trainer_state.json b/checkpoint-3000/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..aed8ed3da6e25f3c57ba2cf940c8b15717fda2c4
--- /dev/null
+++ b/checkpoint-3000/trainer_state.json
@@ -0,0 +1,15 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 0.9003601440576231,
+ "global_step": 3000,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 6835875120750336.0,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-3000/training_args.bin b/checkpoint-3000/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-3000/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-3500/config.json b/checkpoint-3500/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-3500/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-3500/optimizer.pt b/checkpoint-3500/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..4139cbc642e689d46a53d93c5cd1ee0ed93e5257
--- /dev/null
+++ b/checkpoint-3500/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eaddc3a4d410ef152641700ca133c318da086d88e624e9cf0c85dbb44a0e9033
+size 2224498234
diff --git a/checkpoint-3500/pytorch_model.bin b/checkpoint-3500/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4b1bcc4a10b0df71301e5ccd92756585ae75266c
--- /dev/null
+++ b/checkpoint-3500/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:59dd34f7a1b24f22539b3e150c1e29296165b4065d293999123f2b1d4993c304
+size 1112263858
diff --git a/checkpoint-3500/rng_state.pth b/checkpoint-3500/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..27b2a526993c0971e4b4b99c06151694e584a18f
--- /dev/null
+++ b/checkpoint-3500/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c57cda6f0fd2c17c84bfc2dae3e2afd1f3fd1f81677f65b29ce2cdc3f5b45ac4
+size 14244
diff --git a/checkpoint-3500/scaler.pt b/checkpoint-3500/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..6321d7c7270b6bfa83421d487dec4378c1bf64b5
--- /dev/null
+++ b/checkpoint-3500/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dbdb7492a0661aca7d7ba8026bad4935918d9a2cd6ddeb5e7d11db4707b6d6a7
+size 988
diff --git a/checkpoint-3500/scheduler.pt b/checkpoint-3500/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..290a5f6699a2876382b897f36c6bf21677a82c02
--- /dev/null
+++ b/checkpoint-3500/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0e84bf4be2ade1c3d9ef167425dd3c6629ae186978d3326ae10c5b3388e07800
+size 1064
diff --git a/checkpoint-3500/sentencepiece.bpe.model b/checkpoint-3500/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-3500/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-3500/special_tokens_map.json b/checkpoint-3500/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-3500/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-3500/tokenizer.json b/checkpoint-3500/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-3500/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-3500/tokenizer_config.json b/checkpoint-3500/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-3500/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-3500/trainer_state.json b/checkpoint-3500/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..50bf4495523955e48063ca503f51a1471741209f
--- /dev/null
+++ b/checkpoint-3500/trainer_state.json
@@ -0,0 +1,32 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 1.050420168067227,
+ "global_step": 3500,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [
+ {
+ "epoch": 1.0,
+ "learning_rate": 1.0015006002400962e-05,
+ "loss": 0.0212,
+ "step": 3331
+ },
+ {
+ "epoch": 1.0,
+ "eval_accuracy": 0.9995778453225261,
+ "eval_f1": 0.9995778832712353,
+ "eval_loss": 0.0017540693515911698,
+ "eval_runtime": 27.5028,
+ "eval_samples_per_second": 861.295,
+ "eval_steps_per_second": 6.763,
+ "step": 3332
+ }
+ ],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 7964693064130656.0,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-3500/training_args.bin b/checkpoint-3500/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-3500/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-4000/config.json b/checkpoint-4000/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-4000/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-4000/optimizer.pt b/checkpoint-4000/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..07a6a27a7a1c9f88d3aed0e993cb880f62eb3b80
--- /dev/null
+++ b/checkpoint-4000/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bfdb07d6b317742b52ef24e922d654dba7c39b19728e54f3e8a001460cbbcc10
+size 2224498234
diff --git a/checkpoint-4000/pytorch_model.bin b/checkpoint-4000/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..95772af40855102a2291d7476fbb808622bd5fe6
--- /dev/null
+++ b/checkpoint-4000/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1ce808fff64259caedfc00d1a13dd0c0b5ba1e82a5f8f7b5fcd73a8a8d903407
+size 1112263858
diff --git a/checkpoint-4000/rng_state.pth b/checkpoint-4000/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..f179dd1cd4d8c3ef79746d6f408289ada681f171
--- /dev/null
+++ b/checkpoint-4000/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f41338c7f8329e9652749236c1c77dd0268a24048905062b119e1f17578893a8
+size 14244
diff --git a/checkpoint-4000/scaler.pt b/checkpoint-4000/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..87cb1bd0266bfc950996dd18a13ca44c002b2ef4
--- /dev/null
+++ b/checkpoint-4000/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f78956da0255b4f3c7028d2db42721c8359c50d974c8de242310c44135fd3fb3
+size 988
diff --git a/checkpoint-4000/scheduler.pt b/checkpoint-4000/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..77e68edd84314eb0cd9483a825ec4f48444dca65
--- /dev/null
+++ b/checkpoint-4000/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ad38463a9ae2261fb2700c27dddf0424bba42530c078813c5cb52c3e890dead0
+size 1064
diff --git a/checkpoint-4000/sentencepiece.bpe.model b/checkpoint-4000/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-4000/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-4000/special_tokens_map.json b/checkpoint-4000/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-4000/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-4000/tokenizer.json b/checkpoint-4000/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-4000/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-4000/tokenizer_config.json b/checkpoint-4000/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-4000/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-4000/trainer_state.json b/checkpoint-4000/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..aed8f5a517c6b22e5ec1d284fb0ccda78d2a12f0
--- /dev/null
+++ b/checkpoint-4000/trainer_state.json
@@ -0,0 +1,32 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 1.2004801920768307,
+ "global_step": 4000,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [
+ {
+ "epoch": 1.0,
+ "learning_rate": 1.0015006002400962e-05,
+ "loss": 0.0212,
+ "step": 3331
+ },
+ {
+ "epoch": 1.0,
+ "eval_accuracy": 0.9995778453225261,
+ "eval_f1": 0.9995778832712353,
+ "eval_loss": 0.0017540693515911698,
+ "eval_runtime": 27.5028,
+ "eval_samples_per_second": 861.295,
+ "eval_steps_per_second": 6.763,
+ "step": 3332
+ }
+ ],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 9105836447997024.0,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-4000/training_args.bin b/checkpoint-4000/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-4000/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-4500/config.json b/checkpoint-4500/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-4500/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-4500/optimizer.pt b/checkpoint-4500/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..df625c0bce3ce132eaf408a2778e25e2c5c241c4
--- /dev/null
+++ b/checkpoint-4500/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2ede5a968107e376f623e9e723a94c58e73cc60e513a70a9a8263d8b1d362f43
+size 2224498234
diff --git a/checkpoint-4500/pytorch_model.bin b/checkpoint-4500/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..632127a510876a379d59d99a38c7e46f14fe8692
--- /dev/null
+++ b/checkpoint-4500/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af6ed4d8f40fe590b8543c1fb8189c3f2682ad3d78beddf10fc314e7639f6be2
+size 1112263858
diff --git a/checkpoint-4500/rng_state.pth b/checkpoint-4500/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..5e56df358ac5a6cee846d2b86130ccd2bd340af5
--- /dev/null
+++ b/checkpoint-4500/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37813bafa05604126a78a60288a15bbd5cce316c658d44673ce0b26eaf8cd220
+size 14244
diff --git a/checkpoint-4500/scaler.pt b/checkpoint-4500/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..5c6bb1073dec0b26a3ac7ccb3ed25fc82e392454
--- /dev/null
+++ b/checkpoint-4500/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c80c64ef7099feee387f2e29d9a055fad893d0c2cfee38dc1c50180d92ac3b4a
+size 988
diff --git a/checkpoint-4500/scheduler.pt b/checkpoint-4500/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..d15dfaa718146d2f0d10824df0a47e40a4454f40
--- /dev/null
+++ b/checkpoint-4500/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05e265c3e508d7623e1cb2276b267462b4f28022f353f7d5793df0b166fbb48f
+size 1064
diff --git a/checkpoint-4500/sentencepiece.bpe.model b/checkpoint-4500/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-4500/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-4500/special_tokens_map.json b/checkpoint-4500/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-4500/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-4500/tokenizer.json b/checkpoint-4500/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-4500/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-4500/tokenizer_config.json b/checkpoint-4500/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-4500/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-4500/trainer_state.json b/checkpoint-4500/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..dc9f24579eb774000788ab5779abf6b6a90ff7e4
--- /dev/null
+++ b/checkpoint-4500/trainer_state.json
@@ -0,0 +1,32 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 1.3505402160864346,
+ "global_step": 4500,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [
+ {
+ "epoch": 1.0,
+ "learning_rate": 1.0015006002400962e-05,
+ "loss": 0.0212,
+ "step": 3331
+ },
+ {
+ "epoch": 1.0,
+ "eval_accuracy": 0.9995778453225261,
+ "eval_f1": 0.9995778832712353,
+ "eval_loss": 0.0017540693515911698,
+ "eval_runtime": 27.5028,
+ "eval_samples_per_second": 861.295,
+ "eval_steps_per_second": 6.763,
+ "step": 3332
+ }
+ ],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 1.02494794542168e+16,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-4500/training_args.bin b/checkpoint-4500/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-4500/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-500/config.json b/checkpoint-500/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-500/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-500/optimizer.pt b/checkpoint-500/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..08f652119c121517ece42c771d3353f287d598e0
--- /dev/null
+++ b/checkpoint-500/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f08f0055cc0b2063c50a944fd65da8d5cd7d29d2276653def7d94bbef0620aa7
+size 2224498234
diff --git a/checkpoint-500/pytorch_model.bin b/checkpoint-500/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..86d0ddcd0d7c0977c5efcf3ce89bc33196836668
--- /dev/null
+++ b/checkpoint-500/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bfb25cbc7a4f8b46ad4397c396b128bc344cfbc8f2ce825bb7abea261f7944e1
+size 1112263858
diff --git a/checkpoint-500/rng_state.pth b/checkpoint-500/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..e70115011f9f37b19369b0324e6795904371e48e
--- /dev/null
+++ b/checkpoint-500/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9cb4e37d624ed2885a6f31e04584af4b86b3fb8a74a12c56443a363c9a9f544d
+size 14244
diff --git a/checkpoint-500/scaler.pt b/checkpoint-500/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..5ad8cffce393d48d2f085bee3a95ae48a091b2d6
--- /dev/null
+++ b/checkpoint-500/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e0d8adddd1388932d2ed9b90b5c277a7847c95951a525f62dc60f3bd12186b70
+size 988
diff --git a/checkpoint-500/scheduler.pt b/checkpoint-500/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..fc09397bd58a53e3114fd92ffa59b3de16112a21
--- /dev/null
+++ b/checkpoint-500/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:21dbdba64bd4741def0eef0be431357dfbc15db76e27b6425669ff9cf8e73c1f
+size 1064
diff --git a/checkpoint-500/sentencepiece.bpe.model b/checkpoint-500/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-500/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-500/special_tokens_map.json b/checkpoint-500/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-500/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-500/tokenizer.json b/checkpoint-500/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-500/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-500/tokenizer_config.json b/checkpoint-500/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-500/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-500/trainer_state.json b/checkpoint-500/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..c48ec11caea8c067f8a87e16aef3de2ac5ddb5d1
--- /dev/null
+++ b/checkpoint-500/trainer_state.json
@@ -0,0 +1,15 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 0.15006002400960383,
+ "global_step": 500,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 1135453454035584.0,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-500/training_args.bin b/checkpoint-500/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-500/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-5000/config.json b/checkpoint-5000/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-5000/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-5000/optimizer.pt b/checkpoint-5000/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..2202ff48a17ede16f42eb38c8b92b7e62e501177
--- /dev/null
+++ b/checkpoint-5000/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d4178238e255eab6b08d139885ddf7e272c02062e8efb84fbdcaae347b85e6e3
+size 2224498234
diff --git a/checkpoint-5000/pytorch_model.bin b/checkpoint-5000/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..563b64b15c85dc7604923bf6e4e0abeb064193ba
--- /dev/null
+++ b/checkpoint-5000/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f79c3e447a394201bb56e5fa3520412996e5c43b78d7a1f685ac8c615bfb1c2
+size 1112263858
diff --git a/checkpoint-5000/rng_state.pth b/checkpoint-5000/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..9c80cfc17a599048089da3b5da1d96fbd2094540
--- /dev/null
+++ b/checkpoint-5000/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e40bdff45954b2de186da9b7a8828193f488320b7e637d6c1011128ea88d7f5
+size 14244
diff --git a/checkpoint-5000/scaler.pt b/checkpoint-5000/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..91677e0386653af46263f12bc74bf93bcd324b77
--- /dev/null
+++ b/checkpoint-5000/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4b9dc27fbd1463c1c244b47b0f00093a364926c54babc4c59f05d717764f712e
+size 988
diff --git a/checkpoint-5000/scheduler.pt b/checkpoint-5000/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..2dfd1b59f956d27da77717af56e39182a25eed6e
--- /dev/null
+++ b/checkpoint-5000/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ebf6b2ee598f0ac4335df31d040667462dd02e3d1eac62858ee5b8679cfc7d7e
+size 1064
diff --git a/checkpoint-5000/sentencepiece.bpe.model b/checkpoint-5000/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-5000/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-5000/special_tokens_map.json b/checkpoint-5000/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-5000/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-5000/tokenizer.json b/checkpoint-5000/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-5000/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-5000/tokenizer_config.json b/checkpoint-5000/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-5000/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-5000/trainer_state.json b/checkpoint-5000/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..4f8a18d4ffdc2e01f9509bb0dd4159f8853ceab5
--- /dev/null
+++ b/checkpoint-5000/trainer_state.json
@@ -0,0 +1,32 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 1.5006002400960385,
+ "global_step": 5000,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [
+ {
+ "epoch": 1.0,
+ "learning_rate": 1.0015006002400962e-05,
+ "loss": 0.0212,
+ "step": 3331
+ },
+ {
+ "epoch": 1.0,
+ "eval_accuracy": 0.9995778453225261,
+ "eval_f1": 0.9995778832712353,
+ "eval_loss": 0.0017540693515911698,
+ "eval_runtime": 27.5028,
+ "eval_samples_per_second": 861.295,
+ "eval_steps_per_second": 6.763,
+ "step": 3332
+ }
+ ],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 1.1390524168779744e+16,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-5000/training_args.bin b/checkpoint-5000/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-5000/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-5500/config.json b/checkpoint-5500/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-5500/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-5500/optimizer.pt b/checkpoint-5500/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..60a10712b05d593feae831ab70e3f3103aa53e02
--- /dev/null
+++ b/checkpoint-5500/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8dfc1cd3e1438a9b967ab46ab6700369f95fe6b8d0e0ca651fde85b3f4b19a9b
+size 2224498234
diff --git a/checkpoint-5500/pytorch_model.bin b/checkpoint-5500/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..76a5f23fe31befdd0ba4f04eddfe090b80beb0b6
--- /dev/null
+++ b/checkpoint-5500/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4ab602fbbd80d582a8319cad6f85b8f3ec956b70ab486d71c941fbce80f84492
+size 1112263858
diff --git a/checkpoint-5500/rng_state.pth b/checkpoint-5500/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..5cd3bb473d5b1e86b49a9084a0ffea1ce5ebf17e
--- /dev/null
+++ b/checkpoint-5500/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76aa3360d7d58394dde61580a71ef09a36386de9bc069b58648a4b7eb7956764
+size 14244
diff --git a/checkpoint-5500/scaler.pt b/checkpoint-5500/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..04352e611065685e4a7e376ea393b1139861ae56
--- /dev/null
+++ b/checkpoint-5500/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b0c5f5318dbfd4ec3e3f1b738f1106bdfe27e69649a8191846c8955cd547df61
+size 988
diff --git a/checkpoint-5500/scheduler.pt b/checkpoint-5500/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..a1549c7486ec2af46bf68bd19d965d792a243cb2
--- /dev/null
+++ b/checkpoint-5500/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:172090f82e3fcbc5b15497fa960d62e6c96e5417c8582bd8c3a152c42f43a439
+size 1064
diff --git a/checkpoint-5500/sentencepiece.bpe.model b/checkpoint-5500/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-5500/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-5500/special_tokens_map.json b/checkpoint-5500/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-5500/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-5500/tokenizer.json b/checkpoint-5500/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-5500/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-5500/tokenizer_config.json b/checkpoint-5500/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-5500/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-5500/trainer_state.json b/checkpoint-5500/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..f696ddcc5ef2f9062597fa8b95922163ccde8022
--- /dev/null
+++ b/checkpoint-5500/trainer_state.json
@@ -0,0 +1,32 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 1.6506602641056423,
+ "global_step": 5500,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [
+ {
+ "epoch": 1.0,
+ "learning_rate": 1.0015006002400962e-05,
+ "loss": 0.0212,
+ "step": 3331
+ },
+ {
+ "epoch": 1.0,
+ "eval_accuracy": 0.9995778453225261,
+ "eval_f1": 0.9995778832712353,
+ "eval_loss": 0.0017540693515911698,
+ "eval_runtime": 27.5028,
+ "eval_samples_per_second": 861.295,
+ "eval_steps_per_second": 6.763,
+ "step": 3332
+ }
+ ],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 1.2531404434503648e+16,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-5500/training_args.bin b/checkpoint-5500/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-5500/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-6000/config.json b/checkpoint-6000/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-6000/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-6000/optimizer.pt b/checkpoint-6000/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..22dc4f17be5de49fd994c2a713f8dd97f63c23d4
--- /dev/null
+++ b/checkpoint-6000/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8ed485bf2f5e145ecd29e12ec22b056a95dd18b55c2f3f80fcd2cb0e7e44ea56
+size 2224498234
diff --git a/checkpoint-6000/pytorch_model.bin b/checkpoint-6000/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0166dd7746fc56fb7c5d814de77ae30211d73602
--- /dev/null
+++ b/checkpoint-6000/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b8c2001ea07d6e0b3806c5920b574eb2727fe105a8d3e3ad5baa7f55da8d29a8
+size 1112263858
diff --git a/checkpoint-6000/rng_state.pth b/checkpoint-6000/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..493f0974417e26103b8008fb31a76f777143f3aa
--- /dev/null
+++ b/checkpoint-6000/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3613a86fedc1c5ca98b5397a6b85ac0af7166ac0cfa7db2884a422a6ad6d9e4
+size 14244
diff --git a/checkpoint-6000/scaler.pt b/checkpoint-6000/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..a60b866a2bae2570772d5dd4bdbaa3c5d4ae7007
--- /dev/null
+++ b/checkpoint-6000/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6dce5f63b5dd43a0656a34bc3613915acebc1141d3be72ea7bb2c6992bbeae0a
+size 988
diff --git a/checkpoint-6000/scheduler.pt b/checkpoint-6000/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..ca0b7f67abab5968b9a53888b22ebb4e09a87e83
--- /dev/null
+++ b/checkpoint-6000/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:839295a4446eff234c3d35d9f2f87aae80ea3cce7c4ed455babe53a7ad6c6897
+size 1064
diff --git a/checkpoint-6000/sentencepiece.bpe.model b/checkpoint-6000/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-6000/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-6000/special_tokens_map.json b/checkpoint-6000/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-6000/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-6000/tokenizer.json b/checkpoint-6000/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-6000/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-6000/tokenizer_config.json b/checkpoint-6000/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-6000/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-6000/trainer_state.json b/checkpoint-6000/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..05318f9b379ce8b99d7c3bc1e85954ae8f4bceb8
--- /dev/null
+++ b/checkpoint-6000/trainer_state.json
@@ -0,0 +1,32 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 1.800720288115246,
+ "global_step": 6000,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [
+ {
+ "epoch": 1.0,
+ "learning_rate": 1.0015006002400962e-05,
+ "loss": 0.0212,
+ "step": 3331
+ },
+ {
+ "epoch": 1.0,
+ "eval_accuracy": 0.9995778453225261,
+ "eval_f1": 0.9995778832712353,
+ "eval_loss": 0.0017540693515911698,
+ "eval_runtime": 27.5028,
+ "eval_samples_per_second": 861.295,
+ "eval_steps_per_second": 6.763,
+ "step": 3332
+ }
+ ],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 1.3667449904359776e+16,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-6000/training_args.bin b/checkpoint-6000/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-6000/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/checkpoint-6500/config.json b/checkpoint-6500/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252
--- /dev/null
+++ b/checkpoint-6500/config.json
@@ -0,0 +1,43 @@
+{
+ "_name_or_path": "xlm-roberta-base",
+ "architectures": [
+ "XLMRobertaForSequenceClassification"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "arabic",
+ "1": "english",
+ "2": "french",
+ "3": "german",
+ "4": "russian"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "arabic": 0,
+ "english": 1,
+ "french": 2,
+ "german": 3,
+ "russian": 4
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 514,
+ "model_type": "xlm-roberta",
+ "num_attention_heads": 12,
+ "num_hidden_layers": 12,
+ "output_past": true,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "problem_type": "single_label_classification",
+ "torch_dtype": "float32",
+ "transformers_version": "4.28.0",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 250002
+}
diff --git a/checkpoint-6500/optimizer.pt b/checkpoint-6500/optimizer.pt
new file mode 100644
index 0000000000000000000000000000000000000000..bee317cda419af90fde0adc2a83305abfdccdcbe
--- /dev/null
+++ b/checkpoint-6500/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d2cfad20cffe487f12be9be3ff681919ced6737908b77141e20e70034f3d413c
+size 2224498234
diff --git a/checkpoint-6500/pytorch_model.bin b/checkpoint-6500/pytorch_model.bin
new file mode 100644
index 0000000000000000000000000000000000000000..23aaaac74b7ae0a01869715f2ae5bbc21fd4e9a1
--- /dev/null
+++ b/checkpoint-6500/pytorch_model.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d0dad78c51d82d6311378bc2b3f90957a56d82d5e95e7ee81b6ffdf2d901db91
+size 1112263858
diff --git a/checkpoint-6500/rng_state.pth b/checkpoint-6500/rng_state.pth
new file mode 100644
index 0000000000000000000000000000000000000000..c4c701e704bd111229d851afdea7cbbb2a4a7ffe
--- /dev/null
+++ b/checkpoint-6500/rng_state.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:66b6ca701ad91ec0d02c670628f7f41a47ddf196f3b3bf2c9636895be039ef9b
+size 14244
diff --git a/checkpoint-6500/scaler.pt b/checkpoint-6500/scaler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..ae3cfb18b44e35d96129db1122ff7c0101d7ece8
--- /dev/null
+++ b/checkpoint-6500/scaler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6d128ac992361b84f58da2d39bcc05cf0200f1c98c9a834dfd72247aecce8cd
+size 988
diff --git a/checkpoint-6500/scheduler.pt b/checkpoint-6500/scheduler.pt
new file mode 100644
index 0000000000000000000000000000000000000000..a02d47686cb912db604765cd6e4e8a977ae8a5ab
--- /dev/null
+++ b/checkpoint-6500/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c9f5d32cd992b7f052e1858a521ac70520a4b9ffa161d4dcb4c241caa4753167
+size 1064
diff --git a/checkpoint-6500/sentencepiece.bpe.model b/checkpoint-6500/sentencepiece.bpe.model
new file mode 100644
index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c
--- /dev/null
+++ b/checkpoint-6500/sentencepiece.bpe.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051
diff --git a/checkpoint-6500/special_tokens_map.json b/checkpoint-6500/special_tokens_map.json
new file mode 100644
index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e
--- /dev/null
+++ b/checkpoint-6500/special_tokens_map.json
@@ -0,0 +1,15 @@
+{
+ "bos_token": "",
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "content": "",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "",
+ "sep_token": "",
+ "unk_token": ""
+}
diff --git a/checkpoint-6500/tokenizer.json b/checkpoint-6500/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5
--- /dev/null
+++ b/checkpoint-6500/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0
+size 17082758
diff --git a/checkpoint-6500/tokenizer_config.json b/checkpoint-6500/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f
--- /dev/null
+++ b/checkpoint-6500/tokenizer_config.json
@@ -0,0 +1,19 @@
+{
+ "bos_token": "",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "",
+ "eos_token": "",
+ "mask_token": {
+ "__type": "AddedToken",
+ "content": "",
+ "lstrip": true,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "model_max_length": 512,
+ "pad_token": "",
+ "sep_token": "",
+ "tokenizer_class": "XLMRobertaTokenizer",
+ "unk_token": ""
+}
diff --git a/checkpoint-6500/trainer_state.json b/checkpoint-6500/trainer_state.json
new file mode 100644
index 0000000000000000000000000000000000000000..087ddb0d5ee012b574e91e9492271f92da5da4fc
--- /dev/null
+++ b/checkpoint-6500/trainer_state.json
@@ -0,0 +1,32 @@
+{
+ "best_metric": null,
+ "best_model_checkpoint": null,
+ "epoch": 1.95078031212485,
+ "global_step": 6500,
+ "is_hyper_param_search": false,
+ "is_local_process_zero": true,
+ "is_world_process_zero": true,
+ "log_history": [
+ {
+ "epoch": 1.0,
+ "learning_rate": 1.0015006002400962e-05,
+ "loss": 0.0212,
+ "step": 3331
+ },
+ {
+ "epoch": 1.0,
+ "eval_accuracy": 0.9995778453225261,
+ "eval_f1": 0.9995778832712353,
+ "eval_loss": 0.0017540693515911698,
+ "eval_runtime": 27.5028,
+ "eval_samples_per_second": 861.295,
+ "eval_steps_per_second": 6.763,
+ "step": 3332
+ }
+ ],
+ "max_steps": 6664,
+ "num_train_epochs": 2,
+ "total_flos": 1.480339670491248e+16,
+ "trial_name": null,
+ "trial_params": null
+}
diff --git a/checkpoint-6500/training_args.bin b/checkpoint-6500/training_args.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125
--- /dev/null
+++ b/checkpoint-6500/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d
+size 4024
diff --git a/runs/Nov04_10-20-14_31c5388b0a70/1699093224.5860944/events.out.tfevents.1699093224.31c5388b0a70.434.1 b/runs/Nov04_10-20-14_31c5388b0a70/1699093224.5860944/events.out.tfevents.1699093224.31c5388b0a70.434.1
new file mode 100644
index 0000000000000000000000000000000000000000..27249433dd1905aae984f73117a306939c03d1cd
--- /dev/null
+++ b/runs/Nov04_10-20-14_31c5388b0a70/1699093224.5860944/events.out.tfevents.1699093224.31c5388b0a70.434.1
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cd53b4918d203d7e763e4d2703ae33f3029bb625e6041e8ed0a307a12ebb432a
+size 5883
diff --git a/runs/Nov04_10-20-14_31c5388b0a70/events.out.tfevents.1699093224.31c5388b0a70.434.0 b/runs/Nov04_10-20-14_31c5388b0a70/events.out.tfevents.1699093224.31c5388b0a70.434.0
new file mode 100644
index 0000000000000000000000000000000000000000..af1a8774f398505a7b5e4dc4553f5f7fa0bad024
--- /dev/null
+++ b/runs/Nov04_10-20-14_31c5388b0a70/events.out.tfevents.1699093224.31c5388b0a70.434.0
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e42f5d8713406909ed105eb61109d8ca67fb09d36a1dbe43ad99f509be6b55ac
+size 5673