diff --git a/.gitattributes b/.gitattributes index 8aa863d30fd5de8ae287f94c801d09831b42fad8..9ad638b7f0eb54f86a3d3831f846e50144e8beb1 100644 --- a/.gitattributes +++ b/.gitattributes @@ -36,3 +36,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text arabic_corpus.csv filter=lfs diff=lfs merge=lfs -text hindi_corpus.csv filter=lfs diff=lfs merge=lfs -text russian_corpus.csv filter=lfs diff=lfs merge=lfs -text +checkpoint-1000/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-1500/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-2000/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-2500/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-3000/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-3500/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-4000/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-4500/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-5000/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-5500/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-6000/tokenizer.json filter=lfs diff=lfs merge=lfs -text +checkpoint-6500/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/checkpoint-1000/config.json b/checkpoint-1000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-1000/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-1000/optimizer.pt b/checkpoint-1000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6297b26b12de8d33ce73fb2094ab7e9664ed4aef --- /dev/null +++ b/checkpoint-1000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:035111fdb4d604ca283c9b9144812f36070c5ffaed16acb0c6b9f06e9885d8ef +size 2224498234 diff --git a/checkpoint-1000/pytorch_model.bin b/checkpoint-1000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..48a6ef154958f7fd992f7ae9bb5fd69f061844e2 --- /dev/null +++ b/checkpoint-1000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e543d77fd926d39ab1d2f039fc0d394395d4ce30ff5d798aabd4d7839fb648e +size 1112263858 diff --git a/checkpoint-1000/rng_state.pth b/checkpoint-1000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..ca0f50de1a5b705770b30d6f2516dd13abf74e3d --- /dev/null +++ b/checkpoint-1000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beb31bbdf7d9c5b7925e77559815c830119baa2fca30f37fb6aaab50bb6d991e +size 14244 diff --git a/checkpoint-1000/scaler.pt b/checkpoint-1000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d94c5393f9a0ea261b878365d01e00ce7e9a48f5 --- /dev/null +++ b/checkpoint-1000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c5bcf736f1b79303746fdacc768ece77446afaa1877de8dda3da8348fbcc7d5 +size 988 diff --git a/checkpoint-1000/scheduler.pt b/checkpoint-1000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..b827acba45350261c0d00d6f6dc874e6719a18ae --- /dev/null +++ b/checkpoint-1000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9878794dee7a9fc2f1e2977e16568f0d445f879bd810524aafb5aa9662642230 +size 1064 diff --git a/checkpoint-1000/sentencepiece.bpe.model b/checkpoint-1000/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-1000/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-1000/special_tokens_map.json b/checkpoint-1000/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-1000/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-1000/tokenizer.json b/checkpoint-1000/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-1000/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-1000/tokenizer_config.json b/checkpoint-1000/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-1000/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-1000/trainer_state.json b/checkpoint-1000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..583a2065823e4dd5b7eda0f61671e73056aae577 --- /dev/null +++ b/checkpoint-1000/trainer_state.json @@ -0,0 +1,15 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.30012004801920766, + "global_step": 1000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 2289752745025152.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-1000/training_args.bin b/checkpoint-1000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-1000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-1500/config.json b/checkpoint-1500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-1500/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-1500/optimizer.pt b/checkpoint-1500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2d01d7b29144b0c990228f4a676a189c9a06e06 --- /dev/null +++ b/checkpoint-1500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8939341b8e960508664efe97d5c04b21d50d002d6e34a5255ccd9be656fa4583 +size 2224498234 diff --git a/checkpoint-1500/pytorch_model.bin b/checkpoint-1500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..3139d533845ac4e82c6082cc96e4cfb4d2f05c01 --- /dev/null +++ b/checkpoint-1500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e3bea9b0c14ea4d6002d6b6b3fe155ebdf941aae1b2032500030036c92aa6f9 +size 1112263858 diff --git a/checkpoint-1500/rng_state.pth b/checkpoint-1500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..44b87b5928f34680ca95cba2120b3185adf2d84f --- /dev/null +++ b/checkpoint-1500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e2e9972f20a1c6a3e1f3d986d339d5b18060252505bf307e90192b5ff67bee9 +size 14244 diff --git a/checkpoint-1500/scaler.pt b/checkpoint-1500/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee46283434e08199c2a86c70151e1c4e2fb928d0 --- /dev/null +++ b/checkpoint-1500/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0617efbfbb7fc93b69f89ca8af67f24948e1b623a640583096a01c1e14d1a779 +size 988 diff --git a/checkpoint-1500/scheduler.pt b/checkpoint-1500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f0fdb951bd1ecac6bdc19bc08fe7002549fd3be --- /dev/null +++ b/checkpoint-1500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:947bcff8be39e16d93459c65045979b4f4e7391de422d205370ed75adf2cf818 +size 1064 diff --git a/checkpoint-1500/sentencepiece.bpe.model b/checkpoint-1500/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-1500/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-1500/special_tokens_map.json b/checkpoint-1500/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-1500/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-1500/tokenizer.json b/checkpoint-1500/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-1500/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-1500/tokenizer_config.json b/checkpoint-1500/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-1500/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-1500/trainer_state.json b/checkpoint-1500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d6db5d0cd099ca0cc48c46b6916254d8432131b9 --- /dev/null +++ b/checkpoint-1500/trainer_state.json @@ -0,0 +1,15 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.45018007202881155, + "global_step": 1500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 3427344033968256.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-1500/training_args.bin b/checkpoint-1500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-1500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-2000/config.json b/checkpoint-2000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-2000/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-2000/optimizer.pt b/checkpoint-2000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..3aa7e74e789efe29445b985def6e34d4bfeab939 --- /dev/null +++ b/checkpoint-2000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5c9506e4f39cdbc3af672d4d67543ed0aac71410a09676e08b4dd242997ec24 +size 2224498234 diff --git a/checkpoint-2000/pytorch_model.bin b/checkpoint-2000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..f776e5087d2c0cd18eb5122f21178c795d210e99 --- /dev/null +++ b/checkpoint-2000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9411f3ca927abef81eea2d70d8c9924b86ba017963d0dc3120a597df8b1d7523 +size 1112263858 diff --git a/checkpoint-2000/rng_state.pth b/checkpoint-2000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..a1410bfc428b484074cff2189a5249635c4e58fb --- /dev/null +++ b/checkpoint-2000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e66fbaebc79bf7c3a7d803385b9042c1ee2e1282975ecb6e28bdddf202c62b45 +size 14244 diff --git a/checkpoint-2000/scaler.pt b/checkpoint-2000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea3614f9d51f0c0f07ac70cec8983eb426058f4f --- /dev/null +++ b/checkpoint-2000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c494b3df6951b3dfb8d6d667cd822246eceb1361f5933fe08326cb830fde1b2c +size 988 diff --git a/checkpoint-2000/scheduler.pt b/checkpoint-2000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..375bf05f7258086d5b4bee24f2758c7f9aa74440 --- /dev/null +++ b/checkpoint-2000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dcecb64fbe503a9351db23cde6507c02a6349d16bd78d72f1f281cb8a2eb4d6 +size 1064 diff --git a/checkpoint-2000/sentencepiece.bpe.model b/checkpoint-2000/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-2000/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-2000/special_tokens_map.json b/checkpoint-2000/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-2000/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-2000/tokenizer.json b/checkpoint-2000/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-2000/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-2000/tokenizer_config.json b/checkpoint-2000/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-2000/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-2000/trainer_state.json b/checkpoint-2000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..441c14871e4be7e9792d8e2c633143dd25f4cb8c --- /dev/null +++ b/checkpoint-2000/trainer_state.json @@ -0,0 +1,15 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.6002400960384153, + "global_step": 2000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 4569868788082560.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-2000/training_args.bin b/checkpoint-2000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-2000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-2500/config.json b/checkpoint-2500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-2500/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-2500/optimizer.pt b/checkpoint-2500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2a1a46a5df264a3c2c7a5e84482cb37dcaae0a5 --- /dev/null +++ b/checkpoint-2500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2f34072663e7d19b085d14a6f6f603f3593a02c04e5a7cf45021c74be20df72 +size 2224498234 diff --git a/checkpoint-2500/pytorch_model.bin b/checkpoint-2500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab2960e383f9aaec912e18139027eac87e2e1569 --- /dev/null +++ b/checkpoint-2500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f737b6e4f38cf9d48930ebd4c3aa7355c176d29ad78fc2b97870d070d9a8f15a +size 1112263858 diff --git a/checkpoint-2500/rng_state.pth b/checkpoint-2500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..aea92f92ba3895e0a8ad2f8c618d7dd22ad29525 --- /dev/null +++ b/checkpoint-2500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaca9360678d07ba300097459dfbc25ecbad4780b3d504bd52723840f51b3895 +size 14244 diff --git a/checkpoint-2500/scaler.pt b/checkpoint-2500/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..155c6588094fa0e3c56029dea7908beef7aac6e3 --- /dev/null +++ b/checkpoint-2500/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e327e2fc109e7cb11a5de71c5b47a658cf81d9ad28f6990f404bf0161361e673 +size 988 diff --git a/checkpoint-2500/scheduler.pt b/checkpoint-2500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1937d1b0fb572f4789ab461a060adefe425ef73 --- /dev/null +++ b/checkpoint-2500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de0a9d338f40108c37209c103e3542be6a7bb598a8dc5b0c8ee11bc6e244c010 +size 1064 diff --git a/checkpoint-2500/sentencepiece.bpe.model b/checkpoint-2500/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-2500/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-2500/special_tokens_map.json b/checkpoint-2500/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-2500/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-2500/tokenizer.json b/checkpoint-2500/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-2500/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-2500/tokenizer_config.json b/checkpoint-2500/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-2500/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-2500/trainer_state.json b/checkpoint-2500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..6a144d377f5a294dbd8e3463b157fe71397a6a2a --- /dev/null +++ b/checkpoint-2500/trainer_state.json @@ -0,0 +1,15 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.7503001200480192, + "global_step": 2500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 5704763116065408.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-2500/training_args.bin b/checkpoint-2500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-2500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-3000/config.json b/checkpoint-3000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-3000/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-3000/optimizer.pt b/checkpoint-3000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e52ad11da68886e23f08e728dc376de5e213f4e --- /dev/null +++ b/checkpoint-3000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c343bbaa8ddbc24f6aa61b62b15d8f75feba7afb23c5b62149faf4a10dd9b8b +size 2224498234 diff --git a/checkpoint-3000/pytorch_model.bin b/checkpoint-3000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..52cb7730b9255bb9e06723b9b37e72f538eaecb1 --- /dev/null +++ b/checkpoint-3000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e46dffa55535486a8acab06cc84a1d925a48e4e491a28e806238c72f1809030c +size 1112263858 diff --git a/checkpoint-3000/rng_state.pth b/checkpoint-3000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..0944744b96abe8cf399ebdaa9cff47bdf6aaebe3 --- /dev/null +++ b/checkpoint-3000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce3c9c7c1836a8854e95828187436ca984ce5618080c1de46f7781ae68338f56 +size 14244 diff --git a/checkpoint-3000/scaler.pt b/checkpoint-3000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..64d3ff09bb87e9994d8e76e600ae76ac103bb3d8 --- /dev/null +++ b/checkpoint-3000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ab76333d06d884d5e443a2ad621fc4a5a7d6a50f51ad1cce2e0e2d30b5327b +size 988 diff --git a/checkpoint-3000/scheduler.pt b/checkpoint-3000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..32456e12dcf3b1de9989d94317382ad2bd52fc0b --- /dev/null +++ b/checkpoint-3000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:300c998e2cc30e9e152e3c87f68429a387b1581d00cf57926b84ae58e39a0d51 +size 1064 diff --git a/checkpoint-3000/sentencepiece.bpe.model b/checkpoint-3000/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-3000/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-3000/special_tokens_map.json b/checkpoint-3000/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-3000/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-3000/tokenizer.json b/checkpoint-3000/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-3000/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-3000/tokenizer_config.json b/checkpoint-3000/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-3000/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-3000/trainer_state.json b/checkpoint-3000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..aed8ed3da6e25f3c57ba2cf940c8b15717fda2c4 --- /dev/null +++ b/checkpoint-3000/trainer_state.json @@ -0,0 +1,15 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.9003601440576231, + "global_step": 3000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 6835875120750336.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-3000/training_args.bin b/checkpoint-3000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-3000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-3500/config.json b/checkpoint-3500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-3500/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-3500/optimizer.pt b/checkpoint-3500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..4139cbc642e689d46a53d93c5cd1ee0ed93e5257 --- /dev/null +++ b/checkpoint-3500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaddc3a4d410ef152641700ca133c318da086d88e624e9cf0c85dbb44a0e9033 +size 2224498234 diff --git a/checkpoint-3500/pytorch_model.bin b/checkpoint-3500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b1bcc4a10b0df71301e5ccd92756585ae75266c --- /dev/null +++ b/checkpoint-3500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59dd34f7a1b24f22539b3e150c1e29296165b4065d293999123f2b1d4993c304 +size 1112263858 diff --git a/checkpoint-3500/rng_state.pth b/checkpoint-3500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..27b2a526993c0971e4b4b99c06151694e584a18f --- /dev/null +++ b/checkpoint-3500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57cda6f0fd2c17c84bfc2dae3e2afd1f3fd1f81677f65b29ce2cdc3f5b45ac4 +size 14244 diff --git a/checkpoint-3500/scaler.pt b/checkpoint-3500/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6321d7c7270b6bfa83421d487dec4378c1bf64b5 --- /dev/null +++ b/checkpoint-3500/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbdb7492a0661aca7d7ba8026bad4935918d9a2cd6ddeb5e7d11db4707b6d6a7 +size 988 diff --git a/checkpoint-3500/scheduler.pt b/checkpoint-3500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..290a5f6699a2876382b897f36c6bf21677a82c02 --- /dev/null +++ b/checkpoint-3500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e84bf4be2ade1c3d9ef167425dd3c6629ae186978d3326ae10c5b3388e07800 +size 1064 diff --git a/checkpoint-3500/sentencepiece.bpe.model b/checkpoint-3500/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-3500/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-3500/special_tokens_map.json b/checkpoint-3500/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-3500/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-3500/tokenizer.json b/checkpoint-3500/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-3500/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-3500/tokenizer_config.json b/checkpoint-3500/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-3500/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-3500/trainer_state.json b/checkpoint-3500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..50bf4495523955e48063ca503f51a1471741209f --- /dev/null +++ b/checkpoint-3500/trainer_state.json @@ -0,0 +1,32 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.050420168067227, + "global_step": 3500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 1.0, + "learning_rate": 1.0015006002400962e-05, + "loss": 0.0212, + "step": 3331 + }, + { + "epoch": 1.0, + "eval_accuracy": 0.9995778453225261, + "eval_f1": 0.9995778832712353, + "eval_loss": 0.0017540693515911698, + "eval_runtime": 27.5028, + "eval_samples_per_second": 861.295, + "eval_steps_per_second": 6.763, + "step": 3332 + } + ], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 7964693064130656.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-3500/training_args.bin b/checkpoint-3500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-3500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-4000/config.json b/checkpoint-4000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-4000/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-4000/optimizer.pt b/checkpoint-4000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..07a6a27a7a1c9f88d3aed0e993cb880f62eb3b80 --- /dev/null +++ b/checkpoint-4000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfdb07d6b317742b52ef24e922d654dba7c39b19728e54f3e8a001460cbbcc10 +size 2224498234 diff --git a/checkpoint-4000/pytorch_model.bin b/checkpoint-4000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..95772af40855102a2291d7476fbb808622bd5fe6 --- /dev/null +++ b/checkpoint-4000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce808fff64259caedfc00d1a13dd0c0b5ba1e82a5f8f7b5fcd73a8a8d903407 +size 1112263858 diff --git a/checkpoint-4000/rng_state.pth b/checkpoint-4000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..f179dd1cd4d8c3ef79746d6f408289ada681f171 --- /dev/null +++ b/checkpoint-4000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f41338c7f8329e9652749236c1c77dd0268a24048905062b119e1f17578893a8 +size 14244 diff --git a/checkpoint-4000/scaler.pt b/checkpoint-4000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..87cb1bd0266bfc950996dd18a13ca44c002b2ef4 --- /dev/null +++ b/checkpoint-4000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f78956da0255b4f3c7028d2db42721c8359c50d974c8de242310c44135fd3fb3 +size 988 diff --git a/checkpoint-4000/scheduler.pt b/checkpoint-4000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e68edd84314eb0cd9483a825ec4f48444dca65 --- /dev/null +++ b/checkpoint-4000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad38463a9ae2261fb2700c27dddf0424bba42530c078813c5cb52c3e890dead0 +size 1064 diff --git a/checkpoint-4000/sentencepiece.bpe.model b/checkpoint-4000/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-4000/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-4000/special_tokens_map.json b/checkpoint-4000/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-4000/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-4000/tokenizer.json b/checkpoint-4000/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-4000/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-4000/tokenizer_config.json b/checkpoint-4000/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-4000/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-4000/trainer_state.json b/checkpoint-4000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..aed8f5a517c6b22e5ec1d284fb0ccda78d2a12f0 --- /dev/null +++ b/checkpoint-4000/trainer_state.json @@ -0,0 +1,32 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.2004801920768307, + "global_step": 4000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 1.0, + "learning_rate": 1.0015006002400962e-05, + "loss": 0.0212, + "step": 3331 + }, + { + "epoch": 1.0, + "eval_accuracy": 0.9995778453225261, + "eval_f1": 0.9995778832712353, + "eval_loss": 0.0017540693515911698, + "eval_runtime": 27.5028, + "eval_samples_per_second": 861.295, + "eval_steps_per_second": 6.763, + "step": 3332 + } + ], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 9105836447997024.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-4000/training_args.bin b/checkpoint-4000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-4000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-4500/config.json b/checkpoint-4500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-4500/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-4500/optimizer.pt b/checkpoint-4500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..df625c0bce3ce132eaf408a2778e25e2c5c241c4 --- /dev/null +++ b/checkpoint-4500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ede5a968107e376f623e9e723a94c58e73cc60e513a70a9a8263d8b1d362f43 +size 2224498234 diff --git a/checkpoint-4500/pytorch_model.bin b/checkpoint-4500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..632127a510876a379d59d99a38c7e46f14fe8692 --- /dev/null +++ b/checkpoint-4500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af6ed4d8f40fe590b8543c1fb8189c3f2682ad3d78beddf10fc314e7639f6be2 +size 1112263858 diff --git a/checkpoint-4500/rng_state.pth b/checkpoint-4500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..5e56df358ac5a6cee846d2b86130ccd2bd340af5 --- /dev/null +++ b/checkpoint-4500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37813bafa05604126a78a60288a15bbd5cce316c658d44673ce0b26eaf8cd220 +size 14244 diff --git a/checkpoint-4500/scaler.pt b/checkpoint-4500/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c6bb1073dec0b26a3ac7ccb3ed25fc82e392454 --- /dev/null +++ b/checkpoint-4500/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c80c64ef7099feee387f2e29d9a055fad893d0c2cfee38dc1c50180d92ac3b4a +size 988 diff --git a/checkpoint-4500/scheduler.pt b/checkpoint-4500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d15dfaa718146d2f0d10824df0a47e40a4454f40 --- /dev/null +++ b/checkpoint-4500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e265c3e508d7623e1cb2276b267462b4f28022f353f7d5793df0b166fbb48f +size 1064 diff --git a/checkpoint-4500/sentencepiece.bpe.model b/checkpoint-4500/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-4500/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-4500/special_tokens_map.json b/checkpoint-4500/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-4500/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-4500/tokenizer.json b/checkpoint-4500/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-4500/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-4500/tokenizer_config.json b/checkpoint-4500/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-4500/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-4500/trainer_state.json b/checkpoint-4500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..dc9f24579eb774000788ab5779abf6b6a90ff7e4 --- /dev/null +++ b/checkpoint-4500/trainer_state.json @@ -0,0 +1,32 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.3505402160864346, + "global_step": 4500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 1.0, + "learning_rate": 1.0015006002400962e-05, + "loss": 0.0212, + "step": 3331 + }, + { + "epoch": 1.0, + "eval_accuracy": 0.9995778453225261, + "eval_f1": 0.9995778832712353, + "eval_loss": 0.0017540693515911698, + "eval_runtime": 27.5028, + "eval_samples_per_second": 861.295, + "eval_steps_per_second": 6.763, + "step": 3332 + } + ], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 1.02494794542168e+16, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-4500/training_args.bin b/checkpoint-4500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-4500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-500/config.json b/checkpoint-500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-500/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-500/optimizer.pt b/checkpoint-500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..08f652119c121517ece42c771d3353f287d598e0 --- /dev/null +++ b/checkpoint-500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08f0055cc0b2063c50a944fd65da8d5cd7d29d2276653def7d94bbef0620aa7 +size 2224498234 diff --git a/checkpoint-500/pytorch_model.bin b/checkpoint-500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..86d0ddcd0d7c0977c5efcf3ce89bc33196836668 --- /dev/null +++ b/checkpoint-500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb25cbc7a4f8b46ad4397c396b128bc344cfbc8f2ce825bb7abea261f7944e1 +size 1112263858 diff --git a/checkpoint-500/rng_state.pth b/checkpoint-500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..e70115011f9f37b19369b0324e6795904371e48e --- /dev/null +++ b/checkpoint-500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb4e37d624ed2885a6f31e04584af4b86b3fb8a74a12c56443a363c9a9f544d +size 14244 diff --git a/checkpoint-500/scaler.pt b/checkpoint-500/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ad8cffce393d48d2f085bee3a95ae48a091b2d6 --- /dev/null +++ b/checkpoint-500/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0d8adddd1388932d2ed9b90b5c277a7847c95951a525f62dc60f3bd12186b70 +size 988 diff --git a/checkpoint-500/scheduler.pt b/checkpoint-500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc09397bd58a53e3114fd92ffa59b3de16112a21 --- /dev/null +++ b/checkpoint-500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21dbdba64bd4741def0eef0be431357dfbc15db76e27b6425669ff9cf8e73c1f +size 1064 diff --git a/checkpoint-500/sentencepiece.bpe.model b/checkpoint-500/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-500/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-500/special_tokens_map.json b/checkpoint-500/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-500/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-500/tokenizer.json b/checkpoint-500/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-500/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-500/tokenizer_config.json b/checkpoint-500/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-500/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-500/trainer_state.json b/checkpoint-500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..c48ec11caea8c067f8a87e16aef3de2ac5ddb5d1 --- /dev/null +++ b/checkpoint-500/trainer_state.json @@ -0,0 +1,15 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.15006002400960383, + "global_step": 500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 1135453454035584.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-500/training_args.bin b/checkpoint-500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-5000/config.json b/checkpoint-5000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-5000/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-5000/optimizer.pt b/checkpoint-5000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..2202ff48a17ede16f42eb38c8b92b7e62e501177 --- /dev/null +++ b/checkpoint-5000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4178238e255eab6b08d139885ddf7e272c02062e8efb84fbdcaae347b85e6e3 +size 2224498234 diff --git a/checkpoint-5000/pytorch_model.bin b/checkpoint-5000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..563b64b15c85dc7604923bf6e4e0abeb064193ba --- /dev/null +++ b/checkpoint-5000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f79c3e447a394201bb56e5fa3520412996e5c43b78d7a1f685ac8c615bfb1c2 +size 1112263858 diff --git a/checkpoint-5000/rng_state.pth b/checkpoint-5000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..9c80cfc17a599048089da3b5da1d96fbd2094540 --- /dev/null +++ b/checkpoint-5000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e40bdff45954b2de186da9b7a8828193f488320b7e637d6c1011128ea88d7f5 +size 14244 diff --git a/checkpoint-5000/scaler.pt b/checkpoint-5000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..91677e0386653af46263f12bc74bf93bcd324b77 --- /dev/null +++ b/checkpoint-5000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b9dc27fbd1463c1c244b47b0f00093a364926c54babc4c59f05d717764f712e +size 988 diff --git a/checkpoint-5000/scheduler.pt b/checkpoint-5000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dfd1b59f956d27da77717af56e39182a25eed6e --- /dev/null +++ b/checkpoint-5000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebf6b2ee598f0ac4335df31d040667462dd02e3d1eac62858ee5b8679cfc7d7e +size 1064 diff --git a/checkpoint-5000/sentencepiece.bpe.model b/checkpoint-5000/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-5000/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-5000/special_tokens_map.json b/checkpoint-5000/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-5000/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-5000/tokenizer.json b/checkpoint-5000/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-5000/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-5000/tokenizer_config.json b/checkpoint-5000/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-5000/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-5000/trainer_state.json b/checkpoint-5000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..4f8a18d4ffdc2e01f9509bb0dd4159f8853ceab5 --- /dev/null +++ b/checkpoint-5000/trainer_state.json @@ -0,0 +1,32 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.5006002400960385, + "global_step": 5000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 1.0, + "learning_rate": 1.0015006002400962e-05, + "loss": 0.0212, + "step": 3331 + }, + { + "epoch": 1.0, + "eval_accuracy": 0.9995778453225261, + "eval_f1": 0.9995778832712353, + "eval_loss": 0.0017540693515911698, + "eval_runtime": 27.5028, + "eval_samples_per_second": 861.295, + "eval_steps_per_second": 6.763, + "step": 3332 + } + ], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 1.1390524168779744e+16, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-5000/training_args.bin b/checkpoint-5000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-5000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-5500/config.json b/checkpoint-5500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-5500/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-5500/optimizer.pt b/checkpoint-5500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..60a10712b05d593feae831ab70e3f3103aa53e02 --- /dev/null +++ b/checkpoint-5500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dfc1cd3e1438a9b967ab46ab6700369f95fe6b8d0e0ca651fde85b3f4b19a9b +size 2224498234 diff --git a/checkpoint-5500/pytorch_model.bin b/checkpoint-5500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..76a5f23fe31befdd0ba4f04eddfe090b80beb0b6 --- /dev/null +++ b/checkpoint-5500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ab602fbbd80d582a8319cad6f85b8f3ec956b70ab486d71c941fbce80f84492 +size 1112263858 diff --git a/checkpoint-5500/rng_state.pth b/checkpoint-5500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..5cd3bb473d5b1e86b49a9084a0ffea1ce5ebf17e --- /dev/null +++ b/checkpoint-5500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76aa3360d7d58394dde61580a71ef09a36386de9bc069b58648a4b7eb7956764 +size 14244 diff --git a/checkpoint-5500/scaler.pt b/checkpoint-5500/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..04352e611065685e4a7e376ea393b1139861ae56 --- /dev/null +++ b/checkpoint-5500/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c5f5318dbfd4ec3e3f1b738f1106bdfe27e69649a8191846c8955cd547df61 +size 988 diff --git a/checkpoint-5500/scheduler.pt b/checkpoint-5500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1549c7486ec2af46bf68bd19d965d792a243cb2 --- /dev/null +++ b/checkpoint-5500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:172090f82e3fcbc5b15497fa960d62e6c96e5417c8582bd8c3a152c42f43a439 +size 1064 diff --git a/checkpoint-5500/sentencepiece.bpe.model b/checkpoint-5500/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-5500/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-5500/special_tokens_map.json b/checkpoint-5500/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-5500/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-5500/tokenizer.json b/checkpoint-5500/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-5500/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-5500/tokenizer_config.json b/checkpoint-5500/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-5500/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-5500/trainer_state.json b/checkpoint-5500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..f696ddcc5ef2f9062597fa8b95922163ccde8022 --- /dev/null +++ b/checkpoint-5500/trainer_state.json @@ -0,0 +1,32 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.6506602641056423, + "global_step": 5500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 1.0, + "learning_rate": 1.0015006002400962e-05, + "loss": 0.0212, + "step": 3331 + }, + { + "epoch": 1.0, + "eval_accuracy": 0.9995778453225261, + "eval_f1": 0.9995778832712353, + "eval_loss": 0.0017540693515911698, + "eval_runtime": 27.5028, + "eval_samples_per_second": 861.295, + "eval_steps_per_second": 6.763, + "step": 3332 + } + ], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 1.2531404434503648e+16, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-5500/training_args.bin b/checkpoint-5500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-5500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-6000/config.json b/checkpoint-6000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-6000/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-6000/optimizer.pt b/checkpoint-6000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..22dc4f17be5de49fd994c2a713f8dd97f63c23d4 --- /dev/null +++ b/checkpoint-6000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ed485bf2f5e145ecd29e12ec22b056a95dd18b55c2f3f80fcd2cb0e7e44ea56 +size 2224498234 diff --git a/checkpoint-6000/pytorch_model.bin b/checkpoint-6000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..0166dd7746fc56fb7c5d814de77ae30211d73602 --- /dev/null +++ b/checkpoint-6000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c2001ea07d6e0b3806c5920b574eb2727fe105a8d3e3ad5baa7f55da8d29a8 +size 1112263858 diff --git a/checkpoint-6000/rng_state.pth b/checkpoint-6000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..493f0974417e26103b8008fb31a76f777143f3aa --- /dev/null +++ b/checkpoint-6000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3613a86fedc1c5ca98b5397a6b85ac0af7166ac0cfa7db2884a422a6ad6d9e4 +size 14244 diff --git a/checkpoint-6000/scaler.pt b/checkpoint-6000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a60b866a2bae2570772d5dd4bdbaa3c5d4ae7007 --- /dev/null +++ b/checkpoint-6000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dce5f63b5dd43a0656a34bc3613915acebc1141d3be72ea7bb2c6992bbeae0a +size 988 diff --git a/checkpoint-6000/scheduler.pt b/checkpoint-6000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca0b7f67abab5968b9a53888b22ebb4e09a87e83 --- /dev/null +++ b/checkpoint-6000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:839295a4446eff234c3d35d9f2f87aae80ea3cce7c4ed455babe53a7ad6c6897 +size 1064 diff --git a/checkpoint-6000/sentencepiece.bpe.model b/checkpoint-6000/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-6000/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-6000/special_tokens_map.json b/checkpoint-6000/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-6000/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-6000/tokenizer.json b/checkpoint-6000/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-6000/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-6000/tokenizer_config.json b/checkpoint-6000/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-6000/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-6000/trainer_state.json b/checkpoint-6000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..05318f9b379ce8b99d7c3bc1e85954ae8f4bceb8 --- /dev/null +++ b/checkpoint-6000/trainer_state.json @@ -0,0 +1,32 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.800720288115246, + "global_step": 6000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 1.0, + "learning_rate": 1.0015006002400962e-05, + "loss": 0.0212, + "step": 3331 + }, + { + "epoch": 1.0, + "eval_accuracy": 0.9995778453225261, + "eval_f1": 0.9995778832712353, + "eval_loss": 0.0017540693515911698, + "eval_runtime": 27.5028, + "eval_samples_per_second": 861.295, + "eval_steps_per_second": 6.763, + "step": 3332 + } + ], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 1.3667449904359776e+16, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-6000/training_args.bin b/checkpoint-6000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-6000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/checkpoint-6500/config.json b/checkpoint-6500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52ee2690bb08beb1bf56d29f5587d2d4f3491252 --- /dev/null +++ b/checkpoint-6500/config.json @@ -0,0 +1,43 @@ +{ + "_name_or_path": "xlm-roberta-base", + "architectures": [ + "XLMRobertaForSequenceClassification" + ], + "attention_probs_dropout_prob": 0.1, + "bos_token_id": 0, + "classifier_dropout": null, + "eos_token_id": 2, + "hidden_act": "gelu", + "hidden_dropout_prob": 0.1, + "hidden_size": 768, + "id2label": { + "0": "arabic", + "1": "english", + "2": "french", + "3": "german", + "4": "russian" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "label2id": { + "arabic": 0, + "english": 1, + "french": 2, + "german": 3, + "russian": 4 + }, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 514, + "model_type": "xlm-roberta", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "output_past": true, + "pad_token_id": 1, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.28.0", + "type_vocab_size": 1, + "use_cache": true, + "vocab_size": 250002 +} diff --git a/checkpoint-6500/optimizer.pt b/checkpoint-6500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..bee317cda419af90fde0adc2a83305abfdccdcbe --- /dev/null +++ b/checkpoint-6500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2cfad20cffe487f12be9be3ff681919ced6737908b77141e20e70034f3d413c +size 2224498234 diff --git a/checkpoint-6500/pytorch_model.bin b/checkpoint-6500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..23aaaac74b7ae0a01869715f2ae5bbc21fd4e9a1 --- /dev/null +++ b/checkpoint-6500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0dad78c51d82d6311378bc2b3f90957a56d82d5e95e7ee81b6ffdf2d901db91 +size 1112263858 diff --git a/checkpoint-6500/rng_state.pth b/checkpoint-6500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..c4c701e704bd111229d851afdea7cbbb2a4a7ffe --- /dev/null +++ b/checkpoint-6500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66b6ca701ad91ec0d02c670628f7f41a47ddf196f3b3bf2c9636895be039ef9b +size 14244 diff --git a/checkpoint-6500/scaler.pt b/checkpoint-6500/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae3cfb18b44e35d96129db1122ff7c0101d7ece8 --- /dev/null +++ b/checkpoint-6500/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6d128ac992361b84f58da2d39bcc05cf0200f1c98c9a834dfd72247aecce8cd +size 988 diff --git a/checkpoint-6500/scheduler.pt b/checkpoint-6500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a02d47686cb912db604765cd6e4e8a977ae8a5ab --- /dev/null +++ b/checkpoint-6500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9f5d32cd992b7f052e1858a521ac70520a4b9ffa161d4dcb4c241caa4753167 +size 1064 diff --git a/checkpoint-6500/sentencepiece.bpe.model b/checkpoint-6500/sentencepiece.bpe.model new file mode 100644 index 0000000000000000000000000000000000000000..7a3f40a75f870bc1f21700cd414dc2acc431583c --- /dev/null +++ b/checkpoint-6500/sentencepiece.bpe.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865 +size 5069051 diff --git a/checkpoint-6500/special_tokens_map.json b/checkpoint-6500/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..d5698132694f4f1bcff08fa7d937b1701812598e --- /dev/null +++ b/checkpoint-6500/special_tokens_map.json @@ -0,0 +1,15 @@ +{ + "bos_token": "", + "cls_token": "", + "eos_token": "", + "mask_token": { + "content": "", + "lstrip": true, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "", + "sep_token": "", + "unk_token": "" +} diff --git a/checkpoint-6500/tokenizer.json b/checkpoint-6500/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..616a6db99f606f2d0a7acfe11a015f80e68aecf5 --- /dev/null +++ b/checkpoint-6500/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1edb0658cb47689db5cf78194ebe041bba3b6b775d1f1069fc9501b372d4acb0 +size 17082758 diff --git a/checkpoint-6500/tokenizer_config.json b/checkpoint-6500/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de1940d16d38be9877bf7cc228c9377841b311f --- /dev/null +++ b/checkpoint-6500/tokenizer_config.json @@ -0,0 +1,19 @@ +{ + "bos_token": "", + "clean_up_tokenization_spaces": true, + "cls_token": "", + "eos_token": "", + "mask_token": { + "__type": "AddedToken", + "content": "", + "lstrip": true, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": "", + "sep_token": "", + "tokenizer_class": "XLMRobertaTokenizer", + "unk_token": "" +} diff --git a/checkpoint-6500/trainer_state.json b/checkpoint-6500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..087ddb0d5ee012b574e91e9492271f92da5da4fc --- /dev/null +++ b/checkpoint-6500/trainer_state.json @@ -0,0 +1,32 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.95078031212485, + "global_step": 6500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 1.0, + "learning_rate": 1.0015006002400962e-05, + "loss": 0.0212, + "step": 3331 + }, + { + "epoch": 1.0, + "eval_accuracy": 0.9995778453225261, + "eval_f1": 0.9995778832712353, + "eval_loss": 0.0017540693515911698, + "eval_runtime": 27.5028, + "eval_samples_per_second": 861.295, + "eval_steps_per_second": 6.763, + "step": 3332 + } + ], + "max_steps": 6664, + "num_train_epochs": 2, + "total_flos": 1.480339670491248e+16, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-6500/training_args.bin b/checkpoint-6500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5009d155ab2aba35c384f47c39fc786931b19125 --- /dev/null +++ b/checkpoint-6500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfc6d5b87db9956e13fcac9bb19bcdb3ef9699bb6d06c99bc4cd34f72403b5d +size 4024 diff --git a/runs/Nov04_10-20-14_31c5388b0a70/1699093224.5860944/events.out.tfevents.1699093224.31c5388b0a70.434.1 b/runs/Nov04_10-20-14_31c5388b0a70/1699093224.5860944/events.out.tfevents.1699093224.31c5388b0a70.434.1 new file mode 100644 index 0000000000000000000000000000000000000000..27249433dd1905aae984f73117a306939c03d1cd --- /dev/null +++ b/runs/Nov04_10-20-14_31c5388b0a70/1699093224.5860944/events.out.tfevents.1699093224.31c5388b0a70.434.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd53b4918d203d7e763e4d2703ae33f3029bb625e6041e8ed0a307a12ebb432a +size 5883 diff --git a/runs/Nov04_10-20-14_31c5388b0a70/events.out.tfevents.1699093224.31c5388b0a70.434.0 b/runs/Nov04_10-20-14_31c5388b0a70/events.out.tfevents.1699093224.31c5388b0a70.434.0 new file mode 100644 index 0000000000000000000000000000000000000000..af1a8774f398505a7b5e4dc4553f5f7fa0bad024 --- /dev/null +++ b/runs/Nov04_10-20-14_31c5388b0a70/events.out.tfevents.1699093224.31c5388b0a70.434.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e42f5d8713406909ed105eb61109d8ca67fb09d36a1dbe43ad99f509be6b55ac +size 5673