Training in progress, epoch 1

Files changed (7)

config.json CHANGED Viewed

@@ -1,10 +1,11 @@
 {
-  "_name_or_path": "aubmindlab/bert-base-arabertv2",
   "architectures": [
     "BertForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
   "classifier_dropout": null,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,

 {
+  "_name_or_path": "aubmindlab/bert-base-arabertv02-twitter",
   "architectures": [
     "BertForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
   "classifier_dropout": null,
+  "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d7724ec15db14f3e5d59f208296776c725a937bebb237ccfcf38abf97bf869be
 size 540854065

 version https://git-lfs.github.com/spec/v1
+oid sha256:07569c032c49f99965863f1d430bae602c950b8c76837c5514148e81b2faae20
 size 540854065

runs/Aug13_12-25-41_24ab7b88dc52/events.out.tfevents.1691929711.24ab7b88dc52.184.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0da3c8f8f939d17ad96b154a036b9234d083fcfb72534023f314c01980c4b3aa
+size 4725

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json CHANGED Viewed

@@ -7,36 +7,8 @@
   "max_len": 512,
   "model_max_length": 512,
   "never_split": [
-    "+ك",
-    "+كما",
-    "ك+",
-    "+وا",
-    "+ين",
-    "و+",
-    "+كن",
-    "+ان",
-    "+هم",
-    "+ة",
     "[بريد]",
-    "لل+",
-    "+ي",
-    "+ت",
-    "+ن",
-    "س+",
-    "ل+",
     "[مستخدم]",
-    "+كم",
-    "+ا",
-    "ب+",
-    "ف+",
-    "+نا",
-    "+ها",
-    "+ون",
-    "+هما",
-    "ال+",
-    "+ه",
-    "+هن",
-    "+ات",
     "[رابط]"
   ],
   "pad_token": "[PAD]",
@@ -44,5 +16,6 @@
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
-  "unk_token": "[UNK]"
 }

   "max_len": 512,
   "model_max_length": 512,
   "never_split": [
     "[بريد]",
     "[مستخدم]",
     "[رابط]"
   ],
   "pad_token": "[PAD]",
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]",
+  "use_fast": true
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9fb9ddc31ff614d55c6ef3ed8bef3430118d6c64b3d34663a13168f32def7b09
 size 4027

 version https://git-lfs.github.com/spec/v1
+oid sha256:c4289cd9e78357cd6a1191dd58a278205d9ae77020bc48b204d2ae622e223a0a
 size 4027

vocab.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff