Upload folder using huggingface_hub

Browse files

Files changed (6) hide show

Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/all_results.json +8 -0
Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/config.json +187 -0
Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/model.safetensors +3 -0
Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/train_results.json +8 -0
Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/trainer_state.json +231 -0
Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/training_args.bin +3 -0

Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/all_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 20.0,
+    "total_flos": 4.185802010861568e+16,
+    "train_loss": 267.56802662037035,
+    "train_runtime": 4171.6448,
+    "train_samples_per_second": 57.876,
+    "train_steps_per_second": 0.906
+}

Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/config.json ADDED Viewed

	@@ -0,0 +1,187 @@

+{
+  "_name_or_path": "bert-base-multilingual-cased",
+  "adapters": {
+    "adapters": {},
+    "config_map": {},
+    "fusion_config_map": {},
+    "fusion_name_map": {},
+    "fusions": {}
+  },
+  "architectures": [
+    "BertAdapterGeneralizeModel"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "_",
+    "1": "acl",
+    "2": "advcl",
+    "3": "advmod",
+    "4": "amod",
+    "5": "appos",
+    "6": "aux",
+    "7": "case",
+    "8": "cc",
+    "9": "ccomp",
+    "10": "clf",
+    "11": "compound",
+    "12": "conj",
+    "13": "cop",
+    "14": "csubj",
+    "15": "dep",
+    "16": "det",
+    "17": "discourse",
+    "18": "dislocated",
+    "19": "expl",
+    "20": "fixed",
+    "21": "flat",
+    "22": "goeswith",
+    "23": "iobj",
+    "24": "list",
+    "25": "mark",
+    "26": "nmod",
+    "27": "nsubj",
+    "28": "nummod",
+    "29": "obj",
+    "30": "obl",
+    "31": "orphan",
+    "32": "parataxis",
+    "33": "punct",
+    "34": "reparandum",
+    "35": "root",
+    "36": "vocative",
+    "37": "xcomp",
+    "38": "dup",
+    "39": "mwe",
+    "40": "name",
+    "41": "remnant"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "_": 0,
+    "acl": 1,
+    "advcl": 2,
+    "advmod": 3,
+    "amod": 4,
+    "appos": 5,
+    "aux": 6,
+    "case": 7,
+    "cc": 8,
+    "ccomp": 9,
+    "clf": 10,
+    "compound": 11,
+    "conj": 12,
+    "cop": 13,
+    "csubj": 14,
+    "dep": 15,
+    "det": 16,
+    "discourse": 17,
+    "dislocated": 18,
+    "dup": 38,
+    "expl": 19,
+    "fixed": 20,
+    "flat": 21,
+    "goeswith": 22,
+    "iobj": 23,
+    "list": 24,
+    "mark": 25,
+    "mwe": 39,
+    "name": 40,
+    "nmod": 26,
+    "nsubj": 27,
+    "nummod": 28,
+    "obj": 29,
+    "obl": 30,
+    "orphan": 31,
+    "parataxis": 32,
+    "punct": 33,
+    "remnant": 41,
+    "reparandum": 34,
+    "root": 35,
+    "vocative": 36,
+    "xcomp": 37
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "prediction_heads": {
+    "default": {
+      "activation_function": "gelu",
+      "bias": true,
+      "embedding_size": 768,
+      "head_type": "masked_lm",
+      "label2id": null,
+      "layer_norm": true,
+      "layers": 2,
+      "shift_labels": false,
+      "vocab_size": 119547
+    },
+    "ud_Maghrebi_Arabic_French-Arabizi": {
+      "head_type": "dependency_parsing",
+      "label2id": {
+        "_": 0,
+        "acl": 1,
+        "advcl": 2,
+        "advmod": 3,
+        "amod": 4,
+        "appos": 5,
+        "aux": 6,
+        "case": 7,
+        "cc": 8,
+        "ccomp": 9,
+        "clf": 10,
+        "compound": 11,
+        "conj": 12,
+        "cop": 13,
+        "csubj": 14,
+        "dep": 15,
+        "det": 16,
+        "discourse": 17,
+        "dislocated": 18,
+        "dup": 38,
+        "expl": 19,
+        "fixed": 20,
+        "flat": 21,
+        "goeswith": 22,
+        "iobj": 23,
+        "list": 24,
+        "mark": 25,
+        "mwe": 39,
+        "name": 40,
+        "nmod": 26,
+        "nsubj": 27,
+        "nummod": 28,
+        "obj": 29,
+        "obl": 30,
+        "orphan": 31,
+        "parataxis": 32,
+        "punct": 33,
+        "remnant": 41,
+        "reparandum": 34,
+        "root": 35,
+        "vocative": 36,
+        "xcomp": 37
+      },
+      "num_labels": 42
+    }
+  },
+  "torch_dtype": "float32",
+  "transformers_version": "4.47.1",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 119547
+}

Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ccebd61f2628295313be72e9bff8b5b6bb85dd40f61bd31d1ad2b0627a1db6c1
+size 820332812

Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/train_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 20.0,
+    "total_flos": 4.185802010861568e+16,
+    "train_loss": 267.56802662037035,
+    "train_runtime": 4171.6448,
+    "train_samples_per_second": 57.876,
+    "train_steps_per_second": 0.906
+}

Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/trainer_state.json ADDED Viewed

	@@ -0,0 +1,231 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 20.0,
+  "eval_steps": 500,
+  "global_step": 3780,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 3.0555965966648526,
+      "las": 50.02414292612265,
+      "step": 189,
+      "uas": 65.37904394012554
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 3.4216131700409784,
+      "las": 55.72187349106712,
+      "step": 378,
+      "uas": 68.75905359729599
+    },
+    {
+      "epoch": 2.6455026455026456,
+      "grad_norm": 12.44039535522461,
+      "learning_rate": 0.00017354497354497354,
+      "loss": 277.0153,
+      "step": 500
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 3.969351053237915,
+      "las": 53.790439401255426,
+      "step": 567,
+      "uas": 69.33848382423949
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 3.998707585864597,
+      "las": 53.307580878802504,
+      "step": 756,
+      "uas": 66.58619024625784
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 4.432359602716234,
+      "las": 53.11443746982134,
+      "step": 945,
+      "uas": 67.26219217769194
+    },
+    {
+      "epoch": 5.291005291005291,
+      "grad_norm": 3.5135657787323,
+      "learning_rate": 0.0001470899470899471,
+      "loss": 269.3351,
+      "step": 1000
+    },
+    {
+      "epoch": 6.0,
+      "eval_loss": 4.637390759256151,
+      "las": 54.901014002897156,
+      "step": 1134,
+      "uas": 68.17962337035249
+    },
+    {
+      "epoch": 7.0,
+      "eval_loss": 4.736105018191868,
+      "las": 55.72187349106712,
+      "step": 1323,
+      "uas": 68.0830516658619
+    },
+    {
+      "epoch": 7.936507936507937,
+      "grad_norm": 1.9263081550598145,
+      "learning_rate": 0.00012063492063492063,
+      "loss": 265.2211,
+      "step": 1500
+    },
+    {
+      "epoch": 8.0,
+      "eval_loss": 5.14470981227027,
+      "las": 54.99758570738773,
+      "step": 1512,
+      "uas": 68.32448092708836
+    },
+    {
+      "epoch": 9.0,
+      "eval_loss": 5.348928583992852,
+      "las": 55.432158377595364,
+      "step": 1701,
+      "uas": 68.32448092708836
+    },
+    {
+      "epoch": 10.0,
+      "eval_loss": 5.436303801006741,
+      "las": 55.33558667310478,
+      "step": 1890,
+      "uas": 67.69676484789957
+    },
+    {
+      "epoch": 10.582010582010582,
+      "grad_norm": 1.5898433923721313,
+      "learning_rate": 9.417989417989419e-05,
+      "loss": 265.6262,
+      "step": 2000
+    },
+    {
+      "epoch": 11.0,
+      "eval_loss": 5.713245603773329,
+      "las": 55.38387252535008,
+      "step": 2079,
+      "uas": 68.46933848382423
+    },
+    {
+      "epoch": 12.0,
+      "eval_loss": 6.334327379862468,
+      "las": 54.94929985514244,
+      "step": 2268,
+      "uas": 68.17962337035249
+    },
+    {
+      "epoch": 13.0,
+      "eval_loss": 6.122544633017646,
+      "las": 55.14244326412361,
+      "step": 2457,
+      "uas": 68.37276677933366
+    },
+    {
+      "epoch": 13.227513227513228,
+      "grad_norm": 0.9446262717247009,
+      "learning_rate": 6.772486772486773e-05,
+      "loss": 265.4083,
+      "step": 2500
+    },
+    {
+      "epoch": 14.0,
+      "eval_loss": 6.367215209537083,
+      "las": 55.915016900048286,
+      "step": 2646,
+      "uas": 69.19362626750362
+    },
+    {
+      "epoch": 15.0,
+      "eval_loss": 6.573224518034193,
+      "las": 55.2390149686142,
+      "step": 2835,
+      "uas": 68.75905359729599
+    },
+    {
+      "epoch": 15.873015873015873,
+      "grad_norm": 0.8732636570930481,
+      "learning_rate": 4.126984126984127e-05,
+      "loss": 266.2385,
+      "step": 3000
+    },
+    {
+      "epoch": 16.0,
+      "eval_loss": 6.693118174870809,
+      "las": 55.67358763882182,
+      "step": 3024,
+      "uas": 69.19362626750362
+    },
+    {
+      "epoch": 17.0,
+      "eval_loss": 6.8626424471537275,
+      "las": 56.204732013520044,
+      "step": 3213,
+      "uas": 69.19362626750362
+    },
+    {
+      "epoch": 18.0,
+      "eval_loss": 7.04522709051768,
+      "las": 56.30130371801062,
+      "step": 3402,
+      "uas": 69.72477064220183
+    },
+    {
+      "epoch": 18.51851851851852,
+      "grad_norm": 0.7804134488105774,
+      "learning_rate": 1.4814814814814815e-05,
+      "loss": 264.3582,
+      "step": 3500
+    },
+    {
+      "epoch": 19.0,
+      "eval_loss": 7.162810643513997,
+      "las": 55.67358763882182,
+      "step": 3591,
+      "uas": 69.09705456301303
+    },
+    {
+      "epoch": 20.0,
+      "eval_loss": 7.247331725226508,
+      "las": 55.915016900048286,
+      "step": 3780,
+      "uas": 69.09705456301303
+    },
+    {
+      "epoch": 20.0,
+      "step": 3780,
+      "total_flos": 4.185802010861568e+16,
+      "train_loss": 267.56802662037035,
+      "train_runtime": 4171.6448,
+      "train_samples_per_second": 57.876,
+      "train_steps_per_second": 0.906
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 3780,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 20,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 4.185802010861568e+16,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": null
+}

Generalize/UD_Arabic-PADT-UD_Maghrebi_Arabic_French-Arabizi/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:188b95de8151ae70ed7a746a39e4ec0a00e25dc16be8c4f282ffef1ec2eb117a
+size 5496