Upload folder using huggingface_hub

Browse files

Files changed (11) hide show

config.json +49 -0
hyperpameters/experiment_state-2022-12-20_16-21-04.json +0 -0
hyperpameters/search_gen_state-2022-12-20_16-21-04.json +0 -0
hyperpameters/searcher-state-2022-12-20_16-21-04.pkl +3 -0
hyperparameters.csv +11 -0
optimizer.pt +3 -0
pytorch_model.bin +3 -0
scheduler.pt +3 -0
trainer_state.json +82 -0
training_args.bin +3 -0
training_resume.json +29 -0

config.json ADDED Viewed

	@@ -0,0 +1,49 @@

+{
+  "_name_or_path": "PlanTL-GOB-ES/roberta-base-bne",
+  "architectures": [
+    "RobertaForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.0,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
+  "eos_token_id": 2,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.23.1",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 50262
+}

hyperpameters/experiment_state-2022-12-20_16-21-04.json ADDED Viewed

The diff for this file is too large to render. See raw diff

hyperpameters/search_gen_state-2022-12-20_16-21-04.json ADDED Viewed

Binary file (1.21 kB). View file

hyperpameters/searcher-state-2022-12-20_16-21-04.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:55cacf51c25ea3f7859339f85b247ea83aa1a231ffbb487ebdca124c78aeaabe
+size 6775

hyperparameters.csv ADDED Viewed

	@@ -0,0 +1,11 @@

+objective,best,learning_rate,num_train_epochs,per_device_train_batch_size,warmup_steps,weight_decay,time_this_iter_s
+0.6443113896695691,True,3.180777925533466e-05,4,8,0,0.120996580489383,298.83673191070557
+0.6089856418323499,False,4.2608362046060736e-05,5,16,250,0.013431860702755793,277.2320647239685
+0.5095106557666577,False,1.0637577579349663e-05,2,8,250,0.1877430771288012,301.0902969837189
+0.472259840186323,False,4.1563816188891756e-05,5,8,1000,0.1161026692593292,300.9598762989044
+0.529856443331991,False,2.452236326363528e-05,1,8,500,0.10445925926224571,301.152028799057
+0.47216204569436443,False,3.933498237560027e-05,2,16,1000,0.24544607439873792,279.3527762889862
+0.5418994731991358,False,4.773883883904306e-05,1,8,0,0.06315173766701002,300.95647048950195
+0.5093720595534817,False,2.815232779630741e-05,2,16,0,0.10288070790935573,279.3547649383545
+0.5178339691369227,False,4.194670456106283e-05,3,16,250,0.20101691147250575,279.44476771354675
+0.4614279300033849,False,4.925349517520429e-05,1,8,1000,0.2706428191074305,300.6847951412201

optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:62578cf7cad109803c4dbea866db795c4ab3cd42bb3abefc0d893dab56b700fd
+size 997363397

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ce44e1a4be2ab3436c3db0824a5a447623f014a4b16c3b54c201bfad1c9a97bb
+size 498671285

scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bd7af3a64371d143c28cd7bebe6ce3d701696b700d984c227bd1b50c4691394e
+size 627

trainer_state.json ADDED Viewed

	@@ -0,0 +1,82 @@

+{
+  "best_metric": 0.8564009070396423,
+  "best_model_checkpoint": "./results/run-eb32b854/checkpoint-882",
+  "epoch": 4.0,
+  "global_step": 3528,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.0,
+      "learning_rate": 3.1798763444888135e-05,
+      "loss": 2.0373,
+      "step": 1
+    },
+    {
+      "epoch": 1.0,
+      "eval_f1": 0.4929364503071642,
+      "eval_loss": 0.8564009070396423,
+      "eval_runtime": 19.2818,
+      "eval_samples_per_second": 121.98,
+      "eval_steps_per_second": 15.248,
+      "step": 882
+    },
+    {
+      "epoch": 1.13,
+      "learning_rate": 2.2791968808811233e-05,
+      "loss": 0.9246,
+      "step": 1000
+    },
+    {
+      "epoch": 2.0,
+      "eval_f1": 0.6146216192253161,
+      "eval_loss": 0.8962076306343079,
+      "eval_runtime": 19.3209,
+      "eval_samples_per_second": 121.734,
+      "eval_steps_per_second": 15.217,
+      "step": 1764
+    },
+    {
+      "epoch": 2.27,
+      "learning_rate": 1.3776158362287801e-05,
+      "loss": 0.4402,
+      "step": 2000
+    },
+    {
+      "epoch": 3.0,
+      "eval_f1": 0.6171442898225464,
+      "eval_loss": 1.2047011852264404,
+      "eval_runtime": 19.3331,
+      "eval_samples_per_second": 121.656,
+      "eval_steps_per_second": 15.207,
+      "step": 2646
+    },
+    {
+      "epoch": 3.4,
+      "learning_rate": 4.760347915764371e-06,
+      "loss": 0.169,
+      "step": 3000
+    },
+    {
+      "epoch": 4.0,
+      "eval_f1": 0.6443113896695691,
+      "eval_loss": 1.3850061893463135,
+      "eval_runtime": 19.3579,
+      "eval_samples_per_second": 121.501,
+      "eval_steps_per_second": 15.188,
+      "step": 3528
+    }
+  ],
+  "max_steps": 3528,
+  "num_train_epochs": 4,
+  "total_flos": 5472186620003712.0,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 3.180777925533466e-05,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 8,
+    "warmup_steps": 0,
+    "weight_decay": 0.120996580489383
+  }
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:333dc0af7c718e703087a10096dc81062d9882971033588cac5592dc17d98477
+size 3387

training_resume.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+    "batch_train_size": 16,
+    "batch_val_size": 32,
+    "corpus": "text",
+    "dataset": "safercity",
+    "epochs": [
+        1,
+        2,
+        3,
+        4,
+        5
+    ],
+    "folder": "marIA",
+    "iterations": 10,
+    "labels": 8,
+    "model": "transformers",
+    "original_pretrained_model": "PlanTL-GOB-ES/roberta-base-bne",
+    "pretrained_model": "../assets/safercity/text/models/marIA",
+    "resources_per_trial": {
+        "gpu": 1
+    },
+    "run_id": "eb32b854",
+    "task": "",
+    "task_type": "classification",
+    "tokenizer_field": "tweet",
+    "tokenizer_model": "PlanTL-GOB-ES/roberta-base-bne",
+    "warmup_steps": 500,
+    "weight_decay": 0.01
+}