Model save

Browse files

Files changed (5) hide show

README.md +48 -0
config.json +115 -0
generation_config.json +5 -0
model.safetensors +3 -0
training_args.bin +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,48 @@

+---
+license: apache-2.0
+base_model: bert-base-uncased
+tags:
+- generated_from_trainer
+model-index:
+- name: all
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# all
+This model is a fine-tuned version of [bert-base-uncased](https://huggingface.co/bert-base-uncased) on an unknown dataset.
+## Model description
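+A `BertAdapterModel` built on `bert-base-uncased` with a single adapter named `ner` (reduction factor 2, ReLU non-linearity) and a `tagging` prediction head that predicts 7 BIO labels: `O`, `B-test`/`I-test`, `B-problem`/`I-problem`, and `B-treatment`/`I-treatment`. Further details are still needed.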
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0008
+- train_batch_size: 16
+- eval_batch_size: 8
+- seed: 42
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- num_epochs: 10
+### Framework versions
+- Transformers 4.35.2
+- Pytorch 2.1.0+cu118
+- Datasets 2.15.0
+- Tokenizers 0.15.0

config.json ADDED Viewed

	@@ -0,0 +1,115 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "adapters": {
+    "adapters": {
+      "ner": "e15331acc3f0a5c0"
+    },
+    "config_map": {
+      "e15331acc3f0a5c0": {
+        "adapter_residual_before_ln": false,
+        "cross_adapter": false,
+        "factorized_phm_W": true,
+        "factorized_phm_rule": false,
+        "hypercomplex_nonlinearity": "glorot-uniform",
+        "init_weights": "bert",
+        "inv_adapter": null,
+        "inv_adapter_reduction_factor": null,
+        "is_parallel": false,
+        "learn_phm": true,
+        "leave_out": [],
+        "ln_after": false,
+        "ln_before": false,
+        "mh_adapter": false,
+        "non_linearity": "relu",
+        "original_ln_after": true,
+        "original_ln_before": true,
+        "output_adapter": true,
+        "phm_bias": true,
+        "phm_c_init": "normal",
+        "phm_dim": 4,
+        "phm_init_range": 0.0001,
+        "phm_layer": false,
+        "phm_rank": 1,
+        "reduction_factor": 2,
+        "residual_before_ln": true,
+        "scaling": 1.0,
+        "shared_W_phm": false,
+        "shared_phm_rule": true,
+        "use_gating": false
+      }
+    },
+    "fusion_config_map": {},
+    "fusions": {}
+  },
+  "architectures": [
+    "BertAdapterModel"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "custom_heads": {},
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "O",
+    "1": "B-test",
+    "2": "I-test",
+    "3": "B-problem",
+    "4": "I-problem",
+    "5": "B-treatment",
+    "6": "I-treatment"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "B-problem": 3,
+    "B-test": 1,
+    "B-treatment": 5,
+    "I-problem": 4,
+    "I-test": 2,
+    "I-treatment": 6,
+    "O": 0
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "prediction_heads": {
+    "default": {
+      "activation_function": "gelu",
+      "bias": true,
+      "embedding_size": 768,
+      "head_type": "masked_lm",
+      "label2id": null,
+      "layer_norm": true,
+      "layers": 2,
+      "shift_labels": false,
+      "vocab_size": 30522
+    },
+    "ner": {
+      "activation_function": "tanh",
+      "dropout_prob": null,
+      "head_type": "tagging",
+      "label2id": {
+        "B-problem": 3,
+        "B-test": 1,
+        "B-treatment": 5,
+        "I-problem": 4,
+        "I-test": 2,
+        "I-treatment": 6,
+        "O": 0
+      },
+      "layers": 1,
+      "num_labels": 7
+    }
+  },
+  "torch_dtype": "float32",
+  "transformers_version": "4.35.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "_from_model_config": true,
+  "pad_token_id": 0,
+  "transformers_version": "4.35.2"
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:deb0d97a3ff79230ca79fb1a3c3969b89df0dd99710905ef5f87b2958710a0c9
+size 468838228

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e83baaf7b7beefc9b4a61dcb3d0f20379c9e9a460d1675b482027d13202a602
+size 4536