Upload InkubaLM multi-task with adapters

Files changed (10) hide show

config.json CHANGED Viewed

@@ -2,11 +2,46 @@
   "_name_or_path": "lelapa/InkubaLM-0.4B",
   "adapters": {
     "adapters": {
-      "machine-translation": "seq_bn",
       "sentiment-analysis": "seq_bn",
       "xnli": "seq_bn"
     },
-    "config_map": {},
     "fusion_config_map": {},
     "fusion_name_map": {},
     "fusions": {}

   "_name_or_path": "lelapa/InkubaLM-0.4B",
   "adapters": {
     "adapters": {
+      "machine-translation": "26cd1b10db746518",
       "sentiment-analysis": "seq_bn",
       "xnli": "seq_bn"
     },
+    "config_map": {
+      "26cd1b10db746518": {
+        "adapter_residual_before_ln": false,
+        "cross_adapter": false,
+        "dropout": 0.0,
+        "factorized_phm_W": true,
+        "factorized_phm_rule": false,
+        "hypercomplex_nonlinearity": "glorot-uniform",
+        "init_weights": "bert",
+        "inv_adapter": null,
+        "inv_adapter_reduction_factor": null,
+        "is_parallel": false,
+        "learn_phm": true,
+        "leave_out": [],
+        "ln_after": false,
+        "ln_before": false,
+        "mh_adapter": false,
+        "non_linearity": "relu",
+        "original_ln_after": true,
+        "original_ln_before": true,
+        "output_adapter": true,
+        "phm_bias": true,
+        "phm_c_init": "normal",
+        "phm_dim": 4,
+        "phm_init_range": 0.0001,
+        "phm_layer": false,
+        "phm_rank": 1,
+        "reduction_factor": 8,
+        "residual_before_ln": true,
+        "scaling": 1.0,
+        "shared_W_phm": false,
+        "shared_phm_rule": true,
+        "stochastic_depth": 0.0,
+        "use_gating": false
+      }
+    },
     "fusion_config_map": {},
     "fusion_name_map": {},
     "fusions": {}

machine-translation/adapter_config.json CHANGED Viewed

@@ -25,7 +25,7 @@
     "phm_init_range": 0.0001,
     "phm_layer": false,
     "phm_rank": 1,
-    "reduction_factor": 16,
     "residual_before_ln": true,
     "scaling": 1.0,
     "shared_W_phm": false,

     "phm_init_range": 0.0001,
     "phm_layer": false,
     "phm_rank": 1,
+    "reduction_factor": 8,
     "residual_before_ln": true,
     "scaling": 1.0,
     "shared_W_phm": false,

machine-translation/pytorch_adapter.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc47aca23a01a521202b599519696e10a8b03a4c10b86d7e3a310cbd7dfbdc6d
-size 16859030

 version https://git-lfs.github.com/spec/v1
+oid sha256:05181a303bdf4633323da7cd7cc42c0dc42de0047093fd154bd3d3cf56475ccb
+size 33640406

machine-translation/pytorch_model_head.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a95f248b1ba49ae1ae7000ec31584083fefccc4d66397773748d39d0f3c1e82
 size 523218998

 version https://git-lfs.github.com/spec/v1
+oid sha256:11fd55df1c791afae000989604f2fefa0e12abd715657be35bf2a00a393874cd
 size 523218998

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1c6afbf71ace664bd28406e25b8ce5afca0eccfc3011e7f72cca267d017e53e9
-size 3264041952

 version https://git-lfs.github.com/spec/v1
+oid sha256:e02a8f87608cbc40d6a46096618ad785ab8dfff3f75d0ef496ede17c994c4901
+size 3280823264

sentiment-analysis/pytorch_adapter.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:64cc397b31b51d58f07ce860a91ce71fd759b9ed8084931ca76a951c4146fa4a
 size 16859030

 version https://git-lfs.github.com/spec/v1
+oid sha256:b67fe84a865c161706578ea8e295c8f158b246896b98e8ee767e455f0fe5fded
 size 16859030

sentiment-analysis/pytorch_model_head.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e3b4a4fecbb3da2184e373f5f5f826c098bc440b03fee12b528e5e5e4554c3fc
 size 16812200

 version https://git-lfs.github.com/spec/v1
+oid sha256:cf7eac6525f75894ce9e9adbed2e71322205cbd82d0619042b473d006ab9edbc
 size 16812200

tokenizer.json CHANGED Viewed

@@ -1,7 +1,21 @@
 {
   "version": "1.0",
-  "truncation": null,
-  "padding": null,
   "added_tokens": [
     {
       "id": 0,

 {
   "version": "1.0",
+  "truncation": {
+    "direction": "Right",
+    "max_length": 128,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
+  "padding": {
+    "strategy": {
+      "Fixed": 128
+    },
+    "direction": "Left",
+    "pad_to_multiple_of": null,
+    "pad_id": 2,
+    "pad_type_id": 0,
+    "pad_token": "</s>"
+  },
   "added_tokens": [
     {
       "id": 0,

xnli/pytorch_adapter.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3d91c96805d108be1de37eff8546ba63dad24e08f9366104bcb3a2c402725cf1
 size 16858582

 version https://git-lfs.github.com/spec/v1
+oid sha256:0a584e75646d868757e70744f3fed1c83c25d66ff6cdf9994d6775d70874a806
 size 16858582

xnli/pytorch_model_head.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:190ceda766cc08d3d537b7ac71c3980ca14c5edccbbffcd6e975928faac12477
 size 16812136

 version https://git-lfs.github.com/spec/v1
+oid sha256:f1366e1b83a7b97a418f3f3053659d15a96ac13a53b4114249979ca6fce64fbd
 size 16812136