Update config.json
config.json (+18, -10)
```diff
@@ -1,16 +1,6 @@
 {
   "model_type": "transformer",
   "task_type": "CAUSAL_LM",
-  "base_model": "base_model",
-  "load_in_4bit": true,
-  "quantization_config": {
-    "quantization_type": "4bit",
-    "load_in_4bit": true
-    // Add any other relevant quantization settings here if needed.
-  },
-  "torch_dtype": "bfloat16",
-  "device_map": "auto",
-  "trust_remote_code": true,
   "peft_config": {
     "lora_alpha": 16,
     "lora_dropout": 0.1,
@@ -18,5 +8,23 @@
     "bias": "none",
     "task_type": "CAUSAL_LM",
     "target_modules": ["q_proj", "k_proj", "v_proj", "o_proj", "gate_proj"]
+  },
+  "training_arguments": {
+    "output_dir": "./results",
+    "num_train_epochs": 1,
+    "per_device_train_batch_size": 4,
+    "gradient_accumulation_steps": 1,
+    "optim": "paged_adamw_32bit",
+    "save_steps": 50,
+    "logging_steps": 1,
+    "learning_rate": 2e-4,
+    "weight_decay": 0.001,
+    "fp16": false,
+    "bf16": false,
+    "max_grad_norm": 0.3,
+    "max_steps": -1,
+    "warmup_ratio": 0.03,
+    "group_by_length": true,
+    "lr_scheduler_type": "constant"
   }
 }
```
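The keys removed in the first hunk (`base_model`, `load_in_4bit`, `quantization_config`, `torch_dtype`, `device_map`, `trust_remote_code`) are model-loading settings rather than task configuration. A minimal sketch of where such settings typically live instead, assuming a Hugging Face transformers + bitsandbytes stack (the commit itself does not say how the file is consumed, and the model ID below is just the placeholder from the old config):

```python
# Sketch only: supplying the removed keys at model-load time instead of
# keeping them in config.json. The transformers/bitsandbytes stack is an
# assumption, not part of this commit.
import torch
from transformers import AutoModelForCausalLM, BitsAndBytesConfig

bnb_config = BitsAndBytesConfig(load_in_4bit=True)  # was "load_in_4bit" / "quantization_config"

model = AutoModelForCausalLM.from_pretrained(
    "base_model",                  # placeholder value from the old "base_model" key
    quantization_config=bnb_config,
    torch_dtype=torch.bfloat16,    # was "torch_dtype": "bfloat16"
    device_map="auto",             # was "device_map": "auto"
    trust_remote_code=True,        # was "trust_remote_code": true
)
```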
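The sections that remain line up with common library objects: the `peft_config` keys (`lora_alpha`, `lora_dropout`, `bias`, `task_type`, `target_modules`) match `peft.LoraConfig` parameters, and the new `training_arguments` keys match `transformers.TrainingArguments` parameters. A hedged sketch of how a training script might consume the updated file, assuming that stack:

```python
# Sketch only: one plausible way to consume the updated config.json.
# Assumes Hugging Face peft + transformers; this loader is illustrative
# and not part of the commit.
import json

from peft import LoraConfig
from transformers import TrainingArguments

with open("config.json") as f:
    cfg = json.load(f)

# "peft_config" keys correspond to peft.LoraConfig parameters.
lora_config = LoraConfig(**cfg["peft_config"])

# The new "training_arguments" keys correspond to
# transformers.TrainingArguments parameters.
training_args = TrainingArguments(**cfg["training_arguments"])
```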