sahanes committed
Commit 31b1380 · verified · 1 Parent(s): 93b3774

Update config.json

Files changed (1): config.json (+10, -19)
config.json CHANGED
@@ -1,6 +1,16 @@
 {
   "model_type": "transformer",
   "task_type": "CAUSAL_LM",
+  "base_model": "base_model",
+  "load_in_4bit": true,
+  "quantization_config": {
+    "quantization_type": "4bit",
+    "load_in_4bit": true
+    // Add any other relevant quantization settings here if needed.
+  },
+  "torch_dtype": "bfloat16",
+  "device_map": "auto",
+  "trust_remote_code": true,
   "peft_config": {
     "lora_alpha": 16,
     "lora_dropout": 0.1,
@@ -8,24 +18,5 @@
     "bias": "none",
     "task_type": "CAUSAL_LM",
     "target_modules": ["q_proj", "k_proj", "v_proj", "o_proj", "gate_proj"]
-  },
-  "training_arguments": {
-    "output_dir": "./results",
-    "num_train_epochs": 1,
-    "per_device_train_batch_size": 4,
-    "gradient_accumulation_steps": 1,
-    "optim": "paged_adamw_32bit",
-    "save_steps": 50,
-    "logging_steps": 1,
-    "learning_rate": 2e-4,
-    "weight_decay": 0.001,
-    "fp16": false,
-    "bf16": false,
-    "max_grad_norm": 0.3,
-    "max_steps": -1,
-    "warmup_ratio": 0.03,
-    "group_by_length": true,
-    "lr_scheduler_type": "constant"
-  }
   }
 }
-
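After this change, config.json reads like the model-loading half of a QLoRA-style setup (a 4-bit quantized base model plus a LoRA adapter), with the training arguments dropped. Below is a minimal sketch of how these fields could be consumed with transformers and peft; it is not part of the repo, it assumes the `//` comment is removed so the file parses as strict JSON, and it assumes the placeholder "base_model" is replaced with a real model id. Only fields visible in this diff are mapped.

```python
import json

import torch
from peft import LoraConfig, get_peft_model
from transformers import AutoModelForCausalLM, BitsAndBytesConfig

# Load the committed config. The file as committed contains a `//` comment,
# which strict JSON parsers reject, so that line must be stripped first.
with open("config.json") as f:
    cfg = json.load(f)

# Map the new quantization-related fields onto a BitsAndBytesConfig.
bnb_config = BitsAndBytesConfig(
    load_in_4bit=cfg["load_in_4bit"],
    bnb_4bit_compute_dtype=torch.bfloat16,  # mirrors "torch_dtype": "bfloat16"
)

# "base_model" is a placeholder value in the committed file; a real
# Hugging Face model id would go here.
model = AutoModelForCausalLM.from_pretrained(
    cfg["base_model"],
    quantization_config=bnb_config,
    device_map=cfg["device_map"],
    trust_remote_code=cfg["trust_remote_code"],
    torch_dtype=torch.bfloat16,
)

# Map the "peft_config" fields shown in this diff onto a LoraConfig and
# wrap the quantized base model with a LoRA adapter.
peft_cfg = cfg["peft_config"]
lora_config = LoraConfig(
    lora_alpha=peft_cfg["lora_alpha"],
    lora_dropout=peft_cfg["lora_dropout"],
    bias=peft_cfg["bias"],
    task_type=peft_cfg["task_type"],
    target_modules=peft_cfg["target_modules"],
)
model = get_peft_model(model, lora_config)
model.print_trainable_parameters()
```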