Update config.json
config.json  CHANGED  +19 -1
@@ -8,6 +8,24 @@
 "bias": "none",
 "task_type": "CAUSAL_LM",
 "target_modules": ["q_proj", "k_proj", "v_proj", "o_proj", "gate_proj"]
+},
+"training_arguments": {
+"output_dir": "./results",
+"num_train_epochs": 1,
+"per_device_train_batch_size": 4,
+"gradient_accumulation_steps": 1,
+"optim": "paged_adamw_32bit",
+"save_steps": 50,
+"logging_steps": 1,
+"learning_rate": 2e-4,
+"weight_decay": 0.001,
+"fp16": false,
+"bf16": false,
+"max_grad_norm": 0.3,
+"max_steps": -1,
+"warmup_ratio": 0.03,
+"group_by_length": true,
+"lr_scheduler_type": "constant"
 }
-// Add any other model-specific settings here.
 }
+
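Two notes on this change. The removed line was a JSON comment ("// Add any other model-specific settings here."), which strict JSON does not allow, so dropping it makes the file parseable. The keys in the new "training_arguments" block correspond one-to-one to constructor parameters of transformers.TrainingArguments. Below is a minimal sketch of how the updated config.json might be consumed; the "lora_config" wrapper key is an assumption (lines 1-7 of the file are not shown in the diff), and only the fields visible above come from the commit.

import json

from peft import LoraConfig
from transformers import TrainingArguments

with open("config.json") as f:
    cfg = json.load(f)

# LoRA adapter settings. The "lora_config" key name is hypothetical;
# only its fields (bias, task_type, target_modules) appear in the diff.
lora_config = LoraConfig(
    bias=cfg["lora_config"]["bias"],                      # "none"
    task_type=cfg["lora_config"]["task_type"],            # "CAUSAL_LM"
    target_modules=cfg["lora_config"]["target_modules"],  # attention + gate projections
)

# The new "training_arguments" block maps directly onto TrainingArguments.
training_args = TrainingArguments(**cfg["training_arguments"])

With "fp16" and "bf16" both false, training runs in full 32-bit precision, and the "paged_adamw_32bit" optimizer requires the bitsandbytes package to be installed.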