cpt core 4
Browse files
scripts/cpt_core_model_4.py
CHANGED
|
@@ -41,7 +41,8 @@ model = FastLanguageModel.get_peft_model(
     lora_dropout = 0, # Supports any, but = 0 is optimized
     bias = "none",    # Supports any, but = "none" is optimized
     # [NEW] "unsloth" uses 30% less VRAM, fits 2x larger batch sizes!
-    use_gradient_checkpointing = "unsloth", # True or "unsloth" for very long context
+    # use_gradient_checkpointing = "unsloth", # True or "unsloth" for very long context
+    use_gradient_checkpointing = False,
     random_state = 3407,
     use_rslora = True,  # We support rank stabilized LoRA
     loftq_config = None, # And LoftQ