ceperaltab
/

neo4j-training-code

ceperaltab committed on Jan 22

Commit

4311ca5

verified ·

1 Parent(s): fbaf8cb

Upload train.py with huggingface_hub

Files changed (1) hide show

train.py CHANGED Viewed

@@ -116,20 +116,20 @@ def main():
         gradient_checkpointing=True,
         save_strategy="epoch",
         report_to="none",
-        warmup_ratio=0.03,
         lr_scheduler_type="cosine",
         # Push to Hugging Face Hub
         push_to_hub=True,
         hub_model_id=f"{HF_USERNAME}/{OUTPUT_DIR}",
     )
-    # Initialize trainer
     trainer = SFTTrainer(
         model=model,
         train_dataset=dataset,
         peft_config=peft_config,
         formatting_func=formatting_prompts_func,
-        max_seq_length=1024,
         tokenizer=tokenizer,
         args=training_args,
     )

         gradient_checkpointing=True,
         save_strategy="epoch",
         report_to="none",
+        warmup_steps=100,
         lr_scheduler_type="cosine",
+        max_seq_length=1024,
         # Push to Hugging Face Hub
         push_to_hub=True,
         hub_model_id=f"{HF_USERNAME}/{OUTPUT_DIR}",
     )
+    # Initialize trainer (TRL 0.27+ API)
     trainer = SFTTrainer(
         model=model,
         train_dataset=dataset,
         peft_config=peft_config,
         formatting_func=formatting_prompts_func,
         tokenizer=tokenizer,
         args=training_args,
     )