Upload train_memory_agent.py with huggingface_hub
Browse files
- train_memory_agent.py +2 -3
train_memory_agent.py
CHANGED
|
@@ -16,10 +16,9 @@ from peft import LoraConfig
|
|
| 16 |
from trl import SFTTrainer, SFTConfig
|
| 17 |
|
| 18 |
print("Loading dataset...")
|
| 19 |
-
dataset = load_dataset("erik1988/
|
| 20 |
print(f"Dataset loaded: {len(dataset)} examples")
|
| 21 |
print(f"Columns: {dataset.column_names}")
|
| 22 |
-
print(f"First example keys: {dataset[0].keys()}")
|
| 23 |
|
| 24 |
dataset_split = dataset.train_test_split(test_size=0.1, seed=42)
|
| 25 |
train_dataset = dataset_split["train"]
|
|
@@ -55,7 +54,7 @@ config = SFTConfig(
|
|
| 55 |
gradient_checkpointing=True,
|
| 56 |
report_to="trackio",
|
| 57 |
project="way2agi-memory-agent",
|
| 58 |
-
run_name="memory-agent-sft-
|
| 59 |
)
|
| 60 |
|
| 61 |
print("Initializing trainer...")
|
|
|
|
| 16 |
from trl import SFTTrainer, SFTConfig
|
| 17 |
|
| 18 |
print("Loading dataset...")
|
| 19 |
+
dataset = load_dataset("erik1988/way2agi-memory-agent-sft", data_files="memory-agent-sft-v3-merged.jsonl", split="train")
|
| 20 |
print(f"Dataset loaded: {len(dataset)} examples")
|
| 21 |
print(f"Columns: {dataset.column_names}")
|
|
|
|
| 22 |
|
| 23 |
dataset_split = dataset.train_test_split(test_size=0.1, seed=42)
|
| 24 |
train_dataset = dataset_split["train"]
|
|
|
|
| 54 |
gradient_checkpointing=True,
|
| 55 |
report_to="trackio",
|
| 56 |
project="way2agi-memory-agent",
|
| 57 |
+
run_name="memory-agent-sft-v3-qwen1.5b",
|
| 58 |
)
|
| 59 |
|
| 60 |
print("Initializing trainer...")
|