Upload train.py with huggingface_hub
Browse files
train.py
CHANGED
|
@@ -13,9 +13,9 @@ from trl import SFTTrainer
|
|
| 13 |
# --- CONFIGURATION ---
|
| 14 |
# Base model: Using a quantized Llama 3 or Mistral is recommended for consumer GPUs.
|
| 15 |
# Ensure you have access to the model on Hugging Face (might need login).
|
| 16 |
-
MODEL_NAME = "
|
| 17 |
DATASET_NAME = "ceperaltab/elixir-golden-dataset"
|
| 18 |
-
OUTPUT_DIR = "elixir-model-
|
| 19 |
|
| 20 |
def main():
|
| 21 |
print(f"Loading dataset from {DATASET_NAME}...")
|
|
|
|
| 13 |
# --- CONFIGURATION ---
|
| 14 |
# Base model: a quantized model (e.g. Llama 3, Mistral, or Qwen2.5-Coder) is recommended for consumer GPUs.
|
| 15 |
# Ensure you have access to the model on Hugging Face (you may need to log in first).
|
| 16 |
+
MODEL_NAME = "Qwen/Qwen2.5-Coder-7B-Instruct"
|
| 17 |
DATASET_NAME = "ceperaltab/elixir-golden-dataset"
|
| 18 |
+
OUTPUT_DIR = "elixir-model-qwen"
|
| 19 |
|
| 20 |
def main():
|
| 21 |
print(f"Loading dataset from {DATASET_NAME}...")
|