ceperaltab committed on
Commit
7cb962d
·
verified ·
1 Parent(s): fe0f10c

Upload train.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. train.py +2 -2
train.py CHANGED
@@ -13,9 +13,9 @@ from trl import SFTTrainer
13
  # --- CONFIGURATION ---
14
  # Base model: Using a quantized Llama 3 or Mistral is recommended for consumer GPUs.
15
  # Ensure you have access to the model on Hugging Face (might need login).
16
- MODEL_NAME = "meta-llama/Meta-Llama-3-8B"
17
  DATASET_NAME = "ceperaltab/elixir-golden-dataset"
18
- OUTPUT_DIR = "elixir-model-adapter"
19
 
20
  def main():
21
  print(f"Loading dataset from {DATASET_NAME}...")
 
13
  # --- CONFIGURATION ---
14
  # Base model: Using a quantized Llama 3 or Mistral is recommended for consumer GPUs.
15
  # Ensure you have access to the model on Hugging Face (might need login).
16
+ MODEL_NAME = "Qwen/Qwen2.5-Coder-7B-Instruct"
17
  DATASET_NAME = "ceperaltab/elixir-golden-dataset"
18
+ OUTPUT_DIR = "elixir-model-qwen"
19
 
20
  def main():
21
  print(f"Loading dataset from {DATASET_NAME}...")