Upload train_aviation.py with huggingface_hub
Browse files
- train_aviation.py +22 -16
train_aviation.py
CHANGED
|
@@ -18,26 +18,32 @@ import os
|
|
| 18 |
from huggingface_hub import list_repo_files
|
| 19 |
|
| 20 |
# DEBUG: confirm that an HF token is visible to this process and that the
# model repository can be listed with it before any heavy work starts.
# NOTE(review): the flattened diff does not show nesting; the final separator
# print is assumed to be top-level (printed on success and failure) - confirm.
separator = "=" * 40

token = os.getenv("HF_TOKEN")
print(f" HF_TOKEN env var present: {bool(token)}")
if token:
    # Only the first four characters are echoed, never the whole token.
    print(f" HF_TOKEN prefix: {token[:4]}...")

model_id = "mistralai/Ministral-3-14B-Reasoning-2512"
try:
    print(f" Attempting to list files for {model_id}...")
    files = list_repo_files(model_id, token=token)
    print(f" ✅ Success! Found {len(files)} files.")
    print(f" First 5 files: {files[:5]}")
except Exception as err:
    # Best-effort probe: report the failure and carry on with the script.
    print(f" ❌ Failed to list repo files: {err}")
print(separator)
|
| 36 |
|
| 37 |
from datasets import load_dataset
|
| 38 |
from peft import LoraConfig, prepare_model_for_kbit_training, get_peft_model
|
| 39 |
from trl import SFTTrainer, SFTConfig
|
| 40 |
-
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 41 |
|
| 42 |
# Model ID
|
| 43 |
# model_id defined above
|
|
|
|
| 18 |
from huggingface_hub import list_repo_files
|
| 19 |
|
| 20 |
# DEBUG: Check token and repo access
|
| 21 |
+
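# NOTE: the diagnostics code (HF_TOKEN check, `model_id` definition, list_repo_files probe) was replaced by this placeholder rather than kept; restore it, because `model_id` is still expected to be defined above.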
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 22 |
|
| 23 |
from datasets import load_dataset
|
| 24 |
from peft import LoraConfig, prepare_model_for_kbit_training, get_peft_model
|
| 25 |
from trl import SFTTrainer, SFTConfig
|
| 26 |
+
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, AutoConfig
|
| 27 |
+
|
| 28 |
+
# Register a config class under the 'ministral3' model type if needed.
#
# AutoConfig.register() raises ValueError when the class's `model_type`
# differs from the key being registered, and also when the key is already
# registered. The previous code passed Mistral3Config / MistralConfig directly
# (whose `model_type` is not "ministral3") and only caught ImportError, so the
# script crashed here. We now register a thin subclass with a matching
# `model_type` and handle ValueError explicitly.
print("🔧 Registering ministral3 config...")


def _find_ministral3_base_config():
    """Return ``(config_class, label)`` for the best available Mistral config.

    Tries, in order: the public ``Mistral3Config`` export, its internal module
    path, and finally the standard ``MistralConfig``. ``label`` is the text
    used in the "Registered ..." log line.

    Raises:
        ImportError: if not even ``MistralConfig`` can be imported.
    """
    try:
        # Available in very recent transformers releases.
        from transformers import Mistral3Config

        return Mistral3Config, "Mistral3Config"
    except ImportError:
        pass

    try:
        # Fallback to the internal path if the class is not exposed at top level.
        from transformers.models.mistral3.configuration_mistral3 import Mistral3Config

        return Mistral3Config, "Mistral3Config (internal)"
    except ImportError:
        pass

    # Last resort: the standard MistralConfig.
    print(" Mistral3Config not found, falling back to MistralConfig")
    from transformers import MistralConfig

    return MistralConfig, "MistralConfig"


_ministral3_base, _ministral3_label = _find_ministral3_base_config()


class _Ministral3AliasConfig(_ministral3_base):
    """Alias of the base config whose ``model_type`` matches the registered key.

    NOTE(review): this only makes the 'ministral3' name resolvable; whether the
    base class's fields fit the checkpoint's config is not verified here.
    """

    model_type = "ministral3"


try:
    AutoConfig.register("ministral3", _Ministral3AliasConfig)
except ValueError as err:
    # Typically means this transformers version already knows 'ministral3';
    # keep the built-in mapping rather than overriding it.
    print(f" Skipped ministral3 registration: {err}")
else:
    print(f" Registered ministral3 -> {_ministral3_label}")
|
| 47 |
|
| 48 |
# Model ID
|
| 49 |
# model_id defined above
|