Spaces:
Running
Running
Update imports and refactor model configuration to use ACTIVE_MODEL for improved clarity and consistency
Browse files
src/knowledge_base/dataset.py
CHANGED
|
@@ -10,7 +10,7 @@ from datetime import datetime
|
|
| 10 |
from huggingface_hub import HfApi, HfFolder
|
| 11 |
from langchain_community.vectorstores import FAISS
|
| 12 |
from config.settings import VECTOR_STORE_PATH, HF_TOKEN, EMBEDDING_MODEL
|
| 13 |
-
from
|
| 14 |
|
| 15 |
class DatasetManager:
|
| 16 |
def __init__(self, dataset_name="Rulga/status-law-knowledge-base", token: Optional[str] = None):
|
|
|
|
| 10 |
from huggingface_hub import HfApi, HfFolder
|
| 11 |
from langchain_community.vectorstores import FAISS
|
| 12 |
from config.settings import VECTOR_STORE_PATH, HF_TOKEN, EMBEDDING_MODEL
|
| 13 |
+
from langchain_community.embeddings import HuggingFaceEmbeddings # Updated import
|
| 14 |
|
| 15 |
class DatasetManager:
|
| 16 |
def __init__(self, dataset_name="Rulga/status-law-knowledge-base", token: Optional[str] = None):
|
src/training/model_manager.py
CHANGED
|
@@ -9,7 +9,7 @@ from typing import List, Dict, Any, Tuple, Optional
|
|
| 9 |
import logging
|
| 10 |
from huggingface_hub import HfApi, snapshot_download
|
| 11 |
from transformers import AutoModelForCausalLM, AutoTokenizer
|
| 12 |
-
from config.settings import MODEL_PATH, MODELS_REGISTRY_PATH,
|
| 13 |
|
| 14 |
logging.basicConfig(
|
| 15 |
level=logging.INFO,
|
|
@@ -184,7 +184,7 @@ def get_model(
|
|
| 184 |
(model, tokenizer, model_info)
|
| 185 |
"""
|
| 186 |
try:
|
| 187 |
-
model_path =
|
| 188 |
|
| 189 |
tokenizer = AutoTokenizer.from_pretrained(
|
| 190 |
model_path,
|
|
@@ -197,7 +197,7 @@ def get_model(
|
|
| 197 |
device_map="auto" if device == "cuda" else None
|
| 198 |
)
|
| 199 |
|
| 200 |
-
return model, tokenizer,
|
| 201 |
|
| 202 |
except Exception as e:
|
| 203 |
logger.error(f"Error loading model: {str(e)}")
|
|
@@ -209,10 +209,10 @@ if __name__ == "__main__":
|
|
| 209 |
|
| 210 |
# Register base model from config
|
| 211 |
success, message = manager.register_model(
|
| 212 |
-
model_id=
|
| 213 |
-
version=
|
| 214 |
-
source=
|
| 215 |
-
description=
|
| 216 |
is_active=True
|
| 217 |
)
|
| 218 |
print(message)
|
|
|
|
| 9 |
import logging
|
| 10 |
from huggingface_hub import HfApi, snapshot_download
|
| 11 |
from transformers import AutoModelForCausalLM, AutoTokenizer
|
| 12 |
+
from config.settings import MODEL_PATH, MODELS_REGISTRY_PATH, MODELS, ACTIVE_MODEL
|
| 13 |
|
| 14 |
logging.basicConfig(
|
| 15 |
level=logging.INFO,
|
|
|
|
| 184 |
(model, tokenizer, model_info)
|
| 185 |
"""
|
| 186 |
try:
|
| 187 |
+
model_path = ACTIVE_MODEL["training"]["fine_tuned_path"] if version else ACTIVE_MODEL["training"]["base_model_path"]
|
| 188 |
|
| 189 |
tokenizer = AutoTokenizer.from_pretrained(
|
| 190 |
model_path,
|
|
|
|
| 197 |
device_map="auto" if device == "cuda" else None
|
| 198 |
)
|
| 199 |
|
| 200 |
+
return model, tokenizer, ACTIVE_MODEL
|
| 201 |
|
| 202 |
except Exception as e:
|
| 203 |
logger.error(f"Error loading model: {str(e)}")
|
|
|
|
| 209 |
|
| 210 |
# Register base model from config
|
| 211 |
success, message = manager.register_model(
|
| 212 |
+
model_id=ACTIVE_MODEL["id"].split("/")[-1], # Extract model name from full HF path
|
| 213 |
+
version=ACTIVE_MODEL["type"],
|
| 214 |
+
source=ACTIVE_MODEL["id"],
|
| 215 |
+
description=ACTIVE_MODEL["description"],
|
| 216 |
is_active=True
|
| 217 |
)
|
| 218 |
print(message)
|