Rulga commited on
Commit
f33b7bd
·
1 Parent(s): 2a3ccaf

Update imports and refactor model configuration to use ACTIVE_MODEL for improved clarity and consistency

Browse files
src/knowledge_base/dataset.py CHANGED
@@ -10,7 +10,7 @@ from datetime import datetime
10
  from huggingface_hub import HfApi, HfFolder
11
  from langchain_community.vectorstores import FAISS
12
  from config.settings import VECTOR_STORE_PATH, HF_TOKEN, EMBEDDING_MODEL
13
- from langchain.embeddings import HuggingFaceEmbeddings
14
 
15
  class DatasetManager:
16
  def __init__(self, dataset_name="Rulga/status-law-knowledge-base", token: Optional[str] = None):
 
10
  from huggingface_hub import HfApi, HfFolder
11
  from langchain_community.vectorstores import FAISS
12
  from config.settings import VECTOR_STORE_PATH, HF_TOKEN, EMBEDDING_MODEL
13
+ from langchain_community.embeddings import HuggingFaceEmbeddings # Updated import
14
 
15
  class DatasetManager:
16
  def __init__(self, dataset_name="Rulga/status-law-knowledge-base", token: Optional[str] = None):
src/training/model_manager.py CHANGED
@@ -9,7 +9,7 @@ from typing import List, Dict, Any, Tuple, Optional
9
  import logging
10
  from huggingface_hub import HfApi, snapshot_download
11
  from transformers import AutoModelForCausalLM, AutoTokenizer
12
- from config.settings import MODEL_PATH, MODELS_REGISTRY_PATH, MODEL_CONFIG
13
 
14
  logging.basicConfig(
15
  level=logging.INFO,
@@ -184,7 +184,7 @@ def get_model(
184
  (model, tokenizer, model_info)
185
  """
186
  try:
187
- model_path = MODEL_CONFIG["training"]["fine_tuned_path"] if version else MODEL_CONFIG["training"]["base_model_path"]
188
 
189
  tokenizer = AutoTokenizer.from_pretrained(
190
  model_path,
@@ -197,7 +197,7 @@ def get_model(
197
  device_map="auto" if device == "cuda" else None
198
  )
199
 
200
- return model, tokenizer, MODEL_CONFIG
201
 
202
  except Exception as e:
203
  logger.error(f"Error loading model: {str(e)}")
@@ -209,10 +209,10 @@ if __name__ == "__main__":
209
 
210
  # Register base model from config
211
  success, message = manager.register_model(
212
- model_id=MODEL_CONFIG["id"].split("/")[-1], # Extract model name from full HF path
213
- version=MODEL_CONFIG["type"],
214
- source=MODEL_CONFIG["id"],
215
- description=MODEL_CONFIG["description"],
216
  is_active=True
217
  )
218
  print(message)
 
9
  import logging
10
  from huggingface_hub import HfApi, snapshot_download
11
  from transformers import AutoModelForCausalLM, AutoTokenizer
12
+ from config.settings import MODEL_PATH, MODELS_REGISTRY_PATH, MODELS, ACTIVE_MODEL
13
 
14
  logging.basicConfig(
15
  level=logging.INFO,
 
184
  (model, tokenizer, model_info)
185
  """
186
  try:
187
+ model_path = ACTIVE_MODEL["training"]["fine_tuned_path"] if version else ACTIVE_MODEL["training"]["base_model_path"]
188
 
189
  tokenizer = AutoTokenizer.from_pretrained(
190
  model_path,
 
197
  device_map="auto" if device == "cuda" else None
198
  )
199
 
200
+ return model, tokenizer, ACTIVE_MODEL
201
 
202
  except Exception as e:
203
  logger.error(f"Error loading model: {str(e)}")
 
209
 
210
  # Register base model from config
211
  success, message = manager.register_model(
212
+ model_id=ACTIVE_MODEL["id"].split("/")[-1], # Extract model name from full HF path
213
+ version=ACTIVE_MODEL["type"],
214
+ source=ACTIVE_MODEL["id"],
215
+ description=ACTIVE_MODEL["description"],
216
  is_active=True
217
  )
218
  print(message)