WilliamGazeley
committed on
Commit
·
d5870e6
1
Parent(s):
183e5bc
Fix pydantic reserved var name collision
Browse files
- src/app.py +1 -0
- src/config.py +1 -1
- src/functioncall.py +2 -2
src/app.py
CHANGED
|
@@ -6,6 +6,7 @@ from utils import get_assistant_message
|
|
| 6 |
from functioncall import ModelInference
|
| 7 |
from prompter import PromptManager
|
| 8 |
|
|
|
|
| 9 |
|
| 10 |
@st.cache_resource(show_spinner="Loading model..")
|
| 11 |
def init_llm():
|
|
|
|
| 6 |
from functioncall import ModelInference
|
| 7 |
from prompter import PromptManager
|
| 8 |
|
| 9 |
+
print("Why, hello there!", flush=True)
|
| 10 |
|
| 11 |
@st.cache_resource(show_spinner="Loading model..")
|
| 12 |
def init_llm():
|
src/config.py
CHANGED
|
@@ -3,7 +3,7 @@ from pydantic_settings import BaseSettings
|
|
| 3 |
|
| 4 |
class Config(BaseSettings):
|
| 5 |
hf_token: str = Field(...)
|
| 6 |
-
|
| 7 |
headless: bool = Field(False, description="Run in headless mode.")
|
| 8 |
|
| 9 |
chat_template: str = Field("chatml", description="Chat template for prompt formatting")
|
|
|
|
| 3 |
|
| 4 |
class Config(BaseSettings):
|
| 5 |
hf_token: str = Field(...)
|
| 6 |
+
hf_model: str = Field("InvestmentResearchAI/LLM-ADE-dev")
|
| 7 |
headless: bool = Field(False, description="Run in headless mode.")
|
| 8 |
|
| 9 |
chat_template: str = Field("chatml", description="Chat template for prompt formatting")
|
src/functioncall.py
CHANGED
|
@@ -33,7 +33,7 @@ class ModelInference:
|
|
| 33 |
bnb_4bit_use_double_quant=True,
|
| 34 |
)
|
| 35 |
self.model = AutoModelForCausalLM.from_pretrained(
|
| 36 |
-
config.
|
| 37 |
trust_remote_code=True,
|
| 38 |
return_dict=True,
|
| 39 |
quantization_config=self.bnb_config,
|
|
@@ -42,7 +42,7 @@ class ModelInference:
|
|
| 42 |
device_map="auto",
|
| 43 |
)
|
| 44 |
|
| 45 |
-
self.tokenizer = AutoTokenizer.from_pretrained(config.
|
| 46 |
self.tokenizer.pad_token = self.tokenizer.eos_token
|
| 47 |
self.tokenizer.padding_side = "left"
|
| 48 |
|
|
|
|
| 33 |
bnb_4bit_use_double_quant=True,
|
| 34 |
)
|
| 35 |
self.model = AutoModelForCausalLM.from_pretrained(
|
| 36 |
+
config.hf_model,
|
| 37 |
trust_remote_code=True,
|
| 38 |
return_dict=True,
|
| 39 |
quantization_config=self.bnb_config,
|
|
|
|
| 42 |
device_map="auto",
|
| 43 |
)
|
| 44 |
|
| 45 |
+
self.tokenizer = AutoTokenizer.from_pretrained(config.hf_model, trust_remote_code=True)
|
| 46 |
self.tokenizer.pad_token = self.tokenizer.eos_token
|
| 47 |
self.tokenizer.padding_side = "left"
|
| 48 |
|