João Lima committed on
Commit
2f98627
·
1 Parent(s): 96dd173

Fix HF Spaces compatibility (models + langchain imports)

Browse files
Files changed (3) hide show
  1. app.py +1 -1
  2. config.py +2 -2
  3. rag/llm.py +1 -1
app.py CHANGED
@@ -36,4 +36,4 @@ with gr.Blocks(title="Tech Explainer RAG") as demo:
36
 
37
 
38
  if __name__ == "__main__":
39
- demo.launch(share=True)
 
36
 
37
 
38
  if __name__ == "__main__":
39
+ demo.launch()
config.py CHANGED
@@ -1,3 +1,3 @@
1
  EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
2
- PRIMARY_LLM = "mistralai/Mistral-7B-Instruct-v0.2"
3
- FALLBACK_LLM = "microsoft/phi-2"
 
1
  EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
2
+ PRIMARY_LLM = "google/gemma-2b-it"
3
+ FALLBACK_LLM = "microsoft/phi-2"
rag/llm.py CHANGED
@@ -7,7 +7,7 @@ def load_model():
7
  try:
8
  tokenizer = AutoTokenizer.from_pretrained(PRIMARY_LLM)
9
  model = AutoModelForCausalLM.from_pretrained(
10
- PRIMARY_LLM, device_map="auto", load_in_8bit=True
11
  )
12
  except Exception:
13
  tokenizer = AutoTokenizer.from_pretrained(FALLBACK_LLM, trust_remote_code=True)
 
7
  try:
8
  tokenizer = AutoTokenizer.from_pretrained(PRIMARY_LLM)
9
  model = AutoModelForCausalLM.from_pretrained(
10
+ PRIMARY_LLM, device_map="auto"
11
  )
12
  except Exception:
13
  tokenizer = AutoTokenizer.from_pretrained(FALLBACK_LLM, trust_remote_code=True)