Update chatbot_rag.py
chatbot_rag.py (+8 -6)
@@ -25,21 +25,23 @@ def build_qa():
 
     # 3. Load LLM (Flan-T5 small for lightweight QA)
     print("🔹 Loading LLM...")
-    model_id = "…"
+    model_id = "microsoft/Phi-3-mini-4k-instruct"
     tokenizer = AutoTokenizer.from_pretrained(model_id)
     model = AutoModelForSeq2SeqLM.from_pretrained(model_id)
 
     pipe = pipeline(
-        …
-        …
-        …
-        …
+        "text-generation",
+        model=model,
+        tokenizer=tokenizer,
+        max_new_tokens=300,
+        do_sample=True,  # Set to True to enable sampling and use temperature
+        temperature=0.2  # This is the temperature parameter
     )
     llm = HuggingFacePipeline(pipeline=pipe)
 
     # 4. QA Chain with retrieval
     print("🔹 Building RetrievalQA...")
-    retriever = vectorstore.as_retriever(…)
+    retriever = vectorstore.as_retriever()
 
     template = """
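
A note on the new model: microsoft/Phi-3-mini-4k-instruct is a decoder-only (causal) model, but the unchanged loading line still uses AutoModelForSeq2SeqLM, and the "# 3. Load LLM (Flan-T5 small for lightweight QA)" comment still describes the old model. The seq2seq auto-class cannot load a Phi-3 checkpoint, so the "text-generation" pipeline added here would fail at load time. A minimal sketch of the corrected loading step, assuming a transformers version with built-in Phi-3 support (older versions needed trust_remote_code=True):

# Sketch (not part of the commit): loading Phi-3-mini as a causal LM.
from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline

model_id = "microsoft/Phi-3-mini-4k-instruct"
tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(model_id)  # causal, not seq2seq

pipe = pipeline(
    "text-generation",
    model=model,
    tokenizer=tokenizer,
    max_new_tokens=300,
    do_sample=True,   # sampling must be enabled for temperature to take effect
    temperature=0.2,  # low temperature keeps answers close to the retrieved context
)

With do_sample=False the pipeline greedy-decodes and the temperature value is ignored, which is why the commit sets the two parameters together.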
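On the retriever change: calling as_retriever() with no arguments falls back to LangChain's defaults, i.e. plain similarity search returning the top 4 chunks. If the removed arguments were tuning the chunk count, the explicit equivalent would look like the sketch below (the k value is a hypothetical example, not taken from the commit; vectorstore is the store built earlier in the script):

# Sketch: explicit retriever settings; k=3 is a hypothetical value.
retriever = vectorstore.as_retriever(
    search_type="similarity",   # LangChain's default search type
    search_kwargs={"k": 3},     # how many chunks are passed to the LLM
)

A smaller k keeps the assembled prompt comfortably inside the model's 4k context window; a larger k gives the LLM more evidence at the cost of longer prompts.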