Spaces:
Sleeping
Sleeping
File size: 1,495 Bytes
2728db4 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 | from dotenv import load_dotenv
import os
from pathlib import Path
import gradio as gr
from llama_index.embeddings.huggingface import HuggingFaceEmbedding
from llama_index.llms.groq import Groq
from llama_index.core import (
Settings,
VectorStoreIndex,
SimpleDirectoryReader,
StorageContext,
load_index_from_storage,
)
load_dotenv()
groq_key = os.getenv("GROQ_API_KEY")
assert groq_key, "GROQ_API_KEY not set in environment"
Settings.embed_model = HuggingFaceEmbedding(
model_name="sentence-transformers/all-MiniLM-L6-v2"
)
Settings.llm = Groq(
model="llama-3.1-8b-instant",
api_key=groq_key,
)
PERSIST_DIR = "storage"
if Path(PERSIST_DIR).exists():
storage_context = StorageContext.from_defaults(persist_dir=PERSIST_DIR)
index = load_index_from_storage(storage_context)
else:
documents = SimpleDirectoryReader("Data", recursive=True).load_data()
index = VectorStoreIndex.from_documents(documents, show_progress=True)
index.storage_context.persist(persist_dir=PERSIST_DIR)
query_engine = index.as_query_engine()
def ask(message: str, history: list[tuple[str, str]]):
question = message.strip()
if not question:
return "Please enter a question."
resp = query_engine.query(question)
return str(resp)
demo = gr.ChatInterface(
fn=ask,
title="Intel 64 & IA-32 Architecture Bot",
description="Ask questions based on the Intel Software Developer's Manual.",
)
if __name__ == "__main__":
demo.launch()
|