s4um1l committed on
Commit
13317bf
·
1 Parent(s): 2730edc

updating app.py

Browse files
Files changed (1) hide show
  1. app.py +32 -15
app.py CHANGED
@@ -40,17 +40,17 @@ HF_TOKEN = os.environ["HF_TOKEN"]
40
  3. Load HuggingFace Embeddings (remember to use the URL we set above)
41
  4. Index Files if they do not exist, otherwise load the vectorstore
42
  """
43
- ### 1. CREATE TEXT LOADER AND LOAD DOCUMENTS
44
- ### NOTE: PAY ATTENTION TO THE PATH THEY ARE IN.
45
- text_loader =
46
- documents =
47
 
48
- ### 2. CREATE TEXT SPLITTER AND SPLIT DOCUMENTS
49
- text_splitter =
50
- split_documents =
51
 
52
- ### 3. LOAD HUGGINGFACE EMBEDDINGS
53
- hf_embeddings =
 
 
 
54
 
55
  async def add_documents_async(vectorstore, documents):
56
  await vectorstore.aadd_documents(documents)
@@ -109,18 +109,35 @@ hf_retriever = asyncio.run(run())
109
  1. Define a String Template
110
  2. Create a Prompt Template from the String Template
111
  """
112
- ### 1. DEFINE STRING TEMPLATE
113
- RAG_PROMPT_TEMPLATE =
 
114
 
115
- ### 2. CREATE PROMPT TEMPLATE
116
- rag_prompt =
 
 
 
 
 
 
 
 
 
117
 
118
  # -- GENERATION -- #
119
  """
120
  1. Create a HuggingFaceEndpoint for the LLM
121
  """
122
- ### 1. CREATE HUGGINGFACE ENDPOINT FOR LLM
123
- hf_llm =
 
 
 
 
 
 
 
124
 
125
  @cl.author_rename
126
  def rename(original_author: str):
 
40
  3. Load HuggingFace Embeddings (remember to use the URL we set above)
41
  4. Index Files if they do not exist, otherwise load the vectorstore
42
  """
43
+ document_loader = TextLoader("./data/paul_graham_essays.txt")
44
+ documents = document_loader.load()
 
 
45
 
46
+ text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=30)
47
+ split_documents = text_splitter.split_documents(documents)
 
48
 
49
+ hf_embeddings = HuggingFaceEndpointEmbeddings(
50
+ model=HF_EMBED_ENDPOINT,
51
+ task="feature-extraction",
52
+ huggingfacehub_api_token=HF_TOKEN,
53
+ )
54
 
55
  async def add_documents_async(vectorstore, documents):
56
  await vectorstore.aadd_documents(documents)
 
109
  1. Define a String Template
110
  2. Create a Prompt Template from the String Template
111
  """
112
+ RAG_PROMPT_TEMPLATE = """\
113
+ <|start_header_id|>system<|end_header_id|>
114
+ You are a helpful assistant. You answer user questions based on provided context. If you can't answer the question with the provided context, say you don't know.<|eot_id|>
115
 
116
+ <|start_header_id|>user<|end_header_id|>
117
+ User Query:
118
+ {query}
119
+
120
+ Context:
121
+ {context}<|eot_id|>
122
+
123
+ <|start_header_id|>assistant<|end_header_id|>
124
+ """
125
+
126
+ rag_prompt = PromptTemplate.from_template(RAG_PROMPT_TEMPLATE)
127
 
128
  # -- GENERATION -- #
129
  """
130
  1. Create a HuggingFaceEndpoint for the LLM
131
  """
132
+ hf_llm = HuggingFaceEndpoint(
133
+ endpoint_url=HF_LLM_ENDPOINT,
134
+ max_new_tokens=512,
135
+ top_k=10,
136
+ top_p=0.95,
137
+ temperature=0.3,
138
+ repetition_penalty=1.15,
139
+ huggingfacehub_api_token=HF_TOKEN,
140
+ )
141
 
142
  @cl.author_rename
143
  def rename(original_author: str):