juliaturc committed on
Commit
3d780b8
·
1 Parent(s): 52c1352

Add Cohere reranker

Browse files
Files changed (2) hide show
  1. requirements.txt +7 -2
  2. sage/chat.py +9 -1
requirements.txt CHANGED
@@ -1,12 +1,17 @@
1
  GitPython==3.1.43
2
  Pygments==2.18.0
 
3
  fastapi==0.112.2
4
  gradio>=4.26.0
5
- langchain==0.2.14
6
- langchain-community==0.2.12
7
  langchain-anthropic==0.1.23
 
 
 
 
8
  langchain-ollama==0.1.2
9
  langchain-openai==0.1.22
 
10
  marqo==3.7.0
11
  nbformat==5.10.4
12
  openai==1.42.0
 
1
  GitPython==3.1.43
2
  Pygments==2.18.0
3
+ cohere==5.9.2
4
  fastapi==0.112.2
5
  gradio>=4.26.0
6
+ langchain==0.2.15
 
7
  langchain-anthropic==0.1.23
8
+ langchain-cohere==0.2.4
9
+ langchain-community==0.2.12
10
+ langchain-core==0.2.36
11
+ langchain-experimental==0.0.64
12
  langchain-ollama==0.1.2
13
  langchain-openai==0.1.22
14
+ langchain-text-splitters==0.2.2
15
  marqo==3.7.0
16
  nbformat==5.10.4
17
  openai==1.42.0
sage/chat.py CHANGED
@@ -1,9 +1,10 @@
1
  """A gradio app that enables users to chat with their codebase.
2
 
3
- You must run main.py first in order to index the codebase into a vector store.
4
  """
5
 
6
  import argparse
 
7
 
8
  import gradio as gr
9
  from dotenv import load_dotenv
@@ -11,6 +12,8 @@ from langchain.chains import create_history_aware_retriever, create_retrieval_ch
11
  from langchain.chains.combine_documents import create_stuff_documents_chain
12
  from langchain.schema import AIMessage, HumanMessage
13
  from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
 
 
14
 
15
  import sage.vector_store as vector_store
16
  from sage.llm import build_llm_via_langchain
@@ -21,7 +24,11 @@ load_dotenv()
21
  def build_rag_chain(args):
22
  """Builds a RAG chain via LangChain."""
23
  llm = build_llm_via_langchain(args.llm_provider, args.llm_model)
 
24
  retriever = vector_store.build_from_args(args).to_langchain().as_retriever()
 
 
 
25
 
26
  # Prompt to contextualize the latest query based on the chat history.
27
  contextualize_q_system_prompt = (
@@ -82,6 +89,7 @@ def main():
82
  default="http://localhost:8882",
83
  help="URL for the Marqo server. Required if using Marqo as embedder or vector store.",
84
  )
 
85
  parser.add_argument(
86
  "--share",
87
  default=False,
 
1
  """A gradio app that enables users to chat with their codebase.
2
 
3
+ You must run `sage-index $GITHUB_REPO` first in order to index the codebase into a vector store.
4
  """
5
 
6
  import argparse
7
+ import os
8
 
9
  import gradio as gr
10
  from dotenv import load_dotenv
 
12
  from langchain.chains.combine_documents import create_stuff_documents_chain
13
  from langchain.schema import AIMessage, HumanMessage
14
  from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
15
+ from langchain.retrievers import ContextualCompressionRetriever
16
+ from langchain_cohere import CohereRerank
17
 
18
  import sage.vector_store as vector_store
19
  from sage.llm import build_llm_via_langchain
 
24
  def build_rag_chain(args):
25
  """Builds a RAG chain via LangChain."""
26
  llm = build_llm_via_langchain(args.llm_provider, args.llm_model)
27
+
28
  retriever = vector_store.build_from_args(args).to_langchain().as_retriever()
29
+ if args.reranker == "cohere":
30
+ compressor = CohereRerank(model="rerank-english-v3.0", cohere_api_key=os.environ.get("COHERE_API_KEY"))
31
+ retriever = ContextualCompressionRetriever(base_compressor=compressor, base_retriever=retriever)
32
 
33
  # Prompt to contextualize the latest query based on the chat history.
34
  contextualize_q_system_prompt = (
 
89
  default="http://localhost:8882",
90
  help="URL for the Marqo server. Required if using Marqo as embedder or vector store.",
91
  )
92
+ parser.add_argument("--reranker", default="cohere", choices=["none", "cohere"])
93
  parser.add_argument(
94
  "--share",
95
  default=False,