Spaces:
Running
on
Zero
Running
on
Zero
jedick
committed on
Commit
·
26cf2c7
1
Parent(s):
555a40e
Use chromadb==0.6.3
Browse files
- app.py +1 -1
- data.py +3 -1
- requirements.txt +5 -2
- retriever.py +2 -2
app.py
CHANGED
|
@@ -472,7 +472,7 @@ with gr.Blocks(
|
|
| 472 |
"""Get multi-turn example questions based on compute mode"""
|
| 473 |
questions = [
|
| 474 |
"Lookup emails that reference bugs.r-project.org in 2025",
|
| 475 |
-
"Did
|
| 476 |
]
|
| 477 |
|
| 478 |
if compute_mode == "remote":
|
|
|
|
| 472 |
"""Get multi-turn example questions based on compute mode"""
|
| 473 |
questions = [
|
| 474 |
"Lookup emails that reference bugs.r-project.org in 2025",
|
| 475 |
+
"Did the cited authors report bugs before 2025?",
|
| 476 |
]
|
| 477 |
|
| 478 |
if compute_mode == "remote":
|
data.py
CHANGED
|
@@ -45,7 +45,9 @@ def download_data():
|
|
| 45 |
|
| 46 |
if not os.path.exists("db.zip"):
|
| 47 |
# For S3 (need AWS_ACCESS_KEY_ID and AWS_ACCESS_KEY_SECRET)
|
| 48 |
-
|
|
|
|
|
|
|
| 49 |
## For Dropbox (shared file - key is in URL)
|
| 50 |
# shared_link = "https://www.dropbox.com/scl/fi/jx90g5lorpgkkyyzeurtc/db.zip?rlkey=wvqa3p9hdy4rmod1r8yf2am09&st=l9tsam56&dl=0"
|
| 51 |
# output_filename = "db.zip"
|
|
|
|
| 45 |
|
| 46 |
if not os.path.exists("db.zip"):
|
| 47 |
# For S3 (need AWS_ACCESS_KEY_ID and AWS_ACCESS_KEY_SECRET)
|
| 48 |
+
# db_20250801.zip: chromadb==1.0.13
|
| 49 |
+
# db_20250801a.zip: chromadb==0.6.3
|
| 50 |
+
download_file_from_bucket("r-help-chat", "db_20250801a.zip", "db.zip")
|
| 51 |
## For Dropbox (shared file - key is in URL)
|
| 52 |
# shared_link = "https://www.dropbox.com/scl/fi/jx90g5lorpgkkyyzeurtc/db.zip?rlkey=wvqa3p9hdy4rmod1r8yf2am09&st=l9tsam56&dl=0"
|
| 53 |
# output_filename = "db.zip"
|
requirements.txt
CHANGED
|
@@ -1,6 +1,8 @@
|
|
| 1 |
# Pin torch and chroma versions
|
| 2 |
torch==2.5.1
|
| 3 |
-
chromadb==1.0.13
|
|
|
|
|
|
|
| 4 |
|
| 5 |
# Stated requirements:
|
| 6 |
# Gemma 3: transformers>=4.50
|
|
@@ -9,6 +11,7 @@ chromadb==1.0.13
|
|
| 9 |
# NOTE: Gemma 3 with transformers==4.54.0 gives:
|
| 10 |
# ValueError: Max cache length is not consistent across layers
|
| 11 |
transformers==4.51.3
|
|
|
|
| 12 |
# Required by langchain-huggingface
|
| 13 |
sentence-transformers==5.0.0
|
| 14 |
# For snapshot_download
|
|
@@ -17,7 +20,7 @@ huggingface-hub==0.34.3
|
|
| 17 |
# Langchain packages
|
| 18 |
langchain==0.3.26
|
| 19 |
langchain-core==0.3.72
|
| 20 |
-
langchain-chroma==0.2.
|
| 21 |
langchain-openai==0.3.27
|
| 22 |
langchain-community==0.3.27
|
| 23 |
langchain-huggingface==0.3.0
|
|
|
|
| 1 |
# Pin torch and chroma versions
|
| 2 |
torch==2.5.1
|
| 3 |
+
chromadb==0.6.3
|
| 4 |
+
# NOTE: chromadb==1.0.13 was giving intermittent error:
|
| 5 |
+
# ValueError('Could not connect to tenant default_tenant. Are you sure it exists?')
|
| 6 |
|
| 7 |
# Stated requirements:
|
| 8 |
# Gemma 3: transformers>=4.50
|
|
|
|
| 11 |
# NOTE: Gemma 3 with transformers==4.54.0 gives:
|
| 12 |
# ValueError: Max cache length is not consistent across layers
|
| 13 |
transformers==4.51.3
|
| 14 |
+
tokenizers==0.21.2
|
| 15 |
# Required by langchain-huggingface
|
| 16 |
sentence-transformers==5.0.0
|
| 17 |
# For snapshot_download
|
|
|
|
| 20 |
# Langchain packages
|
| 21 |
langchain==0.3.26
|
| 22 |
langchain-core==0.3.72
|
| 23 |
+
langchain-chroma==0.2.3
|
| 24 |
langchain-openai==0.3.27
|
| 25 |
langchain-community==0.3.27
|
| 26 |
langchain-huggingface==0.3.0
|
retriever.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
# Main retriever modules
|
| 2 |
from langchain_text_splitters import RecursiveCharacterTextSplitter
|
| 3 |
from langchain_community.document_loaders import TextLoader
|
|
|
|
| 4 |
|
| 5 |
-
# from langchain_chroma import Chroma
|
| 6 |
-
from mods.langchain_chroma import Chroma
|
| 7 |
from langchain.retrievers import ParentDocumentRetriever, EnsembleRetriever
|
| 8 |
from langchain_core.documents import Document
|
| 9 |
from langchain_core.retrievers import BaseRetriever, RetrieverLike
|
|
|
|
| 1 |
# Main retriever modules
|
| 2 |
from langchain_text_splitters import RecursiveCharacterTextSplitter
|
| 3 |
from langchain_community.document_loaders import TextLoader
|
| 4 |
+
from langchain_chroma import Chroma
|
| 5 |
|
| 6 |
+
# from mods.langchain_chroma import Chroma
|
|
|
|
| 7 |
from langchain.retrievers import ParentDocumentRetriever, EnsembleRetriever
|
| 8 |
from langchain_core.documents import Document
|
| 9 |
from langchain_core.retrievers import BaseRetriever, RetrieverLike
|