daniel-simeone committed on
Commit
b2be33e
·
1 Parent(s): 6b554cd

update to use correct paths on hg

Browse files
.gitignore CHANGED
@@ -1 +1,4 @@
1
  __pycache__/ingestion.cpython-312.pyc
 
 
 
 
1
  __pycache__/ingestion.cpython-312.pyc
2
+ *.pkl
3
+ *.pdf
4
+ *.faiss
app.py CHANGED
@@ -82,7 +82,7 @@ class RAGChatbot:
82
  self,
83
  model_name: str = "microsoft/DialoGPT-medium",
84
  embedding_model: str = "all-MiniLM-L6-v2",
85
- vector_store_path: str = "./vector_store"
86
  ):
87
  """
88
  Initialize the RAG chatbot.
 
82
  self,
83
  model_name: str = "microsoft/DialoGPT-medium",
84
  embedding_model: str = "all-MiniLM-L6-v2",
85
+ vector_store_path: str = "data/vector_store"
86
  ):
87
  """
88
  Initialize the RAG chatbot.
{pdfs → data/pdfs}/.gitkeep RENAMED
File without changes
ingest_documents.py CHANGED
@@ -8,7 +8,7 @@ from ingestion import DocumentIngestion
8
 
9
 
10
  # Configuration
11
- PDF_FOLDER = "./pdfs" # Folder containing PDF files
12
  URLS = [
13
  # Add your URLs here, one per line
14
  "https://www.ontario.ca/page/organic-crop-and-livestock-production-ontario"
 
8
 
9
 
10
  # Configuration
11
+ PDF_FOLDER = "data/pdfs" # Folder containing PDF files
12
  URLS = [
13
  # Add your URLs here, one per line
14
  "https://www.ontario.ca/page/organic-crop-and-livestock-production-ontario"
pdfs/P29-32-310-2020-eng.pdf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c4146268bf53ca2a958c4672767ece021c072b8a88fb70352d192103857e260
3
- size 2529910
 
 
 
 
vector_store/documents.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e501bec8852d7cfc615777d89c1d39a877480da7d3522ef165fc4124f98f819
3
- size 9722
 
 
 
 
vector_store/embeddings.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8880a7809837bbba93cd5d3f9a9ec2375dab0e08f1cbd17ede90dcb4ccd8eeb1
3
- size 15514
 
 
 
 
vector_store/index.faiss DELETED
Binary file (15.4 kB)