FauzanAriyatmoko committed on
Commit
01768eb
·
1 Parent(s): 51c1726

refactor: Update `RecursiveCharacterTextSplitter` import to use `langchain_text_splitters` with a fallback to `langchain.text_splitter`.

Browse files
Files changed (2) hide show
  1. requirements.txt +1 -0
  2. utils/pdf_processor.py +4 -1
requirements.txt CHANGED
@@ -9,6 +9,7 @@ sentence-transformers>=2.2.2
9
  chromadb>=0.4.22
10
  langchain>=0.1.0
11
  langchain-community>=0.0.20
 
12
 
13
  # PDF Processing
14
  PyPDF2>=3.0.0
 
9
  chromadb>=0.4.22
10
  langchain>=0.1.0
11
  langchain-community>=0.0.20
12
+ langchain-text-splitters>=0.0.1
13
 
14
  # PDF Processing
15
  PyPDF2>=3.0.0
utils/pdf_processor.py CHANGED
@@ -5,7 +5,10 @@ import os
5
  from typing import List, Dict
6
  import PyPDF2
7
  import pdfplumber
8
- from langchain.text_splitter import RecursiveCharacterTextSplitter
 
 
 
9
  from config.model_config import config
10
 
11
  class PDFProcessor:
 
5
  from typing import List, Dict
6
  import PyPDF2
7
  import pdfplumber
8
+ try:
9
+ from langchain_text_splitters import RecursiveCharacterTextSplitter
10
+ except ImportError:
11
+ from langchain.text_splitter import RecursiveCharacterTextSplitter
12
  from config.model_config import config
13
 
14
  class PDFProcessor: