Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -132,8 +132,15 @@ def loadKB(fileprovided, urlProvided, uploads_dir, request):
|
|
| 132 |
for file in request.files.getlist('files[]'):
|
| 133 |
print("File Received>>>" + file.filename)
|
| 134 |
file.save(os.path.join(uploads_dir, secure_filename(file.filename)))
|
| 135 |
-
loader = PyPDFLoader(os.path.join(uploads_dir, secure_filename(file.filename)))
|
| 136 |
-
documents.extend(loader.load())
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 137 |
else:
|
| 138 |
loader = TextLoader('Jio.txt')
|
| 139 |
documents.extend(loader.load())
|
|
|
|
| 132 |
for file in request.files.getlist('files[]'):
|
| 133 |
print("File Received>>>" + file.filename)
|
| 134 |
file.save(os.path.join(uploads_dir, secure_filename(file.filename)))
|
| 135 |
+
#loader = PyPDFLoader(os.path.join(uploads_dir, secure_filename(file.filename)))
|
| 136 |
+
#documents.extend(loader.load())
|
| 137 |
+
BASE_MODEL = "LLAMA-TOKENIZER"
|
| 138 |
+
savedModelPath = "./model/" + BASE_MODEL
|
| 139 |
+
global tokenizer
|
| 140 |
+
#tokenizer = LlamaTokenizer.from_pretrained(savedModelPath)
|
| 141 |
+
tokenizer = AutoTokenizer.from_pretrained("bert-base-cased")
|
| 142 |
+
separator = "</Q>"
|
| 143 |
+
documents.extend(PDFChunkerWithSeparator(os.path.join(uploads_dir, secure_filename(file.filename)),separator))
|
| 144 |
else:
|
| 145 |
loader = TextLoader('Jio.txt')
|
| 146 |
documents.extend(loader.load())
|