trlpop101 committed on
Commit
cf1f90b
·
verified ·
1 Parent(s): e434a03

Update src/streamlit_app.py

Browse files
Files changed (1) hide show
  1. src/streamlit_app.py +9 -10
src/streamlit_app.py CHANGED
@@ -26,16 +26,15 @@ import json
26
  from langchain.docstore.document import Document
27
  from langchain_groq import ChatGroq
28
 
29
- # PDF 문서로부터 텍스트를 추출하는 함수입니다.
30
  def get_pdf_text(pdf_docs):
31
- temp_dir = tempfile.TemporaryDirectory() # 임시 디렉토리를 생성합니다.
32
- temp_filepath = os.path.join(temp_dir.name, pdf_docs.name) # 임시 파일 경로를 생성합니다.
33
- with open(temp_filepath, "wb") as f: # 임시 파일을 바이너리 쓰기 모드로 엽니다.
34
- f.write(pdf_docs.getvalue()) # PDF 문서의 내용을 임시 파일에 씁니다.
35
- pdf_loader = PyPDFLoader(temp_filepath) # PyPDFLoader๋ฅผ ์‚ฌ์šฉํ•ด PDF๋ฅผ ๋กœ๋“œํ•ฉ๋‹ˆ๋‹ค.
36
- pdf_doc = pdf_loader.load() # 텍스트를 추출합니다.
37
- return pdf_doc # 추출한 텍스트를 반환합니다.
38
-
39
 
40
  # txt 파일로부터 text 추출
41
  def get_text_file(txt_docs):
@@ -44,7 +43,7 @@ def get_text_file(txt_docs):
44
  with open(temp_filepath, "wb") as f:
45
  f.write(txt_docs.getvalue())
46
  text_loader = TextLoader(temp_filepath)
47
- text_doc = text_loader.load()
48
  return text_doc
49
 
50
  # csv 파일로부터 text 추출
 
26
  from langchain.docstore.document import Document
27
  from langchain_groq import ChatGroq
28
 
29
+ # PDF 문서로부터 텍스트를 추출하는 함수
30
  def get_pdf_text(pdf_docs):
31
+ temp_dir = tempfile.TemporaryDirectory()
32
+ temp_filepath = os.path.join(temp_dir.name, pdf_docs.name)
33
+ with open(temp_filepath, "wb") as f:
34
+ f.write(pdf_docs.getvalue())
35
+ pdf_loader = PyPDFLoader(temp_filepath)
36
+ pdf_doc = pdf_loader.load()
37
+ return pdf_doc
 
38
 
39
  # txt 파일로부터 text 추출
40
  def get_text_file(txt_docs):
 
43
  with open(temp_filepath, "wb") as f:
44
  f.write(txt_docs.getvalue())
45
  text_loader = TextLoader(temp_filepath)
46
+ text_doc = text_loader.load()
47
  return text_doc
48
 
49
  # csv 파일로부터 text 추출