ShayanRl committed on
Commit
440b73f
·
verified ·
1 Parent(s): ffd8879

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +30 -2
app.py CHANGED
@@ -3,6 +3,27 @@ import io
3
  import requests
4
  import pdfplumber
5
  import os
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
 
7
  def fextractURL(pdf_path):
8
  extracted_data = ""
@@ -51,12 +72,19 @@ st.markdown(vert_space, unsafe_allow_html=True)
51
  st.write("Extract full text from PDF URL")
52
 
53
  pdfURL = st.text_input(label="PDF URL", value="", max_chars=None, key=None, type="default", help=None, autocomplete=None, on_change=None, args=None, kwargs=None, placeholder=None, disabled=False, label_visibility="visible")
 
54
  button = st.button(label='Extract', key=None, help=None, on_click=None, args=None, kwargs=None, type="secondary", disabled=False, use_container_width=False)
55
  extractedText = st.empty()
56
 
57
  if button:
58
  try:
59
  text = fextractURL(pdfURL)
60
- extractedText.text(text)
 
 
61
  except Exception as e:
62
- st.error(f"An error occurred: {str(e)}")
 
 
 
 
 
3
  import requests
4
  import pdfplumber
5
  import os
6
+ from transformers import AutoModelForQuestionAnswering, AutoTokenizer, pipeline
7
+
def AImodel(text, questionText):
    """Answer a question about ``text`` with an extractive QA model.

    Builds a Hugging Face ``question-answering`` pipeline for
    ``deepset/tinyroberta-squad2`` and runs it with ``questionText`` as the
    question and ``text`` as the context.

    Args:
        text: Context to search for the answer (in this app, the text
            extracted from the PDF).
        questionText: The question to ask about ``text``.

    Returns:
        The pipeline's result for the input, unchanged. Per the transformers
        documentation this is a dict with ``score``, ``start``, ``end`` and
        ``answer`` for a single question -- confirm against the installed
        transformers version.

    Raises:
        ValueError: If ``text`` or ``questionText`` is empty or contains only
            whitespace.
    """
    # Fail early with a readable message instead of an opaque pipeline error;
    # a scanned PDF or a blank question box both end up here.
    if not text or not text.strip():
        raise ValueError("No text to search: the context is empty.")
    if not questionText or not questionText.strip():
        raise ValueError("No question given: the question is empty.")

    model_name = "deepset/tinyroberta-squad2"

    # The pipeline loads both the model and the tokenizer from the name, so
    # no separate from_pretrained() calls are needed.
    # NOTE(review): the pipeline is rebuilt on every call; if this becomes
    # slow, consider caching it (e.g. with st.cache_resource) at the call site.
    nlp = pipeline('question-answering', model=model_name, tokenizer=model_name)
    QA_input = {
        'question': questionText,
        'context': text
    }
    return nlp(QA_input)
25
+
26
+
27
 
28
  def fextractURL(pdf_path):
29
  extracted_data = ""
 
# --- UI: fetch a PDF from a URL and answer a question about its text ---
st.write("Extract full text from PDF URL")

pdfURL = st.text_input(label="PDF URL", value="", max_chars=None, key=None, type="default", help=None, autocomplete=None, on_change=None, args=None, kwargs=None, placeholder=None, disabled=False, label_visibility="visible")
# This input must not share its label with the URL input above: with
# key=None, two otherwise identical text_input calls get the same
# auto-generated widget ID and Streamlit rejects the duplicate.
questionText = st.text_input(label="Question", value="", max_chars=None, key=None, type="default", help=None, autocomplete=None, on_change=None, args=None, kwargs=None, placeholder=None, disabled=False, label_visibility="visible")
button = st.button(label='Extract', key=None, help=None, on_click=None, args=None, kwargs=None, type="secondary", disabled=False, use_container_width=False)
# Placeholder that is filled with the model output once the button is pressed.
extractedText = st.empty()

if button:
    try:
        text = fextractURL(pdfURL)
        AItext = AImodel(text, questionText)
        extractedText.text(AItext)
    except Exception as e:
        # Top-level UI boundary: show any failure (download, PDF parsing,
        # model) to the user instead of crashing the app.
        st.error(f"An error occurred: {str(e)}")
87
+
88
+
89
+
90
+