Spaces:

venkatchoudharyala
/

HeadLineGen

Runtime error

App Files Files Community

venkatchoudharyala committed on Apr 12, 2024

Commit

12cc604

verified ·

1 Parent(s): aa17f32

Upload 7 files

Browse files

Files changed (7) hide show

.streamlit/config.toml +3 -0
WebComponents/ArticleExtractor.py +26 -0
app.py +16 -0
packages.txt +4 -0
pages/Extraction.py +55 -0
pages/Final.py +16 -0
requirements.txt +9 -0

.streamlit/config.toml ADDED Viewed

	@@ -0,0 +1,3 @@

+[theme]
+base = "dark"
+font = "monospace"

WebComponents/ArticleExtractor.py ADDED Viewed

	@@ -0,0 +1,26 @@

+import pytesseract
+from PIL import Image
+from io import BytesIO
+#import easyocr
+# Function to perform OCR with Tesseract
+def ocr_with_tesseract(image):
+	# Perform OCR on the image using pytesseract
+	extracted_text = pytesseract.image_to_string(image)
+	return extracted_text
+# Function to perform OCR with EasyOCR
+'''
+def ocr_with_easyocr(image):
+	# Convert the image to bytes for easyocr
+	image_bytes = image.tobytes()
+	# Perform OCR on the image using easyocr
+	reader = easyocr.Reader(['en'])  # You can add other languages as needed
+	result = reader.readtext(image_bytes)
+	# Extract text from OCR result
+	extracted_text = [text[1] for text in result]
+	return extracted_text
+'''

app.py ADDED Viewed

	@@ -0,0 +1,16 @@

+import streamlit as st
+from headline_gen.Control import ServerInit
+import os
+import nltk
+def main():
+	#os.environ['JAVAHOME'] = 'usr/bin/java'
+	st.title("Abstract Page")
+	if "Server" not in st.session_state:
+		with st.spinner("Booting Server"):
+			st.session_state["Server"] = ServerInit("Start")
+	else:
+		if st.button("Upload Text"):
+			st.switch_page("pages/Extraction.py")
+if __name__ == "__main__":
+	main()

packages.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+tesseract-ocr
+tesseract-ocr-por
+default-jdk
+default-jre

pages/Extraction.py ADDED Viewed

	@@ -0,0 +1,55 @@

+import streamlit as st
+from WebComponents import ArticleExtractor as ocr
+from streamlit_cropper import st_cropper
+from PIL import Image
+st.set_page_config(layout="wide")
+def main():
+	tab1, tab2 = st.tabs(['Manual', 'OCR'])
+	if 'Questions' not in st.session_state:
+		st.session_state['Questions'] = []
+	st.session_state['Flag'] = False
+	with tab1:
+		with st.form("Manual", clear_on_submit = True):
+			Question = st.text_area("Question")
+			st.write(Question)
+			col1, col2 = st.columns(2)
+			with col1:
+				if st.form_submit_button("Reset"):
+					k = 0
+					#st.session_state['Questions'].append({"QuestionID": ID, "Question": Question})
+			with col2:
+				if st.form_submit_button("Generate HL"):
+					st.session_state['Questions'].append(Question)
+					st.switch_page("pages/Final.py")
+	with tab2:
+		if "file_uploader_key" not in st.session_state:
+			st.session_state["file_uploader_key"] = 0
+		Image_File = st.file_uploader("Upload the Image", type=['png', 'jpg'], key=st.session_state["file_uploader_key"],)
+		if Image_File:
+			col1, col2 = st.columns(2)
+			with col1:
+				img = Image.open(Image_File)
+				cropped_img = st_cropper(img, realtime_update = True, box_color = "#FF0012", aspect_ratio = (5, 2))
+			with col2:
+				st.write("Preview")
+				_ = cropped_img.thumbnail((580, 580))
+				st.image(cropped_img)
+				#if st.button("Extract"):
+				ExText = ocr.ocr_with_tesseract(cropped_img)
+			with st.form("OCR", clear_on_submit = True):
+				Question = st.text_area("Question", value = ExText)
+				col1, col2 = st.columns(2)
+				with col1:
+					if st.form_submit_button("Reset"):
+						st.session_state["file_uploader_key"] += 1
+						st.rerun()
+						#st.session_state['Questions'].append({"Question": Question})
+				with col2:
+					if st.form_submit_button("Generate HL"):
+						st.session_state['Questions'].append(Question)
+						st.switch_page("pages/Final.py")
+if __name__ == "__main__":
+	main()

pages/Final.py ADDED Viewed

	@@ -0,0 +1,16 @@

+import streamlit as st
+from headline_gen.Control import Generate
+def main():
+	if 'Questions' in st.session_state:
+		with st.spinner("Generating Head Line!!!"):
+			#st.subheader(st.session_state['Questions'][-1])
+			if 'Server' in st.session_state:
+				st.success(Generate(st.session_state['Questions'][-1], st.session_state["Server"]))
+			else:
+				st.error("Server is not Booted")
+	else:
+		st.error("Please Navigate back to Extraction Page and Upload your Article")
+if __name__ == "__main__":
+	main()

requirements.txt ADDED Viewed

	@@ -0,0 +1,9 @@

+streamlit-cropper
+pytesseract
+textacy
+regex
+nltk
+scipy==1.12.0
+gensim
+networkx
+headline-gen