# src/app.py (commit 3340ad6) β€” Streamlit UI for the multimodal PDF RAG system
import streamlit as st
import os
from pathlib import Path
from pdf_parser import PDFParser
from vector_store import VectorStore
from rag_system import VisualMultimodalRAG
from config import UPLOAD_FOLDER, MAX_PDF_SIZE_MB
# Page-level chrome: wide canvas with the sidebar open on first load.
st.set_page_config(
    page_title="πŸ“„ Multimodal RAG LLM System (PDF Parsing)",
    initial_sidebar_state="expanded",
    layout="wide",
)
# One-time defaults for every st.session_state slot the app relies on.
# A dict + loop keeps the full list in one place instead of eleven
# near-identical `if key not in st.session_state` statements.
_SESSION_DEFAULTS = {
    'api_key_set': False,
    'api_key': None,
    'visual_rag_system': None,
    'vector_store': None,
    'parser': None,
    'current_document': None,
    'current_text': None,
    'current_images': None,
    'current_tables': None,
    'processing_results': None,
    'answering_rag': None,
}
for _key, _default in _SESSION_DEFAULTS.items():
    if _key not in st.session_state:
        st.session_state[_key] = _default

st.title("πŸ“„ Multimodal RAG LLM System (PDF Parsing)")
with st.sidebar:
    st.header("βš™οΈ Configuration")

    # --- OpenAI API key -------------------------------------------------
    st.subheader("πŸ”‘ OpenAI API Key")
    api_key = st.text_input(
        "Enter your OpenAI API key:",
        type="password",
        key="api_key_input"
    )
    if api_key:
        # BUGFIX: the old code only initialized the backend systems when
        # `visual_rag_system is None`, so pasting a *different* key after the
        # first one was silently ignored. Re-initialize whenever the key
        # changes.
        key_changed = st.session_state.api_key != api_key
        st.session_state.api_key = api_key
        st.session_state.api_key_set = True
        if st.session_state.visual_rag_system is None or key_changed:
            try:
                st.session_state.visual_rag_system = VisualMultimodalRAG(api_key=api_key, debug=True)
                st.session_state.vector_store = VectorStore()
                st.session_state.parser = PDFParser(debug=True)
                st.success("βœ… API Key set & systems initialized")
            except Exception as e:
                st.error(f"Error initializing systems: {e}")
    else:
        st.session_state.api_key_set = False
        st.warning("⚠️ Please enter your API key to continue")

    st.divider()

    # --- Vector store status --------------------------------------------
    st.subheader("πŸ“Š Vector Store Status")
    if st.session_state.vector_store:
        try:
            info = st.session_state.vector_store.get_collection_info()
            st.metric("Items in Store", info['count'])
            st.metric("Status", info['status'])
            st.caption(f"Path: {info['persist_path']}")
        except Exception as e:
            st.error(f"Error getting store info: {e}")
    else:
        st.info("Set API key to initialize vector store")

    st.divider()

    # --- Document management --------------------------------------------
    st.subheader("πŸ“ Document Management")
    if st.button("πŸ”„ Clear Vector Store"):
        if st.session_state.vector_store:
            try:
                st.session_state.vector_store.clear_all()
                st.success("βœ… Vector store cleared")
            except Exception as e:
                st.error(f"Error clearing store: {e}")
st.header("πŸ“€ Upload PDF Document")
uploaded_file = st.file_uploader(
    "Choose a PDF file",
    type=['pdf'],
    help="PDF with text, images, and tables"
)
if uploaded_file is not None:
    # BUGFIX: MAX_PDF_SIZE_MB was imported from config but never enforced.
    # Reject oversized uploads before writing them to disk.
    size_mb = uploaded_file.size / (1024 * 1024)
    if size_mb > MAX_PDF_SIZE_MB:
        st.error(f"❌ File too large: {size_mb:.1f} MB (max {MAX_PDF_SIZE_MB} MB)")
    else:
        upload_path = Path(UPLOAD_FOLDER)
        # parents=True: UPLOAD_FOLDER may be a nested path (e.g. "data/uploads")
        upload_path.mkdir(parents=True, exist_ok=True)
        file_path = upload_path / uploaded_file.name
        with open(file_path, 'wb') as f:
            f.write(uploaded_file.getbuffer())
        st.success(f"βœ… File saved: {uploaded_file.name}")
if st.button("πŸ” Parse PDF"):
if not st.session_state.api_key_set:
st.error("❌ Please set OpenAI API key first")
else:
try:
with st.spinner("πŸ“„ Parsing PDF..."):
print(f"\n{'='*70}")
print(f"PARSING: {uploaded_file.name}")
print(f"{'='*70}")
# Parse PDF - returns text, images, tables
parser = st.session_state.parser
text, images, tables = parser.parse_pdf(str(file_path))
# Store in session state
st.session_state.current_document = uploaded_file.name
st.session_state.current_text = text
st.session_state.current_images = images
st.session_state.current_tables = tables
# Display results
col1, col2, col3 = st.columns(3)
with col1:
st.metric("πŸ“ Text", f"{len(text):,} chars")
with col2:
st.metric("πŸ–ΌοΈ Images", len(images))
with col3:
st.metric("πŸ“‹ Tables", len(tables))
#if images:
# st.subheader("πŸ–ΌοΈ Extracted Images")
# for idx, img in enumerate(images):
# ocr_text = img.get('ocr_text', '')
# ocr_len = len(ocr_text)
#
# if ocr_len > 0:
# st.success(f"βœ… Image {idx}: {ocr_len} characters (OCR)")
# else:
# st.warning(f"⚠️ Image {idx}: No OCR text (will use visual analysis)")
st.success("βœ… PDF parsing complete!")
except Exception as e:
st.error(f"❌ Error parsing PDF: {e}")
print(f"Error: {e}")
st.divider()
st.header("πŸ–ΌοΈ Analysis & Storage")
if st.button("πŸ–ΌοΈ Analyze & Store Components"):
    if not st.session_state.api_key_set:
        st.error("❌ Please set OpenAI API key first")
    elif st.session_state.current_text is None:
        st.error("❌ Please parse a PDF document first")
    else:
        try:
            with st.spinner("πŸ–ΌοΈ Analyzing..."):
                banner = '=' * 70
                print(f"\n{banner}")
                print("VISUAL IMAGE ANALYSIS")
                print(f"{banner}")

                # Summarize/analyze text chunks, images, and tables, then
                # persist everything into the vector store under one doc id.
                results = st.session_state.visual_rag_system.process_and_store_document(
                    text=st.session_state.current_text,
                    images=st.session_state.current_images,
                    tables=st.session_state.current_tables,
                    vector_store=st.session_state.vector_store,
                    doc_id=st.session_state.current_document or "current_doc"
                )
                st.session_state.processing_results = results

                st.success("βœ… Visual analysis complete & stored!")

                # Per-modality counts, then the grand total stored.
                counts = [
                    ("πŸ–ΌοΈ Images Analyzed", len(results['image_visual_analyses'])),
                    ("πŸ“ Text Chunks", len(results['text_summaries'])),
                    ("πŸ“‹ Tables Analyzed", len(results['table_summaries'])),
                ]
                for column, (label, value) in zip(st.columns(3), counts):
                    with column:
                        st.metric(label, value)
                st.metric("πŸ“Š Total Stored in Vector", results['total_stored'])

                print("\nβœ… Analysis processing complete!")
        except Exception as e:
            st.error(f"❌ Error during analysis: {e}")
            print(f"Error: {e}")
st.divider()
st.header("❓ Ask Questions About Document")

# NOTE: the redundant `if 'answering_rag' not in st.session_state` re-init
# that used to live here was removed β€” the slot is already created in the
# session-state setup at the top of the script.
if st.session_state.api_key_set and st.session_state.answering_rag is None:
    # Local import keeps answering-model construction lazy until a key exists.
    from rag_system import AnsweringRAG
    st.session_state.answering_rag = AnsweringRAG(api_key=st.session_state.api_key, debug=True)

question = st.text_area(
    "Enter your question:",
    height=100,
    placeholder="What does the document say about...?"
)
if st.button("πŸ” Search & Generate Answer"):
if not st.session_state.api_key_set:
st.error("❌ Please set OpenAI API key first")
elif st.session_state.current_text is None:
st.error("❌ Please parse a PDF document first")
elif not question:
st.error("❌ Please enter a question")
else:
try:
with st.spinner("πŸ”„ Searching document and analyzing..."):
print(f"\n{'='*70}")
print(f"QUESTION: {question}")
print(f"{'='*70}")
store = st.session_state.vector_store
doc_name = st.session_state.current_document or "current_doc"
doc_data = {
'text': st.session_state.current_text,
'images': [],
'tables': []
}
store.add_documents(doc_data, doc_name)
search_results = store.search(question, n_results=5)
print(f"\nπŸ“Š Search Results Found: {len(search_results)}")
answering_rag = st.session_state.answering_rag
result = answering_rag.analyze_and_answer(question, search_results)
st.success("βœ… Analysis complete!")
st.subheader("πŸ“ Answer")
col1, col2, col3 = st.columns(3)
with col1:
st.metric("Confidence", f"{result['confidence'].upper()}")
with col2:
st.metric("Sources Used", result['sources_used'])
with col3:
if result['sources_used'] > 0:
st.metric("Avg Relevance", f"{sum(1-r.get('distance',0) for r in search_results)/len(search_results):.0%}")
st.write(result['answer'])
if st.checkbox("πŸ“š Show Source Documents"):
st.subheader("Sources Used in Answer")
for idx, source in enumerate(result['formatted_sources'], 1):
relevance = source['relevance']
relevance_bar = "β–ˆ" * int(relevance * 10) + "β–‘" * (10 - int(relevance * 10))
with st.expander(
f"Source {idx} - {source['type'].upper()} "
f"[{relevance_bar}] {relevance:.0%}"
):
st.write(source['content'])
print(f"\nβœ… Answer generation complete!")
except Exception as e:
st.error(f"❌ Error processing question: {e}")
print(f"Error: {e}")
st.divider()