"""
Enhanced Streamlit GUI for Sign Language Detector
Modern, Professional File Processing Interface
"""
import streamlit as st
import cv2
import numpy as np
import os
import sys
import time
import threading
from PIL import Image
import tempfile
from typing import Optional, List, Dict, Any
import plotly.express as px
import plotly.graph_objects as go
from plotly.subplots import make_subplots
import pandas as pd
import base64
from io import BytesIO
import json
# Add src directory to path
sys.path.append(os.path.dirname(__file__))
from src.file_handler import FileHandler
from src.output_handler import OutputHandler
from src.hand_detector import HandDetector
from src.gesture_extractor import GestureExtractor
from src.openai_classifier import SignLanguageClassifier
from src.visualization_utils import HandLandmarkVisualizer, create_processing_timeline
from src.export_utils import ResultExporter
# Page configuration
st.set_page_config(
page_title="Sign Language Detector Pro",
page_icon="đ¤",
layout="wide",
initial_sidebar_state="expanded"
)
# Comprehensive CSS for optimal text visibility and professional design
st.markdown("""
""", unsafe_allow_html=True)
# Initialize session state
if 'file_handler' not in st.session_state:
st.session_state.file_handler = None
if 'output_handler' not in st.session_state:
st.session_state.output_handler = None
if 'detections' not in st.session_state:
st.session_state.detections = []
if 'transcript' not in st.session_state:
st.session_state.transcript = []
if 'processing_results' not in st.session_state:
st.session_state.processing_results = []
if 'current_file' not in st.session_state:
st.session_state.current_file = None
if 'visualizer' not in st.session_state:
st.session_state.visualizer = HandLandmarkVisualizer()
if 'exporter' not in st.session_state:
st.session_state.exporter = ResultExporter()
def initialize_components():
"""Initialize the application components."""
if st.session_state.file_handler is None:
st.session_state.file_handler = FileHandler()
if st.session_state.output_handler is None:
st.session_state.output_handler = OutputHandler(
enable_speech=False, # Disable speech in web interface
save_transcript=False # Handle transcript in session state
)
def create_header():
"""Create the main header with modern styling."""
st.markdown("""
đ¤ Sign Language Detector Pro
Advanced AI-Powered Gesture Recognition & Analysis
""", unsafe_allow_html=True)
def create_file_upload_area():
"""Create an enhanced file upload area with drag-and-drop styling."""
st.markdown("""
đ Upload Your Files
Drag and drop your images or videos here, or click to browse
Supported formats: JPG, PNG, BMP, MP4, AVI, MOV, MKV
""", unsafe_allow_html=True)
def create_metrics_dashboard(results: List[Dict[str, Any]]):
"""Create a metrics dashboard showing processing statistics."""
if not results:
return
# Calculate metrics
total_files = len(results)
successful_files = sum(1 for r in results if r.get('success', False))
total_hands = sum(r.get('hands_detected', 0) for r in results if r.get('success', False))
avg_confidence = 0
if successful_files > 0:
confidences = []
for result in results:
if result.get('success') and result.get('detections'):
for detection in result['detections']:
if 'confidence' in detection:
confidences.append(detection['confidence'])
avg_confidence = np.mean(confidences) if confidences else 0
# Display metrics in columns
col1, col2, col3, col4 = st.columns(4)
with col1:
st.markdown(f"""
{total_files}
Files Processed
""", unsafe_allow_html=True)
with col2:
st.markdown(f"""
{successful_files}
Successful
""", unsafe_allow_html=True)
with col3:
st.markdown(f"""
{total_hands}
Hands Detected
""", unsafe_allow_html=True)
with col4:
st.markdown(f"""
{avg_confidence:.1%}
Avg Confidence
""", unsafe_allow_html=True)
def create_confidence_chart(results: List[Dict[str, Any]], chart_key: str = "confidence_chart"):
"""Create a confidence score visualization."""
confidences = []
file_names = []
for result in results:
if result.get('success') and result.get('detections'):
for i, detection in enumerate(result['detections']):
if 'confidence' in detection:
confidences.append(detection['confidence'])
file_name = os.path.basename(result.get('file_path', 'Unknown'))
file_names.append(f"{file_name} - Hand {i+1}")
if confidences:
df = pd.DataFrame({
'File': file_names,
'Confidence': confidences
})
fig = px.bar(df, x='File', y='Confidence',
title='Hand Detection Confidence Scores',
color='Confidence',
color_continuous_scale='Viridis')
fig.update_layout(
xaxis_tickangle=-45,
height=400,
showlegend=False
)
st.plotly_chart(fig, use_container_width=True, key=chart_key)
def create_gesture_analysis_chart(results: List[Dict[str, Any]], chart_key: str = "gesture_analysis_chart"):
"""Create gesture analysis visualization."""
gesture_data = []
for result in results:
if result.get('success') and result.get('detections'):
for detection in result['detections']:
if 'classification' in detection and detection['classification'].get('success'):
classification = detection['classification']
gesture_data.append({
'File': os.path.basename(result.get('file_path', 'Unknown')),
'Hand': detection.get('hand_label', 'Unknown'),
'Letter': classification.get('letter', 'N/A'),
'Word': classification.get('word', 'N/A'),
'Confidence': classification.get('confidence', 0)
})
if gesture_data:
df = pd.DataFrame(gesture_data)
# Create subplots
fig = make_subplots(
rows=1, cols=2,
subplot_titles=('Letters Detected', 'Classification Confidence'),
specs=[[{"type": "pie"}, {"type": "histogram"}]]
)
# Letter distribution pie chart
letter_counts = df['Letter'].value_counts()
fig.add_trace(
go.Pie(labels=letter_counts.index, values=letter_counts.values, name="Letters"),
row=1, col=1
)
# Confidence histogram
fig.add_trace(
go.Histogram(x=df['Confidence'], name="Confidence", nbinsx=10),
row=1, col=2
)
fig.update_layout(height=400, showlegend=False)
st.plotly_chart(fig, use_container_width=True, key=chart_key)
def setup_ai_api():
"""Setup AI API key with automatic Gemini configuration."""
st.sidebar.markdown("### đ AI API Configuration")
# Use Gemini by default
default_gemini_key = "AIzaSyDd2BfvfgnVQFkGufpuD76QOsaPM3hWgxo"
# AI provider selection
ai_provider = st.sidebar.selectbox(
"AI Provider",
["Google Gemini (Recommended)", "OpenAI GPT"],
index=0,
help="Choose your AI provider for sign language classification"
)
use_gemini = "Gemini" in ai_provider
# Check if user wants to use a custom API key
use_custom_key = st.sidebar.checkbox("Use Custom API Key", value=False)
if use_custom_key:
if use_gemini:
api_key = st.sidebar.text_input(
"Custom Gemini API Key",
type="password",
help="Enter your custom Google Gemini API key",
placeholder="AIza..."
)
env_key = 'GEMINI_API_KEY'
else:
api_key = st.sidebar.text_input(
"Custom OpenAI API Key",
type="password",
help="Enter your custom OpenAI API key",
placeholder="sk-..."
)
env_key = 'OPENAI_API_KEY'
if api_key:
os.environ[env_key] = api_key
st.sidebar.success(f"â
Custom {ai_provider.split()[0]} API key configured")
return api_key, use_gemini
else:
st.sidebar.warning("â ī¸ Please enter your custom API key")
return None, use_gemini
else:
# Use default keys
if use_gemini:
os.environ['GEMINI_API_KEY'] = default_gemini_key
os.environ['USE_GEMINI'] = 'True'
st.sidebar.success("â
Gemini API configured automatically")
st.sidebar.info("đ Using Google Gemini for fast, accurate predictions")
return default_gemini_key, True
else:
# OpenAI fallback (will likely fail due to quota)
st.sidebar.warning("â ī¸ OpenAI quota may be exceeded")
st.sidebar.info("đĄ Recommend using Gemini for better reliability")
return None, False
def create_settings_panel():
"""Create an advanced settings panel."""
st.sidebar.markdown("### âī¸ Processing Settings")
# Detection confidence threshold
confidence_threshold = st.sidebar.slider(
"Detection Confidence Threshold",
min_value=0.1,
max_value=1.0,
value=0.7,
step=0.1,
help="Minimum confidence for hand detection"
)
# Maximum hands to detect
max_hands = st.sidebar.selectbox(
"Maximum Hands to Detect",
options=[1, 2, 3, 4],
index=1,
help="Maximum number of hands to detect per image"
)
# Video frame sampling
frame_skip = st.sidebar.slider(
"Video Frame Sampling",
min_value=1,
max_value=30,
value=5,
help="Process every Nth frame in videos (higher = faster processing)"
)
# Export options
st.sidebar.markdown("### đ Export Options")
export_format = st.sidebar.selectbox(
"Export Format",
options=["JSON", "CSV", "PDF Report"],
help="Choose format for exporting results"
)
return {
'confidence_threshold': confidence_threshold,
'max_hands': max_hands,
'frame_skip': frame_skip,
'export_format': export_format
}
def process_uploaded_files(uploaded_files: List, api_key: str, settings: Dict[str, Any], use_gemini: bool = True):
"""Process multiple uploaded files with progress tracking."""
if not uploaded_files:
return []
results = []
progress_bar = st.progress(0)
status_text = st.empty()
# Initialize file handler with settings
file_handler = FileHandler(
frame_skip=settings['frame_skip'],
max_frames=100
)
if api_key:
file_handler.initialize_classifier(api_key, use_gemini=use_gemini)
for i, uploaded_file in enumerate(uploaded_files):
# Update progress
progress = (i + 1) / len(uploaded_files)
progress_bar.progress(progress)
status_text.text(f"Processing {uploaded_file.name}... ({i+1}/{len(uploaded_files)})")
# Save uploaded file to temporary location
with tempfile.NamedTemporaryFile(delete=False, suffix=os.path.splitext(uploaded_file.name)[1]) as tmp_file:
tmp_file.write(uploaded_file.getvalue())
tmp_path = tmp_file.name
try:
# Determine file type and process
file_type = file_handler.get_file_type(tmp_path)
if file_type == 'image':
result = file_handler.process_image(tmp_path)
elif file_type == 'video':
result = file_handler.process_video(tmp_path)
else:
result = {'success': False, 'error': 'Unsupported file format'}
# Add filename to result
result['filename'] = uploaded_file.name
result['file_size'] = len(uploaded_file.getvalue())
results.append(result)
except Exception as e:
results.append({
'success': False,
'error': str(e),
'filename': uploaded_file.name,
'file_size': len(uploaded_file.getvalue())
})
finally:
# Clean up temporary file
try:
os.unlink(tmp_path)
except:
pass
progress_bar.empty()
status_text.empty()
return results
def create_image_with_landmarks(image_array: np.ndarray, hand_landmarks: List[Dict[str, Any]]) -> Image.Image:
"""Create an image with hand landmarks overlaid."""
# Convert to PIL Image for display
if len(image_array.shape) == 3 and image_array.shape[2] == 3:
# BGR to RGB conversion
image_rgb = cv2.cvtColor(image_array, cv2.COLOR_BGR2RGB)
else:
image_rgb = image_array
return Image.fromarray(image_rgb)
def display_image_results(result: Dict[str, Any]):
"""Display results for image processing with enhanced UI."""
if not result['success']:
st.error(f"â Error processing {result.get('filename', 'file')}: {result.get('error', 'Unknown error')}")
return
filename = result.get('filename', 'Unknown')
file_size = result.get('file_size', 0)
# Create result card
st.markdown(f"""
đ¸ {filename}
File Size: {file_size / 1024:.1f} KB | Hands Detected: {result['hands_detected']}
""", unsafe_allow_html=True)
if result['hands_detected'] > 0:
col1, col2 = st.columns([1, 1])
with col1:
st.subheader("đŧī¸ Processed Images")
# Create tabs for different views
img_tab1, img_tab2, img_tab3 = st.tabs(["đ Enhanced", "đ Comparison", "đ¯ 3D View"])
with img_tab1:
if 'enhanced_image' in result:
enhanced_img = create_image_with_landmarks(result['enhanced_image'], [])
st.image(enhanced_img, caption="Enhanced Hand Landmarks", use_container_width=True)
elif 'annotated_image' in result:
annotated_img = create_image_with_landmarks(result['annotated_image'], [])
st.image(annotated_img, caption="Hand Landmarks Detected", use_container_width=True)
with img_tab2:
if 'comparison_image' in result:
comparison_img = create_image_with_landmarks(result['comparison_image'], [])
st.image(comparison_img, caption="Before vs After Comparison", use_container_width=True)
with img_tab3:
# 3D visualization for first detected hand
if result['detections'] and 'landmarks_3d' in result['detections'][0]:
hand_data = {
'label': result['detections'][0]['hand_label'],
'landmarks': result['detections'][0]['landmarks_3d']
}
visualizer = st.session_state.visualizer
fig_3d = visualizer.create_3d_hand_plot(hand_data)
st.plotly_chart(fig_3d, use_container_width=True, key="3d_hand_plot")
else:
st.info("3D visualization requires hand landmark data")
with col2:
st.subheader("đ Detection Details")
for i, detection in enumerate(result['detections']):
with st.expander(f"â Hand {i+1}: {detection['hand_label']}", expanded=True):
# Confidence meter
confidence = detection['confidence']
st.metric("Detection Confidence", f"{confidence:.1%}")
# Progress bar for confidence
st.progress(confidence)
# Gesture description
st.text_area(
"Gesture Description",
detection['gesture_description'],
height=100,
disabled=True
)
# Classification results
if 'classification' in detection and detection['classification']['success']:
classification = detection['classification']
col_a, col_b = st.columns(2)
with col_a:
if classification.get('letter'):
st.success(f"đ¤ **Letter:** {classification['letter']}")
with col_b:
if classification.get('word'):
st.success(f"đ **Word:** {classification['word']}")
if classification.get('confidence'):
st.info(f"đ¯ **AI Confidence:** {classification['confidence']:.1%}")
def display_video_results(result: Dict[str, Any]):
"""Display results for video processing with enhanced UI."""
if not result['success']:
st.error(f"â Error processing {result.get('filename', 'file')}: {result.get('error', 'Unknown error')}")
return
filename = result.get('filename', 'Unknown')
file_size = result.get('file_size', 0)
video_props = result['video_properties']
# Create result card
st.markdown(f"""
đĨ {filename}
File Size: {file_size / (1024*1024):.1f} MB |
Duration: {video_props['duration']:.1f}s |
Total Hands: {result['total_hands_detected']}
""", unsafe_allow_html=True)
# Video metrics
col1, col2, col3, col4 = st.columns(4)
with col1:
st.metric("Total Frames", video_props['total_frames'])
with col2:
st.metric("Processed Frames", video_props['processed_frames'])
with col3:
st.metric("FPS", f"{video_props['fps']:.1f}")
with col4:
st.metric("Hands Found", result['total_hands_detected'])
# Frame-by-frame analysis
if result['frame_detections']:
st.subheader("đ Frame-by-Frame Analysis")
# Enhanced timeline visualization
timeline_fig = create_processing_timeline(result['frame_detections'])
st.plotly_chart(timeline_fig, use_container_width=True, key="video_timeline")
# Additional analysis charts
col_chart1, col_chart2 = st.columns(2)
with col_chart1:
# Confidence over time
confidence_data = []
for frame in result['frame_detections']:
for detection in frame['detections']:
if 'confidence' in detection:
confidence_data.append({
'Timestamp': frame['timestamp'],
'Confidence': detection['confidence'],
'Hand': detection['hand_label']
})
if confidence_data:
conf_df = pd.DataFrame(confidence_data)
fig_conf = px.scatter(conf_df, x='Timestamp', y='Confidence',
color='Hand', title='Detection Confidence Over Time')
st.plotly_chart(fig_conf, use_container_width=True, key="confidence_over_time")
with col_chart2:
# Hand distribution
hand_counts = {}
for frame in result['frame_detections']:
for detection in frame['detections']:
hand_label = detection.get('hand_label', 'Unknown')
hand_counts[hand_label] = hand_counts.get(hand_label, 0) + 1
if hand_counts:
fig_pie = px.pie(values=list(hand_counts.values()),
names=list(hand_counts.keys()),
title='Hand Distribution')
st.plotly_chart(fig_pie, use_container_width=True, key="hand_distribution")
# Detailed frame results
st.subheader("đ Detailed Frame Results")
# Show first 10 frames with detections
frames_to_show = [f for f in result['frame_detections'] if f['hands_detected'] > 0][:10]
for frame_data in frames_to_show:
with st.expander(f"âąī¸ Frame {frame_data['frame_number']} (t={frame_data['timestamp']:.1f}s)"):
for i, detection in enumerate(frame_data['detections']):
st.write(f"**â {detection['hand_label']} Hand {i+1}**")
if 'classification' in detection and detection['classification']['success']:
classification = detection['classification']
col_a, col_b, col_c = st.columns(3)
with col_a:
if classification.get('letter'):
st.info(f"Letter: **{classification['letter']}**")
with col_b:
if classification.get('word'):
st.info(f"Word: **{classification['word']}**")
with col_c:
if classification.get('confidence'):
st.info(f"Confidence: **{classification['confidence']:.1%}**")
# Sequence analysis
if result.get('sequence_analysis') and result['sequence_analysis'].get('success'):
st.subheader("đ Sequence Analysis")
sequence = result['sequence_analysis']
col1, col2 = st.columns(2)
with col1:
if sequence.get('word'):
st.success(f"đ¯ **Detected Word:** {sequence['word']}")
if sequence.get('sentence'):
st.success(f"đ **Detected Sentence:** {sequence['sentence']}")
with col2:
if sequence.get('individual_letters'):
letters_str = ' â '.join(sequence['individual_letters'])
st.info(f"đ¤ **Letter Sequence:** {letters_str}")
if sequence.get('confidence'):
st.metric("Sequence Confidence", f"{sequence['confidence']:.1%}")
def export_results(results: List[Dict[str, Any]], format_type: str):
"""Enhanced export functionality with multiple formats."""
if not results:
st.warning("No results to export")
return
exporter = st.session_state.exporter
timestamp = int(time.time())
col1, col2, col3 = st.columns(3)
with col1:
if st.button("đ Export JSON", use_container_width=True):
with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as tmp_file:
if exporter.export_to_json(results, tmp_file.name, include_metadata=True):
with open(tmp_file.name, 'r') as f:
json_data = f.read()
st.download_button(
label="đĨ Download JSON",
data=json_data,
file_name=f"sign_language_results_{timestamp}.json",
mime="application/json",
use_container_width=True
)
os.unlink(tmp_file.name)
else:
st.error("Failed to export JSON")
with col2:
if st.button("đ Export CSV", use_container_width=True):
with tempfile.NamedTemporaryFile(mode='w', suffix='.csv', delete=False) as tmp_file:
if exporter.export_to_csv(results, tmp_file.name):
with open(tmp_file.name, 'r') as f:
csv_data = f.read()
st.download_button(
label="đĨ Download CSV",
data=csv_data,
file_name=f"sign_language_results_{timestamp}.csv",
mime="text/csv",
use_container_width=True
)
os.unlink(tmp_file.name)
else:
st.error("Failed to export CSV")
with col3:
if st.button("đ Export PDF Report", use_container_width=True):
with tempfile.NamedTemporaryFile(suffix='.pdf', delete=False) as tmp_file:
if exporter.export_to_pdf(results, tmp_file.name, include_images=False):
with open(tmp_file.name, 'rb') as f:
pdf_data = f.read()
st.download_button(
label="đĨ Download PDF",
data=pdf_data,
file_name=f"sign_language_report_{timestamp}.pdf",
mime="application/pdf",
use_container_width=True
)
os.unlink(tmp_file.name)
else:
st.error("Failed to export PDF")
# Summary report
if st.button("đ Generate Summary Report", use_container_width=True):
summary = exporter.create_summary_report(results)
st.markdown("### đ Processing Summary")
col_a, col_b, col_c, col_d = st.columns(4)
with col_a:
st.metric("Total Files", summary['total_files'])
with col_b:
st.metric("Successful", summary['successful_files'])
with col_c:
st.metric("Failed", summary['failed_files'])
with col_d:
st.metric("Hands Detected", summary['total_hands_detected'])
if summary['detected_letters']:
st.markdown("#### đ¤ Most Common Letters")
letters_df = pd.DataFrame(list(summary['detected_letters'].items()),
columns=['Letter', 'Count'])
letters_df = letters_df.sort_values('Count', ascending=False)
fig = px.bar(letters_df.head(10), x='Letter', y='Count',
title='Top 10 Detected Letters')
st.plotly_chart(fig, use_container_width=True, key="top_letters_chart")
if summary['detected_words']:
st.markdown("#### đ Most Common Words")
words_df = pd.DataFrame(list(summary['detected_words'].items()),
columns=['Word', 'Count'])
words_df = words_df.sort_values('Count', ascending=False)
fig = px.bar(words_df.head(10), x='Word', y='Count',
title='Top 10 Detected Words')
st.plotly_chart(fig, use_container_width=True, key="top_words_chart")
def get_single_prediction(result: Dict[str, Any]) -> str:
"""
Extract a single, clear prediction from the result.
Args:
result: Processing result dictionary
Returns:
Single prediction string (letter, word, or "No prediction")
"""
if not result.get('success') or not result.get('detections'):
return "No prediction"
# Collect all predictions from all detected hands
letters = []
words = []
for detection in result['detections']:
if 'classification' in detection and detection['classification'].get('success'):
classification = detection['classification']
# Get letter prediction
if classification.get('letter') and classification['letter'] != 'N/A':
letters.append(classification['letter'])
# Get word prediction
if classification.get('word') and classification['word'] != 'N/A':
words.append(classification['word'])
# Priority: Word > Letter > No prediction
if words:
# Return the most confident word or the first word if multiple
return words[0].upper()
elif letters:
# Return the most confident letter or the first letter if multiple
return letters[0].upper()
else:
return "No prediction"
def display_single_prediction_card(result: Dict[str, Any]):
"""Display a single, clear prediction card for the result."""
filename = os.path.basename(result.get('file_path', 'Unknown'))
prediction = get_single_prediction(result)
# Determine card color based on prediction
if prediction == "No prediction":
card_color = "#E74C3C" # Red for no prediction
icon = "â"
confidence_text = ""
else:
card_color = "#27AE60" # Green for successful prediction
icon = "â
"
# Get confidence if available
confidence = 0.0
for detection in result.get('detections', []):
if 'classification' in detection and detection['classification'].get('success'):
conf = detection['classification'].get('confidence', 0)
if conf > confidence:
confidence = conf
confidence_text = f" (Confidence: {confidence:.1%})" if confidence > 0 else ""
# Display the prediction card
st.markdown(f"""
{icon} {prediction}
đ {filename}{confidence_text}
""", unsafe_allow_html=True)
def display_results(results: List[Dict[str, Any]]):
"""Display processing results with enhanced UI."""
if not results:
st.info("No results to display")
return
# Display Single Predictions First (Most Important)
st.markdown("## đ¯ **SIGN LANGUAGE PREDICTIONS**")
# Create a summary table of all predictions
prediction_data = []
for result in results:
filename = os.path.basename(result.get('file_path', 'Unknown'))
prediction = get_single_prediction(result)
# Get confidence
confidence = 0.0
for detection in result.get('detections', []):
if 'classification' in detection and detection['classification'].get('success'):
conf = detection['classification'].get('confidence', 0)
if conf > confidence:
confidence = conf
prediction_data.append({
'File': filename,
'Prediction': prediction,
'Confidence': f"{confidence:.1%}" if confidence > 0 else "N/A"
})
if prediction_data:
# Display as a clean table
import pandas as pd
df = pd.DataFrame(prediction_data)
st.dataframe(df, use_container_width=True, hide_index=True)
st.markdown("### Individual Prediction Cards")
# Show single prediction cards for each file
for result in results:
display_single_prediction_card(result)
# Add separator
st.markdown("---")
# Create metrics dashboard
create_metrics_dashboard(results)
# Create visualizations
col1, col2 = st.columns(2)
with col1:
create_confidence_chart(results, "main_confidence_chart")
with col2:
create_gesture_analysis_chart(results, "main_gesture_analysis_chart")
# Display individual results
st.markdown("## đ Detailed Analysis")
for result in results:
if result.get('file_type') == 'image':
display_image_results(result)
elif result.get('file_type') == 'video':
display_video_results(result)
else:
st.error(f"â Failed to process {result.get('filename', 'unknown file')}: {result.get('error', 'Unknown error')}")
def display_quick_summary(results: List[Dict[str, Any]]):
"""Display a quick summary of predictions at the top."""
if not results:
return
predictions = []
for result in results:
filename = os.path.basename(result.get('file_path', 'Unknown'))
prediction = get_single_prediction(result)
if prediction != "No prediction":
predictions.append(f"**{filename}** â **{prediction}**")
if predictions:
st.success("đ¯ **Quick Results:** " + " | ".join(predictions))
else:
st.warning("â ī¸ No clear predictions found in uploaded files")
def main():
"""Enhanced Streamlit application with modern UI."""
# Create header
create_header()
# Show quick summary if results exist
if st.session_state.processing_results:
display_quick_summary(st.session_state.processing_results)
# Initialize components
initialize_components()
# Sidebar configuration
st.sidebar.markdown("# đī¸ Control Panel")
# AI API setup
api_key, use_gemini = setup_ai_api()
# Settings panel
settings = create_settings_panel()
# Main content area
tab1, tab2, tab3 = st.tabs(["đ File Processing", "đ Analytics", "âšī¸ About"])
with tab1:
st.markdown("## đ File Processing")
# Enhanced file upload area
create_file_upload_area()
# Multiple file uploader
uploaded_files = st.file_uploader(
"Choose files",
type=['jpg', 'jpeg', 'png', 'bmp', 'mp4', 'avi', 'mov', 'mkv'],
accept_multiple_files=True,
help="Upload multiple images or videos for batch processing"
)
if uploaded_files:
st.success(f"â
{len(uploaded_files)} file(s) uploaded successfully")
# Show file details
with st.expander("đ File Details", expanded=True):
for file in uploaded_files:
file_size = len(file.getvalue())
st.write(f"âĸ **{file.name}** ({file_size / 1024:.1f} KB)")
# Process button
col1, col2, col3 = st.columns([1, 2, 1])
with col2:
if st.button("đ Process All Files", type="primary", use_container_width=True):
if not api_key:
st.error("â Please provide an OpenAI API key to analyze gestures")
else:
with st.spinner("đ Processing files..."):
results = process_uploaded_files(uploaded_files, api_key, settings, use_gemini)
st.session_state.processing_results = results
if results:
st.success(f"â
Processing complete! {len(results)} files processed.")
display_results(results)
# Export options
st.markdown("### đ¤ Export Results")
col_a, col_b = st.columns(2)
with col_a:
export_results(results, settings['export_format'])
with col_b:
if st.button("đī¸ Clear Results"):
st.session_state.processing_results = []
st.experimental_rerun()
# Display previous results if available
elif st.session_state.processing_results:
st.markdown("### đ Previous Results")
display_results(st.session_state.processing_results)
# Export options
st.markdown("### đ¤ Export Results")
col_a, col_b = st.columns(2)
with col_a:
export_results(st.session_state.processing_results, settings['export_format'])
with col_b:
if st.button("đī¸ Clear Results"):
st.session_state.processing_results = []
st.experimental_rerun()
with tab2:
st.markdown("## đ Analytics Dashboard")
if st.session_state.processing_results:
results = st.session_state.processing_results
# Overall statistics
st.markdown("### đ Overall Statistics")
create_metrics_dashboard(results)
# Detailed charts
st.markdown("### đ Detailed Analysis")
col1, col2 = st.columns(2)
with col1:
create_confidence_chart(results, "analytics_confidence_chart")
with col2:
create_gesture_analysis_chart(results, "analytics_gesture_analysis_chart")
# File processing timeline
st.markdown("### âąī¸ Processing Timeline")
if results:
timeline_data = []
for i, result in enumerate(results):
timeline_data.append({
'File': result.get('filename', f'File {i+1}'),
'Success': result.get('success', False),
'Hands': result.get('hands_detected', 0) if result.get('success') else 0,
'Size (KB)': result.get('file_size', 0) / 1024
})
df = pd.DataFrame(timeline_data)
fig = px.scatter(df, x='Size (KB)', y='Hands',
color='Success', size='Hands',
hover_data=['File'],
title='File Size vs Hands Detected')
st.plotly_chart(fig, use_container_width=True, key="file_size_scatter")
else:
st.info("đ No data available. Process some files to see analytics.")
with tab3:
st.markdown("## âšī¸ About Sign Language Detector Pro")
col1, col2 = st.columns(2)
with col1:
st.markdown("""
### đ¯ Features
- **Advanced File Processing**: Batch analysis of images and videos
- **AI-Powered Classification**: OpenAI API integration for accurate gesture recognition
- **Interactive Analytics**: Real-time charts and metrics
- **Multiple Export Formats**: JSON, CSV, and PDF reports
- **Professional UI**: Modern, responsive design
- **Comprehensive Analysis**: Hand landmarks, gesture features, and confidence scores
### đ§ How It Works
1. **Upload Files**: Drag and drop or select multiple files
2. **Hand Detection**: MediaPipe detects 21 hand landmarks
3. **Feature Extraction**: Advanced gesture analysis
4. **AI Classification**: OpenAI interprets gestures
5. **Results Display**: Interactive charts and detailed analysis
""")
with col2:
st.markdown("""
### đ Supported Formats
**Images:**
- JPG, JPEG, PNG, BMP
**Videos:**
- MP4, AVI, MOV, MKV
### âī¸ System Requirements
- Python 3.8+
- OpenAI API key
- Modern web browser
### đ Performance
- Batch processing support
- Optimized video frame sampling
- Real-time progress tracking
- Memory-efficient processing
""")
# System information
st.markdown("### đģ System Information")
info_col1, info_col2 = st.columns(2)
with info_col1:
st.info(f"**Python:** {sys.version.split()[0]}")
st.info(f"**OpenCV:** {cv2.__version__}")
with info_col2:
st.info(f"**Streamlit:** {st.__version__}")
api_status = "â
Configured" if api_key else "â Not configured"
st.info(f"**OpenAI API:** {api_status}")
# Enhanced footer with improved text visibility
st.markdown("---")
st.markdown("""
đ¤ Sign Language Detector Pro
Empowering communication through AI-powered gesture recognition
Built with â¤ī¸ using MediaPipe, OpenAI, and Streamlit
""", unsafe_allow_html=True)
if __name__ == "__main__":
main()