# odatalogparser / app.py
# Commit 113119c (pilotstuki): Fix slow request threshold not applying from UI
"""
IIS Log Analyzer - Streamlit Application
High-performance log analysis tool for large IIS log files (200MB-1GB+)
"""
import streamlit as st
import plotly.graph_objects as go
import plotly.express as px
from plotly.subplots import make_subplots
import pandas as pd
from pathlib import Path
import tempfile
from typing import List
import time
from log_parser import IISLogParser, LogAnalyzer, analyze_multiple_logs
# Page configuration — must run before any other Streamlit call.
st.set_page_config(
    page_title="IIS Log Analyzer",
    page_icon="📊",
    layout="wide",
    initial_sidebar_state="expanded",
)

# Custom CSS: colored "card" classes used to style metric containers.
_CUSTOM_CSS = """
<style>
    .metric-card {
        background-color: #f0f2f6;
        padding: 20px;
        border-radius: 10px;
        margin: 10px 0;
    }
    .error-metric {
        background-color: #ffebee;
    }
    .success-metric {
        background-color: #e8f5e9;
    }
    .warning-metric {
        background-color: #fff3e0;
    }
</style>
"""
st.markdown(_CUSTOM_CSS, unsafe_allow_html=True)
def format_number(num: int) -> str:
    """Render *num* with comma thousand separators, e.g. 1234567 -> '1,234,567'."""
    return format(num, ",")
def create_summary_table(stats: dict) -> pd.DataFrame:
    """Build the two-column Metric/Value summary table for the Summary tab.

    Args:
        stats: Summary dict (produced by the analyzer) with keys
            ``total_requests_before``, ``excluded_requests``,
            ``total_requests_after``, ``errors``, ``slow_requests``,
            ``peak_rps``, ``peak_timestamp``, ``avg_time_ms``,
            ``max_time_ms``, ``min_time_ms`` and optionally
            ``slow_threshold`` (milliseconds, defaults to 3000).

    Returns:
        pd.DataFrame with columns "Metric" and "Value"; counts are
        thousand-separated strings, missing peak timestamp shows as "N/A".
    """
    threshold_ms = stats.get("slow_threshold", 3000)
    # Bug fix: the original conditional had two identical branches, so
    # thresholds of 1000ms and above were never displayed in seconds.
    if threshold_ms >= 1000:
        threshold_display = f">{threshold_ms / 1000:g}s"
    else:
        threshold_display = f">{threshold_ms}ms"

    def _fmt(n: int) -> str:
        # Thousand separators for readability (e.g. 1234567 -> "1,234,567").
        return f"{n:,}"

    data = {
        "Metric": [
            "Total Requests (before filtering)",
            "Excluded Requests (HEAD+Zabbix + 401)",
            "Processed Requests",
            "Errors (≠200, ≠401)",
            f"Slow Requests ({threshold_display})",
            "Peak RPS",
            "Peak Timestamp",
            "Avg Response Time (ms)",
            "Max Response Time (ms)",
            "Min Response Time (ms)",
        ],
        "Value": [
            _fmt(stats["total_requests_before"]),
            _fmt(stats["excluded_requests"]),
            _fmt(stats["total_requests_after"]),
            _fmt(stats["errors"]),
            _fmt(stats["slow_requests"]),
            _fmt(stats["peak_rps"]),
            stats["peak_timestamp"] or "N/A",  # None -> "N/A" placeholder
            _fmt(stats["avg_time_ms"]),
            _fmt(stats["max_time_ms"]),
            _fmt(stats["min_time_ms"]),
        ],
    }
    return pd.DataFrame(data)
def create_response_time_chart(dist: dict, title: str) -> go.Figure:
    """Bar chart of request counts per response-time bucket.

    Args:
        dist: Mapping of bucket label -> request count (insertion order kept).
        title: Chart title.
    """
    buckets = list(dist)
    counts = [dist[b] for b in buckets]
    bar = go.Bar(
        x=buckets,
        y=counts,
        marker_color='lightblue',
        text=counts,
        textposition='auto',
    )
    fig = go.Figure(data=[bar])
    fig.update_layout(
        title=title,
        xaxis_title="Response Time Range",
        yaxis_title="Request Count",
        height=400,
        showlegend=False,
    )
    return fig
def create_top_methods_chart(methods: List[dict], title: str) -> go.Figure:
    """Side-by-side bars: per-method request count and average response time.

    Args:
        methods: Records with keys ``method_name``, ``count``, ``avg_time``.
        title: Overall figure title.

    Returns:
        Two-subplot Plotly figure; empty figure when *methods* is empty.
    """
    if not methods:
        return go.Figure()
    df = pd.DataFrame(methods)
    fig = make_subplots(
        rows=1, cols=2,
        subplot_titles=("Request Count", "Avg Response Time (ms)"),
    )
    # (column index, y-values, trace name, bar color) for each panel.
    panels = (
        (1, df["count"], "Count", 'steelblue'),
        (2, df["avg_time"].round(1), "Avg Time", 'coral'),
    )
    for col, values, label, color in panels:
        fig.add_trace(
            go.Bar(
                x=df["method_name"],
                y=values,
                name=label,
                marker_color=color,
                text=values,
                textposition='auto',
            ),
            row=1, col=col,
        )
    fig.update_layout(title_text=title, height=400, showlegend=False)
    return fig
def create_metrics_comparison(individual_stats: List[dict]) -> go.Figure:
    """Three-panel comparison across services: volume, errors, avg latency.

    Args:
        individual_stats: Per-service stats dicts, each with a ``summary``
            dict providing ``service_name``, ``total_requests_after``,
            ``errors`` and ``avg_time_ms``.
    """
    summaries = [s["summary"] for s in individual_stats]
    services = [s["service_name"] for s in summaries]
    fig = make_subplots(
        rows=1, cols=3,
        subplot_titles=("Processed Requests", "Errors", "Avg Response Time (ms)"),
        specs=[[{"type": "bar"}, {"type": "bar"}, {"type": "bar"}]],
    )
    # (summary key, bar color, subplot column) for each comparison panel.
    panels = (
        ("total_requests_after", 'lightblue', 1),
        ("errors", 'salmon', 2),
        ("avg_time_ms", 'lightgreen', 3),
    )
    for key, color, col in panels:
        values = [s[key] for s in summaries]
        fig.add_trace(
            go.Bar(x=services, y=values, marker_color=color, text=values, textposition='auto'),
            row=1, col=col,
        )
    fig.update_layout(
        title_text="Service Comparison",
        height=400,
        showlegend=False,
    )
    return fig
def process_log_file(file_path: str, service_name: str = None, slow_threshold: int = 3000) -> dict:
    """Parse and analyze a single IIS log file.

    Args:
        file_path: Path to the log file on disk.
        service_name: Optional override for the service name inferred by the
            parser; falsy values leave the parser's own name in place.
        slow_threshold: Response-time threshold in milliseconds above which a
            request is counted as slow.

    Returns:
        Dict with the analysis results ("summary", "top_methods",
        "error_breakdown", "errors_by_method", "response_time_dist") plus the
        live "analyzer" instance for detailed drill-down queries, or None when
        the file contains no valid log entries.
    """
    parser = IISLogParser(file_path)
    if service_name:
        parser.service_name = service_name
    with st.spinner(f"Parsing {Path(file_path).name}..."):
        df = parser.parse()
    # df.height == 0: the parsed frame has no rows, so there is nothing to analyze.
    if df.height == 0:
        st.error(f"No valid log entries found in {Path(file_path).name}")
        return None
    with st.spinner(f"Analyzing {parser.service_name}..."):
        # Forward the UI-selected threshold so it actually applies to the analysis.
        analyzer = LogAnalyzer(df, parser.service_name, slow_threshold)
        stats = {
            "summary": analyzer.get_summary_stats(),
            "top_methods": analyzer.get_top_methods(),
            "error_breakdown": analyzer.get_error_breakdown(),
            "errors_by_method": analyzer.get_errors_by_method(n=10),
            "response_time_dist": analyzer.get_response_time_distribution(),
            "analyzer": analyzer,  # Keep reference for detailed error queries
        }
    return stats
def main():
    """Streamlit entry point: sidebar configuration, per-file analysis, comparison view.

    Flow: render sidebar controls -> persist uploads to temp files -> run
    process_log_file per file and show metrics/tabs -> optional multi-service
    comparison -> clean up temp files. With no uploads, shows a welcome screen.
    """
    st.title("📊 IIS Log Performance Analyzer")
    st.markdown("High-performance analysis tool for large IIS log files (up to 1GB+)")
    # Sidebar
    st.sidebar.header("Configuration")
    # File upload mode
    upload_mode = st.sidebar.radio(
        "Upload Mode",
        ["Single File", "Multiple Files"],
        help="Analyze one or multiple log files"
    )
    # File uploader — both branches normalize to a list of uploaded files.
    if upload_mode == "Single File":
        uploaded_files = st.sidebar.file_uploader(
            "Upload IIS Log File",
            type=["log", "txt"],
            help="Upload IIS W3C Extended format log file"
        )
        # Wrap the single upload in a list so the processing loop below is uniform.
        uploaded_files = [uploaded_files] if uploaded_files else []
    else:
        uploaded_files = st.sidebar.file_uploader(
            "Upload IIS Log Files",
            type=["log", "txt"],
            accept_multiple_files=True,
            help="Upload multiple IIS log files for comparison"
        )
    # Analysis options
    st.sidebar.header("Analysis Options")
    show_top_n = st.sidebar.slider("Top N Methods", 3, 20, 5)
    # Threshold (ms) is passed through to process_log_file so the UI value applies.
    slow_threshold = st.sidebar.number_input(
        "Slow Request Threshold (ms)",
        min_value=100,
        max_value=10000,
        value=3000,
        step=100
    )
    # Process files
    if uploaded_files:
        st.info(f"Processing {len(uploaded_files)} file(s)...")
        # Save uploaded files to temp directory
        # (delete=False: files must outlive the `with`; removed explicitly below)
        temp_files = []
        for uploaded_file in uploaded_files:
            with tempfile.NamedTemporaryFile(delete=False, suffix=".log") as tmp:
                tmp.write(uploaded_file.getvalue())
                temp_files.append(tmp.name)
        start_time = time.time()
        # Process each file
        all_stats = []
        for i, temp_file in enumerate(temp_files):
            file_name = uploaded_files[i].name
            st.subheader(f"📄 {file_name}")
            stats = process_log_file(temp_file, None, slow_threshold)
            # stats is None when the file held no valid entries; skip its UI then.
            if stats:
                all_stats.append(stats)
                # Display summary metrics
                col1, col2, col3, col4 = st.columns(4)
                with col1:
                    st.metric(
                        "Total Requests",
                        format_number(stats["summary"]["total_requests_after"])
                    )
                with col2:
                    st.metric(
                        "Errors",
                        format_number(stats["summary"]["errors"]),
                        delta=None,
                        delta_color="inverse"
                    )
                with col3:
                    st.metric(
                        "Avg Time (ms)",
                        format_number(stats["summary"]["avg_time_ms"])
                    )
                with col4:
                    st.metric(
                        "Peak RPS",
                        format_number(stats["summary"]["peak_rps"])
                    )
                # Tabs for detailed analysis
                tab1, tab2, tab3, tab4, tab5 = st.tabs([
                    "Summary", "Top Methods", "Response Time", "Error Breakdown", "Errors by Method"
                ])
                with tab1:
                    st.dataframe(
                        create_summary_table(stats["summary"]),
                        hide_index=True,
                        use_container_width=True
                    )
                with tab2:
                    if stats["top_methods"]:
                        st.plotly_chart(
                            create_top_methods_chart(
                                stats["top_methods"][:show_top_n],
                                f"Top {show_top_n} Methods - {stats['summary']['service_name']}"
                            ),
                            use_container_width=True
                        )
                        # Show table
                        methods_df = pd.DataFrame(stats["top_methods"][:show_top_n])
                        methods_df["avg_time"] = methods_df["avg_time"].round(1)
                        st.dataframe(methods_df, hide_index=True, use_container_width=True)
                    else:
                        st.info("No method data available")
                with tab3:
                    if stats["response_time_dist"]:
                        st.plotly_chart(
                            create_response_time_chart(
                                stats["response_time_dist"],
                                f"Response Time Distribution - {stats['summary']['service_name']}"
                            ),
                            use_container_width=True
                        )
                    else:
                        st.info("No response time distribution data")
                with tab4:
                    if stats["error_breakdown"]:
                        error_df = pd.DataFrame(stats["error_breakdown"])
                        error_df.columns = ["Status Code", "Count"]
                        st.dataframe(error_df, hide_index=True, use_container_width=True)
                        # Pie chart
                        fig = px.pie(
                            error_df,
                            values="Count",
                            names="Status Code",
                            title=f"Error Distribution - {stats['summary']['service_name']}"
                        )
                        st.plotly_chart(fig, use_container_width=True)
                    else:
                        st.success("No errors found! ✓")
                with tab5:
                    st.markdown("### 🔍 Errors by Method")
                    st.markdown("This view shows which specific methods are causing errors, with full context for debugging.")
                    if stats["errors_by_method"]:
                        # Display summary table
                        errors_method_df = pd.DataFrame(stats["errors_by_method"])
                        errors_method_df["error_rate_percent"] = errors_method_df["error_rate_percent"].round(2)
                        errors_method_df["avg_response_time_ms"] = errors_method_df["avg_response_time_ms"].round(1)
                        # Rename columns for better display
                        errors_method_df.columns = [
                            "Method Path", "Total Calls", "Error Count",
                            "Most Common Error", "Avg Response Time (ms)", "Error Rate (%)"
                        ]
                        st.dataframe(errors_method_df, hide_index=True, use_container_width=True)
                        # Bar chart of top error-prone methods
                        fig = go.Figure()
                        fig.add_trace(go.Bar(
                            x=errors_method_df["Method Path"],
                            y=errors_method_df["Error Count"],
                            marker_color='red',
                            text=errors_method_df["Error Count"],
                            textposition='auto',
                            name="Error Count"
                        ))
                        fig.update_layout(
                            title=f"Top Error-Prone Methods - {stats['summary']['service_name']}",
                            xaxis_title="Method Path",
                            yaxis_title="Error Count",
                            height=400,
                            showlegend=False
                        )
                        st.plotly_chart(fig, use_container_width=True)
                        # Allow users to drill down into specific methods
                        st.markdown("#### 🔎 Detailed Error Logs")
                        # key is per-file so each file's selectbox keeps its own state.
                        selected_method = st.selectbox(
                            "Select a method to view detailed error logs:",
                            options=["All"] + errors_method_df["Method Path"].tolist(),
                            key=f"method_select_{file_name}"
                        )
                        if selected_method and selected_method != "All":
                            error_details = stats["analyzer"].get_error_details(
                                method_path=selected_method,
                                limit=50
                            )
                            if error_details:
                                details_df = pd.DataFrame(error_details)
                                st.dataframe(details_df, hide_index=True, use_container_width=True)
                                st.info(f"Showing up to 50 most recent errors for {selected_method}")
                            else:
                                st.info(f"No error details found for {selected_method}")
                        elif selected_method == "All":
                            error_details = stats["analyzer"].get_error_details(limit=50)
                            if error_details:
                                details_df = pd.DataFrame(error_details)
                                st.dataframe(details_df, hide_index=True, use_container_width=True)
                                st.info("Showing up to 50 most recent errors across all methods")
                    else:
                        st.success("No errors found in any methods! ✓")
            st.divider()
        # Multi-file comparison — only shown when at least two files analyzed.
        if len(all_stats) > 1:
            st.header("📊 Service Comparison")
            st.plotly_chart(
                create_metrics_comparison(all_stats),
                use_container_width=True
            )
            # Combined summary
            combined = {
                "total_requests_before": sum(s["summary"]["total_requests_before"] for s in all_stats),
                "excluded_requests": sum(s["summary"]["excluded_requests"] for s in all_stats),
                "total_requests_after": sum(s["summary"]["total_requests_after"] for s in all_stats),
                "errors": sum(s["summary"]["errors"] for s in all_stats),
                "slow_requests": sum(s["summary"]["slow_requests"] for s in all_stats),
            }
            st.subheader("Combined Statistics")
            col1, col2, col3 = st.columns(3)
            with col1:
                st.metric("Total Requests (All Services)", format_number(combined["total_requests_after"]))
            with col2:
                st.metric("Total Errors (All Services)", format_number(combined["errors"]))
            with col3:
                st.metric("Total Slow Requests (All Services)", format_number(combined["slow_requests"]))
        processing_time = time.time() - start_time
        st.success(f"✓ Analysis completed in {processing_time:.2f} seconds")
        # Clean up temp files
        for temp_file in temp_files:
            Path(temp_file).unlink(missing_ok=True)
    else:
        # Welcome screen
        st.info("👆 Upload one or more IIS log files to begin analysis")
        st.markdown("""
        ### Features
        - ⚡ **Fast processing** of large files (200MB-1GB+) using Polars
        - 📊 **Comprehensive metrics**: RPS, response times, error rates
        - 🔍 **Detailed analysis**: Top methods, error breakdown, time distribution
        - 📈 **Visual reports**: Interactive charts with Plotly
        - 🔄 **Multi-file support**: Compare multiple services side-by-side
        ### Log Format
        This tool supports **IIS W3C Extended Log Format** with the following fields:
        ```
        date time s-ip cs-method cs-uri-stem cs-uri-query s-port cs-username
        c-ip cs(User-Agent) cs(Referer) sc-status sc-substatus sc-win32-status time-taken
        ```
        ### Filtering Rules
        - Excludes lines with both `HEAD` method and `Zabbix` in User-Agent
        - 401 Unauthorized responses are excluded from error counts
        - Errors are defined as status codes ≠ 200 and ≠ 401
        - Slow requests are those with response time > 3000ms (configurable)
        """)
if __name__ == "__main__":
main()