InteractiveImageMosaicGenerator / analyze_metrics.py
VanKee's picture
complete the project with additional analyze metric, create comparisons. Update requirements.txt
25e074b
#!/usr/bin/env python3
"""
Parameter behavior analysis for mosaic generator
Focuses on: parameter degradation effects, CIFAR comparison, cross-image consistency
Analyzes three images: akaza, IMG_5090, IMG_6914
"""
import json
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from pathlib import Path
import re
from collections import defaultdict
import warnings
warnings.filterwarnings('ignore')
# Configuration
METRICS_DIR = Path('./output/test_result/metrics')
OUTPUT_DIR = Path('./output/analysis')
TARGET_IMAGES = ['akaza', 'IMG_3378', 'IMG_5090', 'IMG_6914']
# Visualization settings
plt.style.use('default')
sns.set_palette("husl")
def setup_directories():
"""Create analysis output directories"""
OUTPUT_DIR.mkdir(parents=True, exist_ok=True)
for image in TARGET_IMAGES:
(OUTPUT_DIR / image).mkdir(parents=True, exist_ok=True)
print(f"[INFO] Created analysis directories under {OUTPUT_DIR}")
def parse_filename(filename):
"""Parse filename to extract parameters"""
# Pattern: {image}-min{min}-max{max}-sub{sub}-quant{quant}-{tile}_metrics.json
pattern = r'(.+)-min(\d+)-max(\d+)-sub([0-9p]+)-quant(\d+)-(.+)_metrics\.json'
match = re.match(pattern, filename)
if not match:
return None
image, min_size, max_size, sub_threshold, quantization, tile_library = match.groups()
# Convert threshold back from string (0p1 -> 0.1)
sub_threshold = sub_threshold.replace('p', '.')
return {
'image': image,
'min_size': int(min_size),
'max_size': int(max_size),
'sub_threshold': float(sub_threshold),
'quantization': int(quantization),
'tile_library': tile_library
}
def load_metrics_data():
"""Load all metrics data and organize by image"""
data_by_image = defaultdict(list)
print("[INFO] Loading metrics data...")
for json_file in METRICS_DIR.glob('*.json'):
# Skip files not belonging to our target images
if not any(img in json_file.name for img in TARGET_IMAGES):
continue
parsed = parse_filename(json_file.name)
if parsed is None:
continue
# Load metrics
try:
with open(json_file, 'r') as f:
metrics = json.load(f)
# Combine parameters and metrics
record = {**parsed, **metrics}
data_by_image[parsed['image']].append(record)
except Exception as e:
print(f"[WARNING] Failed to load {json_file.name}: {e}")
# Convert to DataFrames
dfs = {}
for image, records in data_by_image.items():
df = pd.DataFrame(records)
dfs[image] = df
print(f"[INFO] Loaded {len(df)} records for {image}")
return dfs
def create_heatmaps(df, image_name):
"""Create heatmap visualizations for an image"""
print(f"[INFO] Creating heatmaps for {image_name}")
fig, axes = plt.subplots(2, 2, figsize=(16, 12))
fig.suptitle(f'Parameter Impact Heatmaps - {image_name}', fontsize=16, fontweight='bold')
# 1. Min_size vs Max_size colored by SSIM
pivot1 = df.pivot_table(values='SSIM', index='min_size', columns='max_size', aggfunc='mean')
sns.heatmap(pivot1, annot=True, fmt='.3f', ax=axes[0,0], cmap='RdYlGn')
axes[0,0].set_title('SSIM by Min/Max Size')
axes[0,0].set_xlabel('Max Size')
axes[0,0].set_ylabel('Min Size')
# 2. Quantization vs Tile_library colored by Overall_Quality
pivot2 = df.pivot_table(values='Overall_Quality', index='quantization', columns='tile_library', aggfunc='mean')
sns.heatmap(pivot2, annot=True, fmt='.3f', ax=axes[0,1], cmap='RdYlGn')
axes[0,1].set_title('Overall Quality by Quantization/Tile Library')
axes[0,1].set_xlabel('Tile Library')
axes[0,1].set_ylabel('Quantization')
# 3. Subdivision vs Quantization colored by MSE (inverted colormap since lower MSE is better)
pivot3 = df.pivot_table(values='MSE', index='sub_threshold', columns='quantization', aggfunc='mean')
sns.heatmap(pivot3, annot=True, fmt='.0f', ax=axes[1,0], cmap='RdYlGn_r')
axes[1,0].set_title('MSE by Subdivision/Quantization')
axes[1,0].set_xlabel('Quantization')
axes[1,0].set_ylabel('Subdivision Threshold')
# 4. Tile library vs Min_size colored by Edge_Similarity
pivot4 = df.pivot_table(values='Edge_Similarity', index='tile_library', columns='min_size', aggfunc='mean')
sns.heatmap(pivot4, annot=True, fmt='.3f', ax=axes[1,1], cmap='RdYlGn')
axes[1,1].set_title('Edge Similarity by Tile Library/Min Size')
axes[1,1].set_xlabel('Min Size')
axes[1,1].set_ylabel('Tile Library')
plt.tight_layout()
output_path = OUTPUT_DIR / image_name / 'heatmaps.png'
plt.savefig(output_path, dpi=300, bbox_inches='tight')
plt.close()
print(f"[INFO] Saved heatmaps to {output_path}")
def create_metric_comparisons(df, image_name):
"""Create metric comparison charts"""
print(f"[INFO] Creating metric comparisons for {image_name}")
fig, axes = plt.subplots(2, 2, figsize=(16, 12))
fig.suptitle(f'Metric Comparisons - {image_name}', fontsize=16, fontweight='bold')
# 1. Box plots by tile library
metrics_to_plot = ['SSIM', 'Histogram_Correlation', 'Edge_Similarity', 'Overall_Quality']
for i, metric in enumerate(metrics_to_plot):
ax = axes[i//2, i%2]
df.boxplot(column=metric, by='tile_library', ax=ax)
ax.set_title(f'{metric} by Tile Library')
ax.set_xlabel('Tile Library')
ax.set_ylabel(metric)
ax.grid(True, alpha=0.3)
plt.suptitle('') # Remove automatic title
fig.suptitle(f'Metric Distribution by Tile Library - {image_name}', fontsize=16, fontweight='bold')
plt.tight_layout()
output_path = OUTPUT_DIR / image_name / 'metric_comparison.png'
plt.savefig(output_path, dpi=300, bbox_inches='tight')
plt.close()
print(f"[INFO] Saved metric comparison to {output_path}")
def create_parameter_impact(df, image_name):
"""Create parameter impact analysis"""
print(f"[INFO] Creating parameter impact analysis for {image_name}")
fig, axes = plt.subplots(2, 3, figsize=(18, 12))
fig.suptitle(f'Parameter Impact Analysis - {image_name}', fontsize=16, fontweight='bold')
# 1a. Quality metrics by quantization
quantization_impact = df.groupby('quantization')[['MSE', 'SSIM', 'Histogram_Correlation', 'Edge_Similarity']].mean()
quality_metrics = ['SSIM', 'Histogram_Correlation', 'Edge_Similarity']
quantization_impact[quality_metrics].plot(kind='bar', ax=axes[0,0])
axes[0,0].set_title('Quality Metrics by Quantization')
axes[0,0].set_xlabel('Quantization')
axes[0,0].set_ylabel('Metric Value')
axes[0,0].legend()
axes[0,0].tick_params(axis='x', rotation=0)
axes[0,0].grid(True, alpha=0.3)
# 1b. MSE by quantization (separate subplot)
quantization_impact['MSE'].plot(kind='bar', ax=axes[0,1], color='red')
axes[0,1].set_title('MSE by Quantization')
axes[0,1].set_xlabel('Quantization')
axes[0,1].set_ylabel('MSE')
axes[0,1].tick_params(axis='x', rotation=0)
axes[0,1].grid(True, alpha=0.3)
# 2. Size ratio impact (max/min)
df['size_ratio'] = df['max_size'] / df['min_size']
size_ratio_impact = df.groupby('size_ratio')['Overall_Quality'].mean()
size_ratio_impact.plot(kind='bar', ax=axes[0,2], color='skyblue')
axes[0,2].set_title('Overall Quality by Size Ratio (Max/Min)')
axes[0,2].set_xlabel('Size Ratio')
axes[0,2].set_ylabel('Overall Quality')
axes[0,2].tick_params(axis='x', rotation=45)
axes[0,2].grid(True, alpha=0.3)
# 3. Subdivision threshold impact
sub_impact = df.groupby('sub_threshold')['Overall_Quality'].mean()
sub_impact.plot(kind='bar', ax=axes[1,0], color='lightcoral')
axes[1,0].set_title('Overall Quality by Subdivision Threshold')
axes[1,0].set_xlabel('Subdivision Threshold')
axes[1,0].set_ylabel('Overall Quality')
axes[1,0].tick_params(axis='x', rotation=0)
axes[1,0].grid(True, alpha=0.3)
# 4a. Quality metrics by tile library
tile_performance = df.groupby('tile_library')[['MSE', 'SSIM', 'Histogram_Correlation', 'Edge_Similarity']].mean()
quality_metrics = ['SSIM', 'Histogram_Correlation', 'Edge_Similarity']
tile_performance[quality_metrics].plot(kind='bar', ax=axes[1,1])
axes[1,1].set_title('Quality Metrics by Tile Library')
axes[1,1].set_xlabel('Tile Library')
axes[1,1].set_ylabel('Metric Value')
axes[1,1].legend()
axes[1,1].tick_params(axis='x', rotation=45)
axes[1,1].grid(True, alpha=0.3)
# 4b. MSE by tile library
tile_performance['MSE'].plot(kind='bar', ax=axes[1,2], color='red')
axes[1,2].set_title('MSE by Tile Library')
axes[1,2].set_xlabel('Tile Library')
axes[1,2].set_ylabel('MSE')
axes[1,2].tick_params(axis='x', rotation=45)
axes[1,2].grid(True, alpha=0.3)
plt.tight_layout()
output_path = OUTPUT_DIR / image_name / 'parameter_impact.png'
plt.savefig(output_path, dpi=300, bbox_inches='tight')
plt.close()
print(f"[INFO] Saved parameter impact to {output_path}")
def analyze_parameter_degradation(df, image_name):
"""Analyze which parameters cause quality degradation (for artistic/mosaic effects)"""
print(f"[INFO] Analyzing parameter degradation effects for {image_name}")
fig, axes = plt.subplots(2, 2, figsize=(16, 12))
fig.suptitle(f'Parameter Degradation Analysis (For Artistic Effects) - {image_name}', fontsize=16, fontweight='bold')
# 1. Which parameters INCREASE MSE (worse quality = more artistic)
mse_by_param = {}
mse_by_param['quantization'] = df.groupby('quantization')['MSE'].mean()
mse_by_param['min_size'] = df.groupby('min_size')['MSE'].mean()
mse_by_param['max_size'] = df.groupby('max_size')['MSE'].mean()
mse_by_param['sub_threshold'] = df.groupby('sub_threshold')['MSE'].mean()
# Plot MSE increase trends
ax = axes[0,0]
colors = ['red', 'orange', 'green', 'blue']
for i, (param, values) in enumerate(mse_by_param.items()):
ax.plot(values.index, values.values, marker='o', label=param, color=colors[i], linewidth=2)
ax.set_title('MSE by Parameters (Higher = More Artistic)')
ax.set_xlabel('Parameter Value')
ax.set_ylabel('Average MSE')
ax.legend()
ax.grid(True, alpha=0.3)
# 2. Which parameters DECREASE SSIM (worse similarity = more artistic)
ssim_by_param = {}
ssim_by_param['quantization'] = df.groupby('quantization')['SSIM'].mean()
ssim_by_param['min_size'] = df.groupby('min_size')['SSIM'].mean()
ssim_by_param['max_size'] = df.groupby('max_size')['SSIM'].mean()
ssim_by_param['sub_threshold'] = df.groupby('sub_threshold')['SSIM'].mean()
ax = axes[0,1]
for i, (param, values) in enumerate(ssim_by_param.items()):
ax.plot(values.index, values.values, marker='s', label=param, color=colors[i], linewidth=2)
ax.set_title('SSIM by Parameters (Lower = More Artistic)')
ax.set_xlabel('Parameter Value')
ax.set_ylabel('Average SSIM')
ax.legend()
ax.grid(True, alpha=0.3)
# 3. Parameter impact ranking for degradation
degradation_impact = {}
# Calculate impact as difference between max and min values (normalized)
for param in ['quantization', 'min_size', 'max_size', 'sub_threshold']:
mse_range = mse_by_param[param].max() - mse_by_param[param].min()
ssim_range = ssim_by_param[param].max() - ssim_by_param[param].min()
# Normalize by overall metric range
mse_impact = mse_range / df['MSE'].std()
ssim_impact = ssim_range / df['SSIM'].std()
degradation_impact[param] = (mse_impact + ssim_impact) / 2
# Plot simple impact ranking
ax = axes[1,0]
params = list(degradation_impact.keys())
impacts = list(degradation_impact.values())
ax.bar(params, impacts, color='lightcoral')
ax.set_title('Parameter Impact on Quality Degradation')
ax.set_xlabel('Parameters')
ax.set_ylabel('Impact Score')
ax.tick_params(axis='x', rotation=45)
ax.grid(True, alpha=0.3)
# Add score labels
for i, (param, impact) in enumerate(zip(params, impacts)):
ax.text(i, impact + 0.05, f'{impact:.2f}', ha='center', va='bottom')
# 4. Empty subplot (remove recommendations)
axes[1,1].axis('off')
plt.tight_layout()
output_path = OUTPUT_DIR / image_name / 'parameter_degradation.png'
plt.savefig(output_path, dpi=300, bbox_inches='tight')
plt.close()
print(f"[INFO] Saved parameter degradation analysis to {output_path}")
def analyze_cifar_comparison(df, image_name):
"""Direct comparison between CIFAR-10 and CIFAR-100"""
print(f"[INFO] Analyzing CIFAR-10 vs CIFAR-100 comparison for {image_name}")
# Filter data for CIFAR comparisons only
cifar_data = df[df['tile_library'].isin(['cifar-10', 'cifar-100'])].copy()
if len(cifar_data) == 0:
print(f"[WARNING] No CIFAR data found for {image_name}")
return
fig, axes = plt.subplots(2, 2, figsize=(16, 12))
fig.suptitle(f'CIFAR-10 vs CIFAR-100 Direct Comparison - {image_name}', fontsize=16, fontweight='bold')
# 1a. Quality metrics comparison
metrics = ['MSE', 'SSIM', 'Histogram_Correlation', 'Edge_Similarity']
cifar_comparison = cifar_data.groupby('tile_library')[metrics].mean()
quality_metrics = ['SSIM', 'Histogram_Correlation', 'Edge_Similarity']
cifar_comparison[quality_metrics].T.plot(kind='bar', ax=axes[0,0], color=['lightblue', 'lightcoral'])
axes[0,0].set_title('Quality Metrics Comparison')
axes[0,0].set_ylabel('Metric Value')
axes[0,0].legend(title='Tile Library')
axes[0,0].tick_params(axis='x', rotation=45)
axes[0,0].grid(True, alpha=0.3)
# 1b. MSE comparison (separate subplot)
cifar_comparison['MSE'].plot(kind='bar', ax=axes[0,1], color=['red', 'orange'])
axes[0,1].set_title('MSE Comparison')
axes[0,1].set_ylabel('MSE')
axes[0,1].legend(['CIFAR-10', 'CIFAR-100'])
axes[0,1].grid(True, alpha=0.3)
# 2. Paired comparison for same parameter settings
# Create parameter combination identifier
cifar_data['param_combo'] = (cifar_data['min_size'].astype(str) + '_' +
cifar_data['max_size'].astype(str) + '_' +
cifar_data['sub_threshold'].astype(str) + '_' +
cifar_data['quantization'].astype(str))
# Find configurations that exist for both CIFAR types
cifar10_combos = set(cifar_data[cifar_data['tile_library'] == 'cifar-10']['param_combo'])
cifar100_combos = set(cifar_data[cifar_data['tile_library'] == 'cifar-100']['param_combo'])
common_combos = cifar10_combos.intersection(cifar100_combos)
paired_data = []
for combo in common_combos:
combo_data = cifar_data[cifar_data['param_combo'] == combo]
if len(combo_data) == 2: # Should have both CIFAR-10 and CIFAR-100
cifar10_row = combo_data[combo_data['tile_library'] == 'cifar-10'].iloc[0]
cifar100_row = combo_data[combo_data['tile_library'] == 'cifar-100'].iloc[0]
paired_data.append({
'combo': combo,
'cifar10_ssim': cifar10_row['SSIM'],
'cifar100_ssim': cifar100_row['SSIM'],
'cifar10_mse': cifar10_row['MSE'],
'cifar100_mse': cifar100_row['MSE'],
'ssim_diff': cifar10_row['SSIM'] - cifar100_row['SSIM'],
'mse_diff': cifar10_row['MSE'] - cifar100_row['MSE']
})
paired_df = pd.DataFrame(paired_data)
# 2. Win/Loss analysis
ax = axes[1,0]
if len(paired_df) > 0:
ssim_wins = (paired_df['ssim_diff'] > 0).sum() # CIFAR-10 wins
ssim_losses = (paired_df['ssim_diff'] < 0).sum() # CIFAR-100 wins
mse_wins = (paired_df['mse_diff'] < 0).sum() # CIFAR-10 wins (lower MSE is better)
mse_losses = (paired_df['mse_diff'] > 0).sum() # CIFAR-100 wins
categories = ['SSIM', 'MSE']
cifar10_scores = [ssim_wins, mse_wins]
cifar100_scores = [ssim_losses, mse_losses]
x = np.arange(len(categories))
width = 0.35
ax.bar(x - width/2, cifar10_scores, width, label='CIFAR-10 Wins', color='lightblue')
ax.bar(x + width/2, cifar100_scores, width, label='CIFAR-100 Wins', color='lightcoral')
ax.set_title(f'Win/Loss Analysis ({len(paired_df)} comparisons)')
ax.set_ylabel('Number of Wins')
ax.set_xticks(x)
ax.set_xticklabels(categories)
ax.legend()
ax.grid(True, alpha=0.3)
# Add value labels
for i, (c10, c100) in enumerate(zip(cifar10_scores, cifar100_scores)):
ax.text(i - width/2, c10 + 0.5, str(c10), ha='center', va='bottom')
ax.text(i + width/2, c100 + 0.5, str(c100), ha='center', va='bottom')
# 3. Performance difference distribution
ax = axes[1,1]
if len(paired_df) > 0:
ax.hist(paired_df['ssim_diff'], bins=20, alpha=0.7, color='skyblue', edgecolor='black')
ax.axvline(x=0, color='red', linestyle='--', linewidth=2)
ax.set_title('SSIM Difference Distribution (CIFAR-10 - CIFAR-100)')
ax.set_xlabel('SSIM Difference')
ax.set_ylabel('Frequency')
ax.grid(True, alpha=0.3)
plt.tight_layout()
output_path = OUTPUT_DIR / image_name / 'cifar_comparison.png'
plt.savefig(output_path, dpi=300, bbox_inches='tight')
plt.close()
print(f"[INFO] Saved CIFAR comparison to {output_path}")
def analyze_size_consistency(all_dfs):
"""Analyze if min/max size effects are consistent across images"""
print("[INFO] Analyzing min/max size consistency across images")
fig, axes = plt.subplots(2, 2, figsize=(16, 12))
fig.suptitle('Min/Max Size Effects Consistency Across Images', fontsize=16, fontweight='bold')
# Combine all data
combined_data = []
for image_name, df in all_dfs.items():
df_copy = df.copy()
df_copy['image'] = image_name
combined_data.append(df_copy)
combined_df = pd.concat(combined_data, ignore_index=True)
# 1. Min size effect on SSIM across images
ax = axes[0,0]
for image in TARGET_IMAGES:
image_data = combined_df[combined_df['image'] == image]
min_size_effect = image_data.groupby('min_size')['SSIM'].mean()
ax.plot(min_size_effect.index, min_size_effect.values, marker='o', label=image, linewidth=2)
ax.set_title('Min Size Effect on SSIM')
ax.set_xlabel('Min Size')
ax.set_ylabel('Average SSIM')
ax.legend()
ax.grid(True, alpha=0.3)
# 2. Max size effect on SSIM across images
ax = axes[0,1]
for image in TARGET_IMAGES:
image_data = combined_df[combined_df['image'] == image]
max_size_effect = image_data.groupby('max_size')['SSIM'].mean()
ax.plot(max_size_effect.index, max_size_effect.values, marker='s', label=image, linewidth=2)
ax.set_title('Max Size Effect on SSIM')
ax.set_xlabel('Max Size')
ax.set_ylabel('Average SSIM')
ax.legend()
ax.grid(True, alpha=0.3)
# 3. Size ratio consistency
combined_df['size_ratio'] = combined_df['max_size'] / combined_df['min_size']
ax = axes[1,0]
for image in TARGET_IMAGES:
image_data = combined_df[combined_df['image'] == image]
ratio_effect = image_data.groupby('size_ratio')['Overall_Quality'].mean()
ax.plot(ratio_effect.index, ratio_effect.values, marker='^', label=image, linewidth=2)
ax.set_title('Size Ratio Effect on Overall Quality')
ax.set_xlabel('Size Ratio (Max/Min)')
ax.set_ylabel('Average Overall Quality')
ax.legend()
ax.grid(True, alpha=0.3)
# 4. Size ratio effect comparison
ax = axes[1,1]
# Show correlation values as a simple bar chart
consistency_analysis = {}
for size_param in ['min_size', 'max_size']:
param_effects = {}
for image in TARGET_IMAGES:
image_data = combined_df[combined_df['image'] == image]
effect = image_data.groupby(size_param)['SSIM'].mean()
param_effects[image] = effect
# Calculate correlation between images
correlations = []
images = list(param_effects.keys())
for i in range(len(images)):
for j in range(i+1, len(images)):
# Find common parameter values
common_params = set(param_effects[images[i]].index).intersection(
set(param_effects[images[j]].index)
)
if len(common_params) > 1:
vals_i = [param_effects[images[i]][p] for p in common_params]
vals_j = [param_effects[images[j]][p] for p in common_params]
corr = np.corrcoef(vals_i, vals_j)[0,1]
correlations.append(corr)
consistency_analysis[size_param] = np.mean(correlations) if correlations else 0
# Plot consistency as bar chart
params = list(consistency_analysis.keys())
correlations = list(consistency_analysis.values())
ax.bar(params, correlations, color=['skyblue', 'lightgreen'])
ax.set_title('Parameter Consistency Across Images')
ax.set_xlabel('Size Parameters')
ax.set_ylabel('Average Correlation')
ax.set_ylim(0, 1)
ax.grid(True, alpha=0.3)
# Add correlation values
for i, (param, corr) in enumerate(zip(params, correlations)):
ax.text(i, corr + 0.02, f'{corr:.3f}', ha='center', va='bottom')
plt.tight_layout()
output_path = OUTPUT_DIR / 'size_consistency_analysis.png'
plt.savefig(output_path, dpi=300, bbox_inches='tight')
plt.close()
print(f"[INFO] Saved size consistency analysis to {output_path}")
def main():
"""Main analysis function"""
print("=" * 60)
print("MOSAIC PARAMETER BEHAVIOR ANALYSIS")
print("=" * 60)
setup_directories()
# Load data
all_dfs = load_metrics_data()
if not all_dfs:
print("[ERROR] No data loaded. Check metrics directory.")
return
# Analyze each image
for image_name, df in all_dfs.items():
print(f"\n[INFO] Analyzing {image_name}...")
# Keep original heatmaps and parameter impact
create_heatmaps(df, image_name)
create_parameter_impact(df, image_name)
# New analyses
analyze_parameter_degradation(df, image_name)
analyze_cifar_comparison(df, image_name)
# Cross-image consistency analysis
analyze_size_consistency(all_dfs)
print("\n" + "=" * 60)
print("ANALYSIS COMPLETE!")
print("=" * 60)
print(f"Results saved to: {OUTPUT_DIR}")
print("\nGenerated analyses:")
print("• heatmaps.png - Parameter impact heatmaps")
print("• parameter_impact.png - Parameter effect analysis")
print("• parameter_degradation.png - Settings for artistic effects")
print("• cifar_comparison.png - CIFAR-10 vs CIFAR-100 comparison")
print("• size_consistency_analysis.png - Cross-image size effect consistency")
if __name__ == "__main__":
main()