Spaces:

UMCU
/

PerplexityViewer

Sleeping

PerplexityViewer / test_colors.py

Bram van Es

bla

ef12530 about 1 month ago

7.11 kB

	#!/usr/bin/env python3
	"""
	Test script to verify color visualization is working correctly
	"""

	import numpy as np
	import re
	from app import create_visualization

	def test_color_visualization():
	    """Check that ``create_visualization`` emits colored, tooltipped HTML.

	    Renders a fixed eight-token sample with mixed perplexities and asserts
	    that the markup contains ``rgb()``/``rgba()`` colors, ``<span>`` elements
	    styled with ``background-color``, ``title="Perplexity:`` tooltips, and
	    more than one distinct color with a red-channel spread above 20.

	    Returns:
	        The HTML string produced by ``create_visualization``.

	    Raises:
	        AssertionError: If any of the checks above fails.
	    """
	    print("🎨 Testing Color Visualization")
	    print("=" * 50)

	    # Test with sample data
	    tokens = ["The", "quick", "brown", "fox", "jumps", "over", "lazy", "dog"]
	    perplexities = np.array([1.2, 2.5, 8.3, 3.1, 15.7, 2.0, 12.4, 1.8])

	    print(f"📝 Tokens: {tokens}")
	    print(f"📊 Perplexities: {perplexities}")

	    # Generate visualization
	    html = create_visualization(tokens, perplexities)

	    # Check that HTML was generated
	    assert len(html) > 100, "HTML output too short"
	    print("✅ HTML generated successfully")

	    # Match rgb(r,g,b) / rgba(r,g,b,a) with any amount of whitespace after
	    # each comma, so the check does not depend on how the colors are spaced.
	    color_pattern = r'rgba?\(\d+,\s*\d+,\s*\d+(?:,\s*[\d.]+)?\)'
	    colors_found = re.findall(color_pattern, html)

	    print(f"🎨 Colors found in HTML: {len(colors_found)}")
	    for i, color in enumerate(colors_found[:5]):  # Show first 5
	        print(f" Color {i+1}: {color}")

	    assert len(colors_found) > 0, "No colors found in HTML output"
	    print("✅ Color information found in HTML")

	    # A styled span is a <span> whose style attribute mentions
	    # background-color anywhere among its declarations.
	    span_pattern = r'<span style="[^"]*background-color[^"]*"[^>]*>'
	    spans_found = re.findall(span_pattern, html)

	    print(f"🏷️ Styled spans found: {len(spans_found)}")
	    # Allow for some filtering
	    assert len(spans_found) >= len(tokens) - 2, "Not enough styled spans found"
	    print("✅ Styled spans with background colors found")

	    # Check for tooltip information
	    assert 'title="Perplexity:' in html, "No tooltip information found"
	    print("✅ Tooltip information found")

	    # Reduce each matched color to its (r, g, b) integers; the first three
	    # digit runs are the channels, any alpha component is ignored.
	    rgb_values = []
	    for color in colors_found:
	        numbers = re.findall(r'\d+', color)
	        if len(numbers) >= 3:
	            rgb_values.append((int(numbers[0]), int(numbers[1]), int(numbers[2])))

	    # Variation checks only make sense with at least two colors to compare.
	    if len(rgb_values) >= 2:
	        unique_colors = set(rgb_values)
	        print(f"🌈 Unique colors found: {len(unique_colors)}")
	        assert len(unique_colors) > 1, "All tokens have the same color"
	        print("✅ Multiple different colors found")

	        red_values = [r for r, g, b in rgb_values]
	        green_values = [g for r, g, b in rgb_values]

	        print(f"🔴 Red range: {min(red_values)} - {max(red_values)}")
	        print(f"🟢 Green range: {min(green_values)} - {max(green_values)}")

	        # Should have variation in color channels
	        assert max(red_values) - min(red_values) > 20, "Not enough red variation"
	        print("✅ Sufficient color variation found")

	    return html

	def test_edge_cases():
	    """Exercise ``create_visualization`` on boundary inputs.

	    Covers very high perplexities, very low perplexities, a single token,
	    and empty input. The first three must yield more than 50 characters of
	    HTML; the empty case must yield output containing ``"No tokens"``.

	    Raises:
	        AssertionError: If any case produces unexpected output.
	    """
	    print("\n🧪 Testing Edge Cases")
	    print("=" * 50)

	    words = ["unusual", "words", "here"]

	    # (tokens, perplexities, assertion message, success message)
	    scenarios = (
	        (
	            words,
	            np.array([100.0, 200.0, 50.0]),
	            "HTML too short for high perplexities",
	            "✅ High perplexity values handled",
	        ),
	        (
	            words,
	            np.array([0.1, 0.2, 0.15]),
	            "HTML too short for low perplexities",
	            "✅ Low perplexity values handled",
	        ),
	        (
	            ["word"],
	            np.array([5.0]),
	            "HTML too short for single token",
	            "✅ Single token handled",
	        ),
	    )

	    for case_tokens, case_perplexities, failure_text, success_text in scenarios:
	        rendered = create_visualization(case_tokens, case_perplexities)
	        assert len(rendered) > 50, failure_text
	        print(success_text)

	    # Empty input is checked for a placeholder message rather than a length.
	    rendered_empty = create_visualization([], np.array([]))
	    assert "No tokens" in rendered_empty, "Empty case not handled properly"
	    print("✅ Empty input handled")

	def test_color_gradient():
	    """Report whether colors move from green to red as perplexity rises.

	    Renders ten tokens with ascending perplexities (1, 3, ..., 19) and
	    compares the first and last ``rgb()``/``rgba()`` colors found in the
	    HTML. The comparison is advisory: results are printed as a pass or a
	    warning and never raise.
	    """
	    print("\n🌈 Testing Color Gradient")
	    print("=" * 50)

	    # Create tokens with ascending perplexities: 1, 3, 5, ..., 19
	    tokens = [f"token_{i}" for i in range(10)]
	    perplexities = np.array([i * 2.0 + 1.0 for i in range(10)])

	    html = create_visualization(tokens, perplexities)

	    # Capture the r, g, b channels in document order; whitespace after the
	    # commas is optional so both "rgb(1,2,3)" and "rgb(1, 2, 3)" match.
	    color_pattern = r'rgba?\((\d+),\s*(\d+),\s*(\d+)(?:,\s*[\d.]+)?\)'
	    colors_found = re.findall(color_pattern, html)

	    if len(colors_found) < 5:
	        # Say so instead of passing silently when there is nothing to compare.
	        print(f"⚠️ Only {len(colors_found)} colors found; gradient check skipped")
	        return

	    # Convert to numeric values
	    rgb_values = [(int(r), int(g), int(b)) for r, g, b in colors_found]

	    low_perp_color = rgb_values[0]  # First color found (lowest perplexity)
	    high_perp_color = rgb_values[-1]  # Last color found (highest perplexity)

	    print(f"🟢 Low perplexity color (perp={perplexities[0]:.1f}): RGB{low_perp_color}")
	    print(f"🔴 High perplexity color (perp={perplexities[-1]:.1f}): RGB{high_perp_color}")

	    # Low perplexity should be more green (higher green value)
	    if low_perp_color[1] > high_perp_color[1]:
	        print("✅ Low perplexity tokens are greener")
	    else:
	        print("⚠️ Expected low perplexity to be greener")

	    # High perplexity should be more red (higher red value)
	    if high_perp_color[0] > low_perp_color[0]:
	        print("✅ High perplexity tokens are redder")
	    else:
	        print("⚠️ Expected high perplexity to be redder")

	def main():
	    """Run all color visualization tests and save a sample HTML page.

	    Runs the basic, edge-case and gradient tests in order. On success the
	    HTML from the basic test is written to ``sample_visualization.html`` in
	    the current working directory for manual inspection.

	    Returns:
	        True if every test passed and the sample file was written; False if
	        any step raised, in which case the traceback is printed.
	    """
	    print("🎨 Color Visualization Test Suite")
	    print("=" * 60)

	    try:
	        # Test basic functionality
	        html = test_color_visualization()

	        # Test edge cases
	        test_edge_cases()

	        # Test color gradient
	        test_color_gradient()

	        print("\n" + "=" * 60)
	        print("🎉 All color visualization tests passed!")
	        print("🌈 The tokens should now appear with colored backgrounds!")
	        print("=" * 60)

	        # Save a sample HTML file for manual inspection. The encoding is
	        # explicit so non-ASCII tokens are written the same on every
	        # platform, and the page declares it so browsers decode it correctly.
	        with open("sample_visualization.html", "w", encoding="utf-8") as f:
	            f.write(f"""
	<!DOCTYPE html>
	<html>
	<head>
	<meta charset="utf-8">
	<title>Sample Perplexity Visualization</title>
	</head>
	<body>
	<h1>Sample Perplexity Visualization</h1>
	<p>This is what the colored visualization should look like:</p>
	{html}
	</body>
	</html>
	""")
	        print("💾 Sample visualization saved to 'sample_visualization.html'")
	        print(" Open this file in your browser to see the colors!")

	        return True

	    except Exception as e:
	        # Top-level boundary: report the failure and signal it via the
	        # return value so the caller can choose the exit status.
	        print(f"\n❌ Color visualization test failed: {e}")
	        import traceback
	        traceback.print_exc()
	        return False

	if __name__ == "__main__":
	    # Exit with status 0 on success and 1 on failure. SystemExit is raised
	    # directly because the exit() helper is installed by the site module and
	    # is not available when the interpreter runs without it.
	    raise SystemExit(0 if main() else 1)