UserSyncUI

Paused

App Files Files Community

UserSyncUI / tests /unit /test_tiny_styler.py

harvesthealth

Upload folder using huggingface_hub

f6686e1 verified 2 months ago

raw

history blame contribute delete

7.3 kB

	import pytest
	import textwrap

	import logging
	logger = logging.getLogger("tinytroupe")

	import sys
	# Insert paths at the beginning of sys.path (position 0)
	sys.path.insert(0, '..')
	sys.path.insert(0, '../../')
	sys.path.insert(0, '../../tinytroupe/')

	from testing_utils import *

	from tinytroupe.enrichment.tiny_styler import TinyStyler

	def test_apply_style():
	"""Test the basic functionality of apply_style using the actual LLM."""
	content_to_style = textwrap.dedent("""
	The results of our quarterly financial analysis show a 15% increase in revenue
	and a 5% decrease in operating costs. Customer acquisition costs have decreased
	by 10% while retention rates have improved from 65% to 78%. Our new product line
	has contributed to 25% of this quarter's growth.
	""").strip()

	style = "casual"

	# Call the method with the actual LLM
	styler = TinyStyler()
	result = styler.apply_style(
	content=content_to_style,
	style=style,
	content_type="report",
	verbose=True
	)

	# lowercase the content to make assertions case-insensitive
	result = result.lower() if result else None
	# Log the result for manual inspection
	logger.debug(f"Styled content: {result}")

	# Assert result
	assert result is not None, "The result should not be None"
	# Check that key information is preserved in the styled content
	assert ("15" in result) or ("fifteen" in result), "The styled content should preserve the 15% revenue increase information"
	assert ("5" in result) or ("five" in result), "The styled content should preserve the 5% decrease in operating costs information"
	assert ("78" in result) or ("seventy-eight" in result), "The styled content should preserve the 78% retention rate information"

	# Semantic verification: ensure the styled content maintains financial/business meaning
	assert proposition_holds(result + " - The content discusses financial performance, revenue, costs, or business metrics")

	# Semantic verification: ensure the styled content is actually in casual style
	assert proposition_holds(result + " - The writing style is casual, informal, or conversational rather than formal or technical")

	# Check that the style has been applied (this is more subjective)
	# For casual style, we might expect certain casual markers
	casual_indicators = ["!", "we", "our", "pretty", "nice", "great", "awesome", "cool", "hey", "check", "looking"]
	has_casual_tone = any(indicator in result.lower() for indicator in casual_indicators)
	assert has_casual_tone, "The result should have a casual tone"

	logger.debug(f"Styling result: {result}")

	def test_apply_style_with_different_styles():
	"""Test applying different styles to the same content."""
	content_to_style = "We need to improve our customer retention strategies to boost quarterly performance."

	# Test with three different styles
	styles = ["technical", "professional", "enthusiastic"]
	results = {}

	styler = TinyStyler()
	for style in styles:
	results[style] = styler.apply_style(
	content=content_to_style,
	style=style
	)
	# Basic validation
	assert results[style] is not None, f"The {style} styled result should not be None"
	assert "customer retention" in results[style], f"The {style} styled content should preserve the key information"

	# Semantic verification: ensure each style is appropriately applied
	if style == "technical":
	assert proposition_holds(results[style] + " - The writing style is technical, detailed, or uses professional/technical language")
	elif style == "professional":
	assert proposition_holds(results[style] + " - The writing style is professional, formal, or business-like")
	elif style == "enthusiastic":
	assert proposition_holds(results[style] + " - The writing style is enthusiastic, energetic, or shows excitement")

	# Verify that different styles produce different results
	assert results["technical"] != results["professional"] != results["enthusiastic"], "Different styles should produce different results"

	# Log results for manual inspection
	for style, result in results.items():
	logger.debug(f"{style} styling result: {result}")

	def test_context_cache_usage():
	"""Test that context cache is properly used when enabled."""
	# Create styler with context caching enabled
	styler = TinyStyler(use_past_results_in_context=True)

	# First styling
	first_content = "The team completed the project ahead of schedule."
	first_style = "formal"
	first_result = styler.apply_style(content=first_content, style=first_style)

	# Second styling - should have context from first
	second_content = "We saved 15% on the project budget."
	second_style = "casual"
	second_result = styler.apply_style(content=second_content, style=second_style)

	# Verify context cache has been populated
	assert len(styler.context_cache) == 2, "Context cache should contain 2 entries"
	assert styler.context_cache[0]["original"] == first_content
	assert styler.context_cache[0]["style"] == first_style
	assert styler.context_cache[0]["styled"] == first_result

	# Third styling with explicit context
	third_content = "Customer satisfaction increased by 20%."
	external_context = [{"original": "Original text", "style": "poetic", "styled": "Poetic version"}]
	third_result = styler.apply_style(
	content=third_content,
	style="technical",
	context_cache=external_context
	)

	# Verify context_cache parameter was respected (it should override the instance's context_cache)
	assert len(styler.context_cache) == 3, "Context cache should now contain 3 entries"

	def test_temperature_parameter():
	"""Test that temperature parameter affects output variability."""
	content_to_style = "The product launch is scheduled for next month."
	style = "creative"

	# Generate outputs with different temperatures
	styler = TinyStyler()
	results_low_temp = [
	styler.apply_style(content=content_to_style, style=style, temperature=0.1)
	for _ in range(2)
	]

	results_high_temp = [
	styler.apply_style(content=content_to_style, style=style, temperature=1.0)
	for _ in range(2)
	]

	# With very low temperature, results should be more similar to each other
	# With high temperature, results should be more varied
	# This is a probabilistic test, so it might not always pass

	# Log results for manual inspection
	logger.debug(f"Low temperature results: {results_low_temp}")
	logger.debug(f"High temperature results: {results_high_temp}")

	# If we want more deterministic testing, we could check that all results preserve key information
	for result in results_low_temp + results_high_temp:
	assert proposition_holds(f"The following content discusses something that could be a product launch scheduled for next month: {result}"), \
	"All styled content should semantically preserve the product launch and timing information"

	if __name__ == '__main__':
	pytest.main()