|
|
"""Tests for the API module.""" |
|
|
|
|
|
import pytest |
|
|
from unittest.mock import AsyncMock, patch |
|
|
from fastapi.testclient import TestClient |
|
|
|
|
|
from cascade.api.schemas import ( |
|
|
ChatCompletionRequest, |
|
|
ChatCompletionResponse, |
|
|
ChatMessage, |
|
|
UsageInfo, |
|
|
ChatCompletionChoice, |
|
|
) |
|
|
|
|
|
|
|
|
class TestSchemas:
    """Unit tests for the request/response Pydantic schemas."""

    def test_chat_message_creation(self):
        """ChatMessage should be created correctly."""
        message = ChatMessage(role="user", content="Hello")
        assert message.role == "user"
        assert message.content == "Hello"

    def test_chat_message_roles(self):
        """ChatMessage should accept valid roles."""
        for valid_role in ("system", "user", "assistant"):
            assert ChatMessage(role=valid_role, content="test").role == valid_role

    def test_chat_request_defaults(self):
        """ChatCompletionRequest should have correct defaults."""
        req = ChatCompletionRequest(
            messages=[ChatMessage(role="user", content="Hello")]
        )
        # Defaults when only `messages` is supplied.
        assert req.model == "gpt-4o"
        assert req.temperature == 0.7
        assert req.max_tokens is None
        assert req.stream is False

    def test_chat_request_custom_values(self):
        """ChatCompletionRequest should accept custom values."""
        req = ChatCompletionRequest(
            model="gpt-4o-mini",
            messages=[ChatMessage(role="user", content="Hello")],
            temperature=0.5,
            max_tokens=100,
        )
        assert (req.model, req.temperature, req.max_tokens) == (
            "gpt-4o-mini",
            0.5,
            100,
        )

    def test_usage_info(self):
        """UsageInfo should track token usage."""
        usage = UsageInfo(
            prompt_tokens=10,
            completion_tokens=20,
            total_tokens=30,
        )
        assert usage.prompt_tokens == 10
        assert usage.completion_tokens == 20
        assert usage.total_tokens == 30

    def test_chat_response_creation(self):
        """ChatCompletionResponse should be created correctly."""
        # Build the nested pieces first so the response construction
        # stays readable.
        reply = ChatMessage(role="assistant", content="Hi there!")
        choice = ChatCompletionChoice(index=0, message=reply, finish_reason="stop")
        usage = UsageInfo(prompt_tokens=5, completion_tokens=10, total_tokens=15)

        response = ChatCompletionResponse(
            id="test-123",
            created=1234567890,
            model="gpt-4o",
            choices=[choice],
            usage=usage,
        )

        assert response.id == "test-123"
        assert response.model == "gpt-4o"
        assert len(response.choices) == 1
        assert response.choices[0].message.content == "Hi there!"
|
|
|
|
|
|
|
|
class TestCostTracking:
    """Tests for cost tracking.

    Computed-cost assertions use ``pytest.approx`` rather than exact
    ``==``: the pricing math is a sum of float products, so exact
    equality is fragile against floating-point rounding.
    """

    def test_cost_calculation(self):
        """Cost should be calculated correctly."""
        from cascade.cost.pricing import calculate_cost

        # 1000 prompt + 1000 completion tokens of a paid model.
        cost = calculate_cost("gpt-4o", 1000, 1000)
        assert cost == pytest.approx(0.09)

    def test_free_model_cost(self):
        """Free models should have zero cost."""
        from cascade.cost.pricing import calculate_cost, is_free_model

        # Zero is exact for free models, so plain equality is safe here.
        cost = calculate_cost("llama3.2", 1000, 1000)
        assert cost == 0.0
        assert is_free_model("llama3.2")

    def test_savings_calculation(self):
        """Savings should be calculated correctly."""
        from cascade.cost.pricing import calculate_savings

        # Spent $1.00 against a $10.00 baseline -> $9.00 / 90% saved.
        dollars_saved, percentage_saved = calculate_savings(1.0, 10.0)
        assert dollars_saved == pytest.approx(9.0)
        assert percentage_saved == pytest.approx(90.0)

    def test_savings_zero_baseline(self):
        """Savings with zero baseline should not error."""
        from cascade.cost.pricing import calculate_savings

        # Guards against ZeroDivisionError in the percentage calculation.
        dollars_saved, percentage_saved = calculate_savings(0.0, 0.0)
        assert dollars_saved == 0.0
        assert percentage_saved == 0.0
|
|
|
|
|
|
|
|
class TestCostTracker:
    """Unit tests for the CostTracker metrics service."""

    def test_tracker_initialization(self):
        """CostTracker should initialize with zero values."""
        from cascade.cost.tracker import CostTracker

        fresh = CostTracker()
        assert fresh.total_requests == 0
        assert fresh.total_cost == 0.0
        assert fresh.cache_hits_exact == 0

    def test_record_request(self):
        """Recording requests should update totals."""
        from cascade.cost.tracker import CostTracker

        tracker = CostTracker()
        tracker.record_request(
            model="gpt-4o",
            prompt_tokens=100,
            completion_tokens=50,
            latency=0.5,
        )

        # One paid request: counters advance, tokens are summed.
        assert tracker.total_requests == 1
        assert tracker.total_cost > 0
        assert tracker.total_tokens == 150

    def test_cache_hit_tracking(self):
        """Cache hits should be tracked correctly."""
        from cascade.cost.tracker import CostTracker

        tracker = CostTracker()
        # One event of each outcome kind.
        for outcome in ("exact", "semantic", "miss"):
            tracker.record_cache_hit(outcome)

        assert tracker.cache_hits_exact == 1
        assert tracker.cache_hits_semantic == 1
        assert tracker.cache_misses == 1

    def test_get_summary(self):
        """Summary should contain all metrics."""
        from cascade.cost.tracker import CostTracker

        tracker = CostTracker()
        tracker.record_request("gpt-4o", 100, 50, 0.5)
        tracker.record_cache_hit("exact")

        summary = tracker.get_summary()

        for section in ("total_requests", "cost", "cache", "latency", "models"):
            assert section in summary

    def test_reset(self):
        """Reset should clear all metrics."""
        from cascade.cost.tracker import CostTracker

        tracker = CostTracker()
        tracker.record_request("gpt-4o", 100, 50, 0.5)
        tracker.reset()

        # All counters return to their initial state.
        assert tracker.total_requests == 0
        assert tracker.total_cost == 0.0
|
|
|