#!/usr/bin/env python3
"""Test script for the API"""
import requests
def test_api(
    base_url: str = "https://Ariyan-Pro-rag-latency-optimization.hf.space",
    timeout: float = 30.0,
) -> None:
    """Exercise the API's /health, /metrics and /query endpoints and print the results.

    Args:
        base_url: Root URL of the service under test (no trailing slash).
        timeout: Seconds to wait for each HTTP request before giving up.
            Without a timeout, ``requests`` waits indefinitely.

    Raises:
        requests.exceptions.HTTPError: If an endpoint answers with a 4xx/5xx
            status.
        requests.exceptions.RequestException: On connection failures or
            timeouts.
        KeyError: If a response body lacks one of the fields printed below.
    """
    print("Testing RAG Optimization API...")

    # Test health
    health = requests.get(f"{base_url}/health", timeout=timeout)
    # Fail on the HTTP status itself rather than on a confusing JSON/KeyError
    # further down.
    health.raise_for_status()
    print(f"Health: {health.json()}")

    # Test metrics
    metrics = requests.get(f"{base_url}/metrics", timeout=timeout)
    metrics.raise_for_status()
    data = metrics.json()
    print("\nPerformance Metrics:")
    print(f" Baseline: {data['baseline_latency_ms']}ms")
    print(f" Optimized: {data['optimized_latency_ms']}ms")
    print(f" Speedup: {data['speedup_factor']}×")
    print(f" Reduction: {data['latency_reduction_percent']}%")

    # Test query
    query = requests.post(
        f"{base_url}/query",
        json={"question": "What is machine learning?"},
        timeout=timeout,
    )
    query.raise_for_status()
    # Decode the body once and reuse it for both printed fields.
    result = query.json()
    print("\nQuery Response:")
    print(f" Latency: {result['latency_ms']}ms")
    print(f" Speedup: {result['optimization']}")
# Script entry point: run the checks only when this file is executed
# directly, not when it is imported.
if __name__ == "__main__":
    test_api()