# Captured from a "Spaces" file-viewer page; status shown at capture time: "Runtime error".
# File size: 10,448 bytes; revision 3951d64.
import requests
import json
import time
import asyncio
from typing import Dict, List
import logging
from concurrent.futures import ThreadPoolExecutor
# Configure logging: install the root handler at INFO level as an import-time
# side effect, then create the module-level logger the tests report through.
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
class RAGSystemTester:
def __init__(self, base_url: str = "http://localhost:8000", bearer_token: str = None):
self.base_url = base_url
self.bearer_token = bearer_token or "dbbdb701cfc45d4041e22a03edbfc65753fe9d7b4b9ba1df4884e864f3bb934d"
self.headers = {
"Authorization": f"Bearer {self.bearer_token}",
"Content-Type": "application/json"
}
self.executor = ThreadPoolExecutor(max_workers=3)
def test_health_check(self) -> bool:
"""Test health check endpoint"""
try:
response = requests.get(f"{self.base_url}/health", timeout=10)
if response.status_code == 200:
data = response.json()
print(f"β
Health check passed: {data}")
return True
else:
print(f"β Health check failed: Status {response.status_code}")
logger.error(f"Health check failed with status: {response.status_code}")
return False
except Exception as e:
print(f"β Health check error: {str(e)}")
logger.error(f"Health check error: {str(e)}")
return False
def test_metrics_endpoint(self) -> bool:
"""Test metrics endpoint"""
try:
response = requests.get(f"{self.base_url}/metrics", headers=self.headers, timeout=10)
if response.status_code == 200:
data = response.json()
print(f"β
Metrics endpoint passed: {json.dumps(data, indent=2)}")
return True
else:
print(f"β Metrics endpoint failed: Status {response.status_code}")
logger.error(f"Metrics endpoint failed with status: {response.status_code}")
return False
except Exception as e:
print(f"β Metrics endpoint error: {str(e)}")
logger.error(f"Metrics endpoint error: {str(e)}")
return False
def test_sample_query(self) -> bool:
"""Test with the provided sample data"""
sample_data = {
"documents": "https://hackrx.blob.core.windows.net/assets/Arogya%20Sanjeevani%20Policy%20-%20CIN%20-%20U10200WB1906GOI001713%201.pdf?sv=2023-01-03&st=2025-07-21T08%3A29%3A02Z&se=2025-09-22T08%3A29%3A00Z&sr=b&sp=r&sig=nzrz1K9Iurt%2BBXom%2FB%2BMPTFMFP3PRnIvEsipAX10Ig4%3D",
"questions": [
"What is the grace period for premium payment under the National Parivar Mediclaim Plus Policy?",
"What is the waiting period for pre-existing diseases (PED) to be covered?",
"Does this policy cover maternity expenses, and what are the conditions?",
"What is the waiting period for cataract surgery?",
"Are the medical expenses for an organ donor covered under this policy?",
"What is the No Claim Discount (NCD) offered in this policy?",
"Is there a benefit for preventive health check-ups?",
"How does the policy define a 'Hospital'?",
"What is the extent of coverage for AYUSH treatments?",
"Are there any sub-limits on room rent and ICU charges for Plan A?"
]
}
try:
print("π Testing sample query...")
start_time = time.time()
response = requests.post(
f"{self.base_url}/hackrx/run",
headers=self.headers,
json=sample_data,
timeout=120
)
end_time = time.time()
latency = end_time - start_time
if response.status_code == 200:
data = response.json()
answers = data.get("answers", [])
print(f"β
Sample query successful (Latency: {latency:.2f}s)")
print(f"π Received {len(answers)} answers")
# Print all answers for validation
for i, (question, answer) in enumerate(zip(sample_data['questions'], answers)):
print(f"Q{i+1}: {question}")
print(f"A{i+1}: {answer[:200]}..." if len(answer) > 200 else f"A{i+1}: {answer}")
print("-" * 50)
# Validate that we received answers for all questions
if len(answers) == len(sample_data['questions']):
print("β
All questions answered")
return True
else:
print(f"β Incomplete response: Expected {len(sample_data['questions'])} answers, got {len(answers)}")
logger.warning(f"Incomplete response: Expected {len(sample_data['questions'])} answers, got {len(answers)}")
return False
else:
print(f"β Sample query failed: Status {response.status_code}")
print(f"Response: {response.text}")
logger.error(f"Sample query failed: Status {response.status_code}, Response: {response.text}")
return False
except Exception as e:
print(f"β Sample query error: {str(e)}")
logger.error(f"Sample query error: {str(e)}")
return False
async def test_concurrent_queries(self, num_requests: int = 3) -> bool:
"""Test system under concurrent load"""
async def make_request():
try:
response = requests.post(
f"{self.base_url}/hackrx/run",
headers=self.headers,
json={
"documents": "https://hackrx.blob.core.windows.net/assets/Arogya%20Sanjeevani%20Policy%20-%20CIN%20-%20U10200WB1906GOI001713%201.pdf?sv=2023-01-03&st=2025-07-21T08%3A29%3A02Z&se=2025-09-22T08%3A29%3A00Z&sr=b&sp=r&sig=nzrz1K9Iurt%2BBXom%2FB%2BMPTFMFP3PRnIvEsipAX10Ig4%3D",
"questions": ["What is the grace period for premium payment?"]
},
timeout=60
)
return response.status_code == 200
except Exception as e:
logger.error(f"Concurrent query error: {str(e)}")
return False
print(f"π Testing {num_requests} concurrent queries...")
tasks = [make_request() for _ in range(num_requests)]
results = await asyncio.gather(*tasks, return_exceptions=True)
success_count = sum(1 for result in results if result is True)
print(f"β
Concurrent test completed: {success_count}/{num_requests} successful")
return success_count == num_requests
def test_invalid_token(self) -> bool:
"""Test authentication with invalid token"""
try:
invalid_headers = {
"Authorization": "Bearer invalid_token",
"Content-Type": "application/json"
}
response = requests.post(
f"{self.base_url}/hackrx/run",
headers=invalid_headers,
json={
"documents": "https://hackrx.blob.core.windows.net/assets/Arogya%20Sanjeevani%20Policy%20-%20CIN%20-%20U10200WB1906GOI001713%201.pdf?sv=2023-01-03&st=2025-07-21T08%3A29%3A02Z&se=2025-09-22T08%3A29%3A00Z&sr=b&sp=r&sig=nzrz1K9Iurt%2BBXom%2FB%2BMPTFMFP3PRnIvEsipAX10Ig4%3D",
"questions": ["Test question"]
},
timeout=10
)
if response.status_code == 401:
print("β
Invalid token test passed: Correctly rejected")
return True
else:
print(f"β Invalid token test failed: Expected 401, got {response.status_code}")
logger.warning(f"Invalid token test failed: Expected 401, got {response.status_code}")
return False
except Exception as e:
print(f"β Invalid token test error: {str(e)}")
logger.error(f"Invalid token test error: {str(e)}")
return False
def test_invalid_url(self) -> bool:
"""Test with invalid document URL"""
try:
response = requests.post(
f"{self.base_url}/hackrx/run",
headers=self.headers,
json={
"documents": "https://invalid-url-that-does-not-exist.com/fake.pdf", # Actually invalid URL
"questions": ["Test question"]
},
timeout=30
)
# Accept either 400 or 500 as valid error responses for invalid URLs
if response.status_code in [400, 500]:
print("β
Invalid URL test passed: Correctly handled")
return True
else:
print(f"β Invalid URL test failed: Expected 400/500, got {response.status_code}")
logger.warning(f"Invalid URL test failed: Expected 400/500, got {response.status_code}")
return False
except Exception as e:
print(f"β Invalid URL test error: {str(e)}")
logger.error(f"Invalid URL test error: {str(e)}")
return False
async def run_all_tests(self):
"""Run all test cases"""
print("π Starting RAG System Tests")
print("=" * 50)
results = {
"health_check": self.test_health_check(),
"metrics_endpoint": self.test_metrics_endpoint(),
"sample_query": self.test_sample_query(),
"concurrent_queries": await self.test_concurrent_queries(),
"invalid_token": self.test_invalid_token(),
"invalid_url": self.test_invalid_url()
}
print("\nπ Test Summary")
print("=" * 50)
passed = sum(1 for result in results.values() if result)
total = len(results)
for test_name, passed in results.items():
status = "β
PASSED" if passed else "β FAILED"
print(f"{test_name}: {status}")
print(f"\nπ― Overall: {passed}/{total} tests passed")
return passed == total
def main() -> bool:
    """Run the full test suite against the default local server.

    Returns:
        The value reported by ``RAGSystemTester.run_all_tests`` so callers
        can act on the outcome instead of it being discarded.
    """
    tester = RAGSystemTester()
    return asyncio.run(tester.run_all_tests())
# Script entry point: run the suite only when executed directly, not on import.
if __name__ == "__main__":
    main()