"""Debug helper for the recommendation API.

Reads the first query from the ``Train-Set`` sheet of the dataset workbook,
posts it to the recommendation endpoint, and prints the ground-truth URLs,
the predicted URLs and the overlap between the two.
"""

import pandas as pd
import requests

API_URL = "http://localhost:8001/recommend"
FILE_PATH = "/home/a-dheeraj/Desktop/work/assesment-shl/shl-assesment/Gen_AI Dataset.xlsx"

# Seconds to wait for the API. Without an explicit timeout ``requests`` will
# wait indefinitely, which makes a hung server look like a hung script.
REQUEST_TIMEOUT = 30


def _normalize_url(url) -> str:
    """Return *url* as text without surrounding whitespace or a trailing '/'.

    ``str()`` is applied first so that a non-string value (e.g. ``None`` in an
    API response) cannot raise ``AttributeError`` during comparison.
    """
    return str(url).strip().rstrip('/')


def _print_urls(urls) -> None:
    """Print every URL in *urls* as a quoted bullet line."""
    for url in urls:
        print(f" - '{url}'")


def debug_first_query(
    api_url: str = API_URL,
    file_path: str = FILE_PATH,
    timeout: float = REQUEST_TIMEOUT,
) -> None:
    """Compare API predictions with the ground truth for the first query.

    Args:
        api_url: Recommendation endpoint that receives ``{"query": ...}`` as
            a JSON POST body.
        file_path: Excel workbook containing a ``Train-Set`` sheet with
            ``Query`` and ``Assessment_url`` columns.
        timeout: Seconds to wait for the API before giving up.

    Request failures and malformed responses are reported on stdout instead
    of being raised, so the function stays usable as a quick diagnostic.
    Errors while reading the workbook are not caught.
    """
    print("Loading Train-Set...")
    df = pd.read_excel(file_path, sheet_name='Train-Set')

    # An empty sheet would otherwise fail with IndexError on ``iloc[0]``.
    if df.empty:
        print("Train-Set sheet is empty; nothing to debug.")
        return

    # Get first query
    first_query = df.iloc[0]['Query']
    # Blank cells are read as NaN (a float); drop them so they are neither
    # listed as URLs nor break the string normalization below.
    ground_truth_urls = (
        df.loc[df['Query'] == first_query, 'Assessment_url'].dropna().tolist()
    )

    print(f"\nQuery: {first_query}")
    print(f"Ground Truth URLs ({len(ground_truth_urls)}):")
    _print_urls(ground_truth_urls)

    # Call API
    print("\nCalling API...")
    try:
        response = requests.post(
            api_url, json={"query": first_query}, timeout=timeout
        )
        response.raise_for_status()
        preds = response.json()
        # The response is read as a JSON list of objects carrying a 'url' key.
        pred_urls = [p['url'] for p in preds]
    except (requests.RequestException, ValueError, KeyError, TypeError) as e:
        # RequestException: connection/timeout/HTTP status errors.
        # ValueError: body is not valid JSON.
        # KeyError/TypeError: JSON does not have the expected shape.
        print(f"Error: {e}")
        return

    print(f"Predicted URLs ({len(pred_urls)}):")
    _print_urls(pred_urls)

    # Check intersection (whitespace and trailing slashes are ignored)
    gt_set = {_normalize_url(u) for u in ground_truth_urls}
    pred_set = {_normalize_url(u) for u in pred_urls}
    intersection = gt_set & pred_set

    print(f"\nIntersection ({len(intersection)}):")
    _print_urls(intersection)


if __name__ == "__main__":
    debug_first_query()