Spaces:

kanhacoderx
/

SHL-Assessment-Recommender

Sleeping

App Files Files Community

SHL-Assessment-Recommender / app /agent.py

kanhacoderx

Update app/agent.py

c199958 verified 15 days ago

raw

history blame contribute delete

9.49 kB

	from typing import List, Dict, Any
	import json
	from pathlib import Path
	from typing import List, Dict, Any


	# Location of the SHL catalog JSON file. The path is relative, so it is
	# resolved against the current working directory of the running process.
	CATALOG_PATH = Path("data/shl_catalog.json")


	def load_catalog() -> List[Dict[str, Any]]:
	    """Read the catalog JSON file and return its parsed contents.

	    Returns:
	        An empty list when ``CATALOG_PATH`` does not exist; otherwise
	        whatever ``json.load`` produces for the file, returned unchanged.
	    """
	    if CATALOG_PATH.exists():
	        with open(CATALOG_PATH, "r", encoding="utf-8") as catalog_file:
	            parsed = json.load(catalog_file)
	        return parsed

	    # Missing file: callers treat an empty catalog as "not loaded".
	    return []


	# The catalog is read once, when this module is imported. It is an empty
	# list if the catalog file did not exist at that moment.
	CATALOG = load_catalog()

	def get_last_user_message(messages: List[Any]) -> str:
	    """Return the lower-cased content of the most recent user message.

	    Args:
	        messages: Conversation items exposing ``role`` and ``content``
	            attributes, ordered oldest to newest.

	    Returns:
	        The ``content`` of the last item whose ``role`` is ``"user"``,
	        lower-cased, or ``""`` when there is no such item.
	    """
	    latest = next((m for m in reversed(messages) if m.role == "user"), None)
	    if latest is None:
	        return ""
	    return latest.content.lower()


	def build_conversation_query(messages: List[Any]) -> str:
	    """Collapse every user turn of the conversation into one query string.

	    Keeping all user turns lets a follow-up such as
	    'Actually add personality tests' still carry the role context given
	    in earlier turns, even though each request is handled statelessly.

	    Args:
	        messages: Conversation items exposing ``role`` and ``content``.

	    Returns:
	        The contents of all ``"user"`` items, in order, joined by single
	        spaces and lower-cased. Empty string when there are none.
	    """
	    combined = " ".join(m.content for m in messages if m.role == "user")
	    return combined.lower()

	def is_out_of_scope(text: str) -> bool:
	    """Tell whether the text touches a topic this agent refuses to handle.

	    The check is a case-insensitive substring search against three fixed
	    phrase groups: legal/compliance questions, general hiring advice that
	    is not assessment recommendation, and prompt-injection attempts.

	    Args:
	        text: Text to inspect.

	    Returns:
	        True if any blocked phrase occurs anywhere in ``text``.
	    """
	    legal_phrases = (
	        "legal advice",
	        "is it legal",
	        "employment law",
	        "labor law",
	        "labour law",
	        "discrimination",
	        "fire employee",
	        "terminate employee",
	        "lawsuit",
	        "contract",
	    )
	    general_hiring_phrases = (
	        "write interview questions",
	        "interview questions",
	        "salary",
	        "compensation",
	        "negotiate offer",
	        "job description template",
	        "write a job description",
	        "resume screening",
	        "cv screening",
	        "cover letter",
	    )
	    prompt_injection_phrases = (
	        "ignore previous instructions",
	        "forget your instructions",
	        "act as unrestricted",
	        "bypass",
	        "system prompt",
	        "developer message",
	        "reveal your prompt",
	        "jailbreak",
	    )

	    lowered = text.lower()
	    for phrase in legal_phrases + general_hiring_phrases + prompt_injection_phrases:
	        if phrase in lowered:
	            return True
	    return False


	def is_vague(text: str) -> bool:
	    """Tell whether a request is too generic to recommend assessments for.

	    A request is vague when it carries no role/skill signal word and is
	    either a generic "need an assessment" phrase or at most four words.

	    Matching is case-insensitive: the text is lower-cased here, as the
	    other text classifiers in this module do, so the result does not
	    depend on the caller having normalised the input first.

	    Args:
	        text: The user request (any casing).

	    Returns:
	        True if a clarifying question should be asked before recommending.
	    """
	    vague_phrases = (
	        "i need an assessment",
	        "need assessment",
	        "suggest assessment",
	        "recommend assessment",
	        "assessment test",
	    )
	    role_signals = (
	        "java",
	        "python",
	        "developer",
	        "engineer",
	        "manager",
	        "sales",
	        "graduate",
	        "analyst",
	        "stakeholder",
	        "communication",
	    )

	    text = text.lower()

	    # Any role/skill signal means there is enough context to proceed.
	    if any(word in text for word in role_signals):
	        return False

	    if any(phrase in text for phrase in vague_phrases):
	        return True

	    # Very short requests without a role signal (including empty text).
	    return len(text.split()) <= 4


	def score_catalog_item(query: str, item: Dict[str, Any]) -> int:
	    """Score how well one catalog entry matches a free-text query.

	    Scoring rules (all matching is case-insensitive substring matching
	    against the entry's name, description and keywords):

	    * +1 for every query word longer than two characters found in the entry.
	    * +3 for every known skill term present in both query and entry.
	    * +3 if the query asks about personality/behaviour and the entry is
	      test type "P" or mentions "personality" or "opq".
	    * +3 if the query asks about cognitive ability and the entry is test
	      type "A" or mentions "ability".

	    Args:
	        query: The user query (any casing).
	        item: A catalog entry; the ``name``, ``description``, ``keywords``
	            and ``test_type`` keys are read, and each may be missing or null.

	    Returns:
	        A non-negative relevance score; 0 means no match.
	    """
	    query = query.lower()

	    # `or` covers keys that are present but null in the catalog JSON.
	    name = str(item.get("name") or "").lower()
	    description = str(item.get("description") or "").lower()
	    # Keywords are lower-cased too, so "Java" in the catalog matches "java".
	    keywords = " ".join(str(k) for k in (item.get("keywords") or [])).lower()

	    searchable_text = f"{name} {description} {keywords}"

	    score = sum(
	        1
	        for word in query.split()
	        if len(word) > 2 and word in searchable_text
	    )

	    # Strong skill boosts
	    skill_terms = (
	        "java", "python", "sql", "javascript", "developer",
	        "coding", "programming", "software", "backend",
	    )
	    score += 3 * sum(
	        1
	        for skill in skill_terms
	        if skill in query and skill in searchable_text
	    )

	    # Personality / behavior boost
	    personality_terms = ("personality", "communication", "stakeholder", "leadership")
	    if any(term in query for term in personality_terms):
	        if (
	            item.get("test_type") == "P"
	            or "personality" in searchable_text
	            or "opq" in searchable_text
	        ):
	            score += 3

	    # Cognitive / aptitude boost
	    cognitive_terms = ("cognitive", "aptitude", "reasoning", "ability")
	    if any(term in query for term in cognitive_terms):
	        if item.get("test_type") == "A" or "ability" in searchable_text:
	            score += 3

	    return score

	def recommend(query: str) -> List[Dict[str, str]]:
	    """Return up to ten catalog entries that best match the query.

	    Every entry in ``CATALOG`` is scored with ``score_catalog_item``;
	    entries scoring zero or less are dropped and the rest are ordered by
	    descending score (ties keep catalog order).

	    Args:
	        query: The text to match against the catalog.

	    Returns:
	        A list of at most ten dicts with ``name``, ``url`` and
	        ``test_type`` keys, best match first.
	    """
	    scored = [(score_catalog_item(query, entry), entry) for entry in CATALOG]
	    ranked = sorted(
	        (pair for pair in scored if pair[0] > 0),
	        key=lambda pair: pair[0],
	        reverse=True,
	    )

	    return [
	        {
	            "name": entry.get('name', ''),
	            "url": entry.get('url', ''),
	            "test_type": entry.get('test_type', 'unknown'),
	        }
	        for _, entry in ranked[:10]
	    ]

	def is_compare_query(text: str) -> bool:
	    """Tell whether the text asks for a comparison between assessments.

	    Multi-character comparison phrases are matched as case-insensitive
	    substrings. The abbreviation "vs" is matched only as a standalone
	    word (so "OPQ vs Verify" and "A vs. B" qualify), because as a bare
	    substring it also occurs inside ordinary words such as "devs".

	    Args:
	        text: The user request (any casing).

	    Returns:
	        True if the request should be routed to the comparison path.
	    """
	    compare_phrases = (
	        "difference between",
	        "compare",
	        "versus",
	        "different from",
	        "which is better",
	    )

	    text = text.lower()
	    if any(phrase in text for phrase in compare_phrases):
	        return True

	    # Turn punctuation into spaces so "vs.", "(vs)" and "a-vs-b" all yield
	    # the token "vs", while words merely containing "vs" do not.
	    words = "".join(ch if ch.isalnum() else " " for ch in text).split()
	    return "vs" in words


	def find_matching_assessments(text: str, limit: int = 5) -> List[Dict[str, Any]]:
	    """Find the catalog entries that the text most likely refers to.

	    Each whitespace-separated token longer than two characters earns an
	    entry 3 points when it occurs in the entry's name, otherwise 1 point
	    when it occurs in the name/description/keywords text. Matching is
	    case-insensitive substring matching.

	    Args:
	        text: Free text that may mention assessment names.
	        limit: Maximum number of entries to return.

	    Returns:
	        Entries from ``CATALOG`` with a positive score, highest score
	        first (ties keep catalog order), truncated to ``limit``.
	    """
	    tokens = [tok for tok in text.lower().split() if len(tok) > 2]
	    ranked = []

	    for entry in CATALOG:
	        title = entry.get("name", "").lower()
	        blurb = entry.get("description", "").lower()
	        tags = " ".join(entry.get("keywords", [])).lower()
	        haystack = f"{title} {blurb} {tags}"

	        # A hit in the name outweighs a hit anywhere else in the entry.
	        points = sum(
	            3 if tok in title else (1 if tok in haystack else 0)
	            for tok in tokens
	        )

	        if points > 0:
	            ranked.append((points, entry))

	    ranked.sort(key=lambda pair: pair[0], reverse=True)

	    return [entry for _, entry in ranked[:limit]]





	def compare_assessments(query: str) -> Dict[str, Any]:
	    """Build a comparison reply for the two best-matching assessments.

	    Looks up candidates with ``find_matching_assessments`` and compares
	    the top two using only their catalog name, description (first 300
	    characters) and test type.

	    Args:
	        query: The user's comparison request.

	    Returns:
	        A response dict with ``reply``, ``recommendations`` and
	        ``end_of_conversation`` keys. When fewer than two candidates are
	        found, the reply asks for both assessment names and the
	        recommendation list is empty.
	    """
	    candidates = find_matching_assessments(query, limit=4)

	    if len(candidates) < 2:
	        return {
	            "reply": "I can compare SHL assessments, but I need two assessment names from the catalog. Please mention both assessments you want to compare.",
	            "recommendations": [],
	            "end_of_conversation": False,
	        }

	    first, second = candidates[0], candidates[1]

	    first_name = first.get("name", "Assessment 1")
	    second_name = second.get("name", "Assessment 2")

	    first_desc = first.get("description", "")
	    second_desc = second.get("description", "")

	    reply = "".join(
	        [
	            "Here is a catalog-grounded comparison:\n\n",
	            f"{first_name} focuses on: {first_desc[:300] if first_desc else 'description not available in catalog data'}\n",
	            f"Test type: {first.get('test_type', 'Unknown')}\n\n",
	            f"{second_name} focuses on: {second_desc[:300] if second_desc else 'description not available in catalog data'}\n",
	            f"Test type: {second.get('test_type', 'Unknown')}\n\n",
	            f"Use {first_name} when the role requirement matches its catalog description. ",
	            f"Use {second_name} when the hiring need is closer to its catalog description.",
	        ]
	    )

	    compared = [
	        {
	            "name": entry.get("name", ""),
	            "url": entry.get("url", ""),
	            "test_type": entry.get("test_type", "Unknown"),
	        }
	        for entry in (first, second)
	    ]

	    return {
	        "reply": reply,
	        "recommendations": compared,
	        "end_of_conversation": False,
	    }


	def _agent_response(reply: str, recommendations: Any = None) -> Dict[str, Any]:
	    """Wrap a reply and optional recommendations in the agent response shape."""
	    return {
	        "reply": reply,
	        "recommendations": recommendations if recommendations is not None else [],
	        "end_of_conversation": False,
	    }


	def run_agent(messages: List[Any]) -> Dict[str, Any]:
	    """Produce the agent's reply for a stateless conversation history.

	    Decision order:
	      1. No user text at all -> ask for the role or skills.
	      2. Latest user message is out of scope -> refuse.
	      3. Conversation so far is too vague -> ask a clarifying question.
	      4. Catalog not loaded -> say so, never invent assessments.
	      5. Latest user message asks for a comparison -> compare.
	      6. Otherwise recommend from the whole conversation's context.

	    Args:
	        messages: Conversation items exposing ``role`` and ``content``,
	            ordered oldest to newest.

	    Returns:
	        A dict with ``reply`` (str), ``recommendations`` (list) and
	        ``end_of_conversation`` (always False here).
	    """
	    query = build_conversation_query(messages)
	    last_user_query = get_last_user_message(messages)

	    if not query:
	        return _agent_response(
	            "Please share the role or skills you want to assess using SHL assessments."
	        )

	    # Scope is judged on the latest user turn only. Checking the whole
	    # joined history would make one off-topic question earlier in the
	    # conversation block every later, legitimate request.
	    if is_out_of_scope(last_user_query):
	        return _agent_response(
	            "I can only help with SHL assessment recommendations, comparisons, and refinements based on the SHL catalog."
	        )

	    # Vagueness uses the full history so earlier role context still counts.
	    if is_vague(query):
	        return _agent_response(
	            "Sure. Which role, skill area, and seniority level are you hiring for?"
	        )

	    # Important safety check
	    # If real SHL catalog JSON is missing or not loaded, don't crash and don't hallucinate.
	    if not CATALOG:
	        return _agent_response(
	            "The SHL catalog is not loaded yet. Please try again after the catalog data is available."
	        )

	    if is_compare_query(last_user_query):
	        return compare_assessments(last_user_query)

	    recommendations = recommend(query)

	    if recommendations:
	        return _agent_response(
	            f"Based on the role details, here are {len(recommendations)} SHL assessments that may fit this hiring need.",
	            recommendations,
	        )

	    return _agent_response(
	        "Could you share the target role, required skills, and seniority level so I can recommend relevant SHL assessments?"
	    )