Spaces:

csong03
/

14c_chatbot

Runtime error

csong03

Initial Space upload with LFS-tracked binaries

9e118e4 3 months ago

4.46 kB

	"""
	Shared assertion helpers for BPS chatbot evaluation tests.

	All helpers accept a response string and return a bool or numeric value.
	Use them inside test functions with plain `assert` statements so pytest
	gives a clean failure message.
	"""

	import re
	from typing import List


	def contains_any(response: str, keywords: List[str]) -> bool:
	"""Return True if response contains at least one keyword (case-insensitive)."""
	lower = response.lower()
	return any(kw.lower() in lower for kw in keywords)


	def contains_all(response: str, keywords: List[str]) -> bool:
	"""Return True if response contains every keyword (case-insensitive)."""
	lower = response.lower()
	return all(kw.lower() in lower for kw in keywords)


	def contains_question(response: str) -> bool:
	"""Return True if the response contains at least one question mark."""
	return "?" in response


	def count_school_names(response: str, known_schools: List[str]) -> int:
	"""
	Count how many school names from known_schools appear in response.
	Matching is case-insensitive.
	"""
	lower = response.lower()
	return sum(1 for school in known_schools if school.lower() in lower)


	def has_numbered_list(response: str) -> bool:
	"""
	Return True if response contains a numbered list item like:
	'1.' or '1)' at the start of a line (ignoring leading whitespace).
	"""
	return bool(re.search(r'^\s*\d+[.)]\s+\S', response, re.MULTILINE))


	def has_bulleted_list(response: str) -> bool:
	"""Return True if response contains a bullet point (-, *, •) list item."""
	return bool(re.search(r'^\s[-•]\s+\S', response, re.MULTILINE))


	def has_list(response: str) -> bool:
	"""Return True if response has either a numbered or bulleted list."""
	return has_numbered_list(response) or has_bulleted_list(response)


	def schools_overlap(response: str, db_results: list, min_overlap: int = 1) -> bool:
	"""
	Return True if at least min_overlap schools from db_results appear in response.

	db_results should be the list returned by BPSDatabase methods; each item
	is a dict with a 'school' key.
	"""
	lower = response.lower()
	matched = sum(
	1 for r in db_results
	if isinstance(r, dict) and r.get("school", "").lower() in lower
	)
	return matched >= min_overlap


	def not_gatekeeping(response: str) -> bool:
	"""
	Return True if response does NOT refuse to help without an address.
	Catches patterns like "I can't help without your address" or
	"need your address to" etc.
	"""
	gatekeep_patterns = [
	r"can'?t help without.{0,20}address",
	r"need.{0,20}address.{0,20}(first\|before\|to)",
	r"(without\|unless).{0,30}address",
	r"provide.{0,20}address.{0,20}(first\|before)",
	]
	lower = response.lower()
	return not any(re.search(p, lower) for p in gatekeep_patterns)


	def no_specific_school_recommendation(response: str, known_schools: List[str]) -> bool:
	"""
	Return True if response does NOT mention specific school names.
	Used for Partition 1: the bot should NOT recommend schools when
	eligibility is unknown.
	"""
	lower = response.lower()
	return not any(school.lower() in lower for school in known_schools)


	def asks_about_grade_or_age(response: str) -> bool:
	"""Return True if response asks about grade level or child's age."""
	patterns = [
	r'grade',
	r'\bage\b',
	r'year.{0,5}old',
	r'how old',
	r'kindergarten\|k-\d\|grade \d',
	]
	lower = response.lower()
	return any(re.search(p, lower) for p in patterns)


	def count_recommended_schools(response: str, known_schools: List[str]) -> int:
	"""Count how many known school names appear in the response."""
	return count_school_names(response, known_schools)


	def references_specific_attributes(response: str) -> bool:
	"""
	Return True if the response references concrete school attributes
	like language programs, after-school care, uniforms, AP, IB, etc.
	"""
	attribute_keywords = [
	"language", "spanish", "bilingual", "immersion",
	"after.?school", "surround care",
	"uniform", "no uniform",
	"advanced placement", r"\bap\b",
	"international baccalaureate", r"\bib\b",
	"arts", "stem", "math", "science",
	"special education", "ada",
	]
	lower = response.lower()
	return any(re.search(kw, lower) for kw in attribute_keywords)