Spaces:

satomito
/

contract-clause-analyzer

Paused

App Files Files Community

contract-clause-analyzer / tests /test_benchmark.py

satomitheito

hf streamlit

908ff10 28 days ago

raw

history blame contribute delete

3.56 kB

	"""Test the benchmark agent with sample classified clauses."""

	import json
	import os
	from agents.benchmark_agent import benchmark_clause, benchmark_node

	OUTPUT_DIR = os.path.join(os.path.dirname(__file__), "..", "outputs")

	SAMPLE_RISK_SCORED_CLAUSES = [
	{
	"id": 1,
	"text": "This Agreement shall be governed by and construed in accordance with the laws of the State of Delaware.",
	"section": "General",
	"clause_type": "Governing Law",
	"confidence": 0.99,
	"risk_score": 0.20,
	"risk_factors": ["Missing forum selection clause"],
	},
	{
	"id": 2,
	"text": "During the term of this Agreement and for a period of two years thereafter, the Employee shall not directly or indirectly engage in any business that competes with the Company.",
	"section": "Restrictive Covenants",
	"clause_type": "Non-Compete",
	"confidence": 0.95,
	"risk_score": 0.72,
	"risk_factors": ["Overly broad scope", "No geographic limitation"],
	},
	{
	"id": 3,
	"text": "Either party may terminate this Agreement at any time upon thirty (30) days prior written notice to the other party.",
	"section": "Termination",
	"clause_type": "Termination For Convenience",
	"confidence": 0.95,
	"risk_score": 0.75,
	"risk_factors": ["No wind-down costs", "No cure period"],
	},
	{
	"id": 4,
	"text": "The Company shall indemnify and hold harmless the Contractor from any claims, damages, or expenses arising from the Company's breach of this Agreement.",
	"section": "Liability",
	"clause_type": "Indemnification",
	"confidence": 0.95,
	"risk_score": 0.72,
	"risk_factors": ["One-directional only", "Narrow scope"],
	},
	{
	"id": 5,
	"text": "The Licensor grants to the Licensee a non-exclusive, non-transferable license to use the Software solely for internal business purposes.",
	"section": "License",
	"clause_type": "Non-Transferable License",
	"confidence": 0.95,
	"risk_score": 0.65,
	"risk_factors": ["Undefined internal business purposes"],
	},
	]


	def test_single_benchmark():
	"""Test benchmarking a single clause."""
	clause = SAMPLE_RISK_SCORED_CLAUSES[1] # Non-compete
	result = benchmark_clause(clause["text"], clause["clause_type"])
	print(f"Clause: {clause['text'][:80]}...")
	print(f"Type: {clause['clause_type']}")
	print(f"Similarity: {result['benchmark_similarity']}")
	print(f"Deviations: {result['deviations']}")
	print(f"Standard: {result['standard_language_summary']}")
	print(f"Why: {result['reasoning']}")
	print()


	def test_benchmark_node():
	"""Test the full LangGraph node with multiple clauses."""
	state = {"risk_scores": SAMPLE_RISK_SCORED_CLAUSES}
	result = benchmark_node(state)

	print(f"{'ID':<4} {'Type':<30} {'Similarity':<12} {'Source'}")
	print("-" * 80)
	for clause in result["benchmark_results"]:
	print(f"{clause['id']:<4} {clause['clause_type']:<30} {clause['benchmark_similarity']:<12.2f} {clause['benchmark_source']}")

	output_path = os.path.join(OUTPUT_DIR, "benchmark_results.json")
	with open(output_path, "w") as f:
	json.dump(result["benchmark_results"], f, indent=2)
	print(f"\nResults saved to {output_path}")


	if __name__ == "__main__":
	print("Single Clause Benchmark Test\n")
	test_single_benchmark()

	print("Full Node Test\n")
	test_benchmark_node()