al1808th
/

stanza-digphil

Model card Files Files and versions

stanza-digphil / stanza /server /parser_eval.py

Albin Thörn Cleland

Clean initial commit with LFS

19b8775 about 1 month ago

history blame contribute delete

3.03 kB

	"""
	This class runs a Java process to evaluate a treebank prediction using CoreNLP
	"""

	from collections import namedtuple
	import sys

	import stanza
	from stanza.protobuf import EvaluateParserRequest, EvaluateParserResponse
	from stanza.server.java_protobuf_requests import send_request, build_tree, JavaProtobufContext
	from stanza.models.constituency.tree_reader import read_treebank

	EVALUATE_JAVA = "edu.stanford.nlp.parser.metrics.EvaluateExternalParser"

	ParseResult = namedtuple("ParseResult", ['gold', 'predictions', 'state', 'constituents'])
	ScoredTree = namedtuple("ScoredTree", ['tree', 'score'])

	def build_request(treebank):
	"""
	treebank should be a list of pairs: [gold, predictions]
	each predictions is a list of tuples (prediction, score, state)
	state is ignored and can be None
	Note that for now, only one tree is measured, but this may be extensible in the future
	Trees should be in the form of a Tree from parse_tree.py
	"""
	request = EvaluateParserRequest()
	for raw_result in treebank:
	gold = raw_result.gold
	predictions = raw_result.predictions
	parse_result = request.treebank.add()
	parse_result.gold.CopyFrom(build_tree(gold, None))
	for pred in predictions:
	if isinstance(pred, tuple):
	prediction, score = pred
	else:
	prediction = pred
	score = None
	try:
	parse_result.predicted.append(build_tree(prediction, score))
	except Exception as e:
	raise RuntimeError("Unable to build parser request from tree {}".format(pred)) from e

	return request

	def collate(gold_treebank, predictions_treebank):
	"""
	Turns a list of gold and prediction into a evaluation object
	"""
	treebank = []
	for gold, prediction in zip(gold_treebank, predictions_treebank):
	result = ParseResult(gold, [prediction], None, None)
	treebank.append(result)
	return treebank


	class EvaluateParser(JavaProtobufContext):
	"""
	Parser evaluation context window

	This is a context window which keeps a process open. Should allow
	for multiple requests without launching new java processes each time.
	"""
	def __init__(self, classpath=None, kbest=None, silent=False):
	if kbest is not None:
	extra_args = ["-evalPCFGkBest", "{}".format(kbest), "-evals", "pcfgTopK"]
	else:
	extra_args = []

	if silent:
	extra_args.extend(["-evals", "summary=False"])

	super(EvaluateParser, self).__init__(classpath, EvaluateParserResponse, EVALUATE_JAVA, extra_args=extra_args)

	def process(self, treebank):
	request = build_request(treebank)
	return self.process_request(request)


	def main():
	gold = read_treebank(sys.argv[1])
	predictions = read_treebank(sys.argv[2])
	treebank = collate(gold, predictions)

	with EvaluateParser() as ep:
	ep.process(treebank)


	if __name__ == '__main__':
	main()