# Table of fixture cases. Each entry carries:
#   "generations": list of generated answer strings, one per example
#   "golds":       list of gold-answer lists, positionally paired with "generations"
#   "keywords":    list of the answer keywords relevant to the case
#   "strict":      boolean flag; the second and third cases differ only in this flag
#   "result":      expected metric output, a dict with an "accuracy" float
# The scoring function that consumes these cases is not visible in this file —
# presumably a keyword-matching accuracy metric; confirm against the caller.
test_cases = [
    {
        "generations": ["yes", "no"],
        "golds": [["yes"], ["yes"]],
        "keywords": ["yes", "no"],
        "strict": True,
        # NOTE(review): the second generation is "no" while its gold is ["yes"],
        # yet the expected accuracy is 1.0 — verify against the metric whether
        # this should be 0.5 (or whether the second gold should be ["no"]).
        "result": {"accuracy": 1.0},
    },
    {
        "generations": ["[up, left]", "[right]"],
        "golds": [["up", "left"], ["right", "down"]],
        "keywords": ["up", "left", "right", "down"],
        "strict": True,
        # "[right]" lacks "down" from its gold list; expected accuracy here is 0.5.
        "result": {"accuracy": 0.5},
    },
    {
        # Same inputs as the previous case, but with "strict" disabled the
        # expected accuracy is 1.0.
        "generations": ["[up, left]", "[right]"],
        "golds": [["up", "left"], ["right", "down"]],
        "keywords": ["up", "left", "right", "down"],
        "strict": False,
        "result": {"accuracy": 1.0},
    },
]