AML_env / graders /aml_easy.py
DataBoySu
all set
81e1efb
raw
history blame contribute delete
510 Bytes
def grade(trajectory) -> float:
    """Score an episode by inspecting only its final action.

    OpenEnv graders usually receive the full trajectory of
    (observation, action, reward, state) steps; only the last step's
    action is examined here.

    Args:
        trajectory: Sequence of steps. The last step must expose
            ``.action.action`` with an ``action_type`` attribute and, when
            ``action_type`` is ``"submit_decision"``, a ``decision``
            attribute.

    Returns:
        ``1.0`` if the final action submits the decision ``"CLEAR"``
        (correctly identified the false positive), ``0.1`` if it submits
        any other decision (incorrectly flagged an innocent company), and
        ``0.01`` if no decision was submitted, including when the
        trajectory is empty.
    """
    # An empty trajectory means the agent never acted; score it as a
    # missing submission instead of raising IndexError on trajectory[-1].
    if not trajectory:
        return 0.01

    # We just need to look at the final action.
    final_action = trajectory[-1].action.action

    if final_action.action_type != "submit_decision":
        return 0.01  # Failed to submit a decision

    if final_action.decision == "CLEAR":
        return 1.0  # Correctly identified the False Positive

    return 0.1  # Incorrectly flagged an innocent company