Spaces:
Sleeping
Sleeping
| Q = {} | |
| actions = ["important", "spam", "normal"] | |
| def get_action(state): | |
| if state not in Q: | |
| Q[state] = {a: 0 for a in actions} | |
| return max(Q[state], key=Q[state].get) | |
| def update_q(state, action, reward): | |
| if state not in Q: | |
| Q[state] = {a: 0 for a in actions} | |
| Q[state][action] += reward |