File size: 7,730 Bytes
eb34cec
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
import streamlit as st
import numpy as np

import Arena

from MCTS import MCTS

from no_one.NoOneGame import NoOneGame


from no_one.pytorch.NNet import NNetWrapper as NNet
from utils import *

import time


square_content = {
    -1: "❌",
    +0: "·",
    +1: "⭕"
}

players = [{"name": "❌"}, {"name": "⭕"}]
player_types = [":rainbow[AI]", "Human"]
ai_ranks = ["Super", "First Blood", "Random"]
ai_models = {
    "Super": "super.pth.tar",
    "First Blood": "firstBlood.pth.tar",
    "Random": "random.pth.tar",
}

game = NoOneGame(4)

def check_clicked(i, j):
    if st.session_state.clicked == (i, j):
        return True
    return False

class HumanPlayer:
    def __init__(self, game):
        self.game = game
    def encode(self, src, target):
        row, col = src[0] - target[0], src[1] - target[1]
        if (row, col) == (0, -1):
            d = 1
        elif (row, col) == (0, 1):
            d = 3
        elif (row, col) == (-1, 0):
            d = 0
        elif (row, col) == (1, 0):
            d = 2
        else:
            return None
        return self.game.encodeAction(src, d)
    def play(self, board, player, src, target):
        action = self.encode(src, target)
        if action is None:
            return None
        valids = self.game.getValidMoves(board, player)
        if valids[action] != 1:
            return None
        return action


def ai_player(ai_model):
    n1 = NNet(game)
    n1.load_checkpoint('./models/', ai_models[ai_model])
    args1 = dotdict({'numMCTSSims': 50, 'cpuct':1.0})
    msts1 = MCTS(game, n1, args1)
    return lambda x: np.argmax(msts1.getActionProb(x, temp=0))


def human_step(i, j):
    if st.session_state.clicked is None:
        if st.session_state.board[i, j] != st.session_state.player:
            st.toast('Invalid move!')
            return
        st.session_state.clicked = (i, j)
        return
    elif st.session_state.clicked == (i, j):
        # selection canceled
        st.session_state.clicked = None
        return
    elif st.session_state.board[i, j] == st.session_state.player:
        st.session_state.clicked = (i, j)
        return
    else:
        # move
        player = st.session_state.players[st.session_state.player + 1]
        action = player.play(st.session_state.board, st.session_state.player, st.session_state.clicked, (i, j))
        if action is None:
            st.toast('Invalid move!')
            return
        move(action)
        st.session_state.clicked = None


def ai_step():
    p = st.session_state.player
    action = st.session_state.players[p+1](game.getCanonicalForm(st.session_state.board, st.session_state.player))
    # st.session_state.board, st.session_state.player = game.getNextState(
    #     st.session_state.board, p, action,
    # )
    move(action)


def move(action):
    p = st.session_state.player
    st.session_state.board, st.session_state.player = game.getNextState(
        st.session_state.board, p, action,
    )

    res = game.getGameEnded(st.session_state.board, p)
    if res != 0:
        st.session_state.winner = res*p
        st.session_state.win[res*p] += 1
        st.balloons()

def reinit():
    st.session_state.reinit = True

def init(post_init=False):
    st.session_state.reinit = False
    if not post_init:
        st.session_state.win = {-1: 0, 1: 0}

    st.session_state.board = game.getInitBoard()
    st.session_state.player = -1
    st.session_state.players = [None for i in range(2)]
    for i, setting in enumerate(st.session_state.player_settings):
        if setting["pt"] == player_types[1]:
            st.session_state.players[i] = HumanPlayer(game)
        else:
            st.session_state.players[i] = ai_player(setting["ai_model"])
    st.session_state.players.insert(1, None)

    st.session_state.winner = None
    st.session_state.clicked = None


def player_to_index(p):
    if p == -1:
        return 0
    elif p == 1:
        return 1


def main():
    if "player_settings" not in st.session_state:
        st.session_state.player_settings = [
            {"pt": player_types[1], "ai_model": ai_ranks[0]},
            {"pt": player_types[0], "ai_model": ai_ranks[1]},
        ]
    if "reinit" not in st.session_state:
        st.session_state.reinit = False

    fire, settings = st.columns([1, 2])
    fire.button('New Game', on_click=init, args=(True,))
    with settings.expander(
        'Settings',
        expanded=False,
    ):
        st.warning('Any setting changing will restart the game immediately', icon="⚠️")
        for i, p in enumerate(st.columns([0.5, 0.5])):
            with p:
                # players[i]
                st.session_state.player_settings[i]["pt"] = st.radio(
                    f"Who will play %s" % players[i]["name"],
                    player_types,
                    key=f"xp_type_{i}",
                    horizontal=True,
                    index=player_types.index(st.session_state.player_settings[i]["pt"]),
                    on_change=reinit,
                )
                if st.session_state.player_settings[i]["pt"] == player_types[0]:
                    st.session_state.player_settings[i]["ai_model"] = st.radio(
                        "AI rank",
                        ai_ranks,
                        key=f"xp_rank_{i}",
                        index=ai_ranks.index(st.session_state.player_settings[i]["ai_model"]),
                        on_change=reinit,
                    )
        
        st.divider()
        st.checkbox("Show me how to play", key="show_how_to_play")


    if "board" not in st.session_state or st.session_state.reinit:
        init()

    if st.session_state.show_how_to_play:
        with st.sidebar:
            st.title("How to play")
            how_to = '''1. 游戏的目标是吃掉对方的棋子
  开局双方各有四枚棋子,被吃剩一枚棋子即可判负
2. 棋子可以向上下左右移动到空白位置
3. 如何吃子
    1. 移动后的棋子需要跟本方其他某个棋子,在水平方向,或者垂直方向上连住
    2. 如果连住后的棋子两端有对方一个棋子,那么这个对方的棋子就被吃掉
    3. 如果对方也有两颗棋子,则互相不吃
4. 如果落子在对方连起来的两枚棋子一端,也不会被吃
5. 如果选择 AI vs AI,需要手动点击比分下面的回合按钮,触发下一次落子
'''
            st.markdown(how_to)
    

    xp, score, op = st.columns([2, 8, 2])
    for i, p in enumerate([xp, op]):
        p.title(players[i]["name"], anchor=False)
        caption = st.session_state.player_settings[i]["pt"]
        if st.session_state.player_settings[i]["pt"] == player_types[0]:
            caption = st.session_state.player_settings[i]["ai_model"] + " " + caption
        p.caption(caption)

    # st.session_state

    if st.session_state.player_settings[player_to_index(st.session_state.player)]['pt'] != "Human" and st.session_state.winner is None:
        ai_step()

    st.divider()

    for i, row in enumerate(st.session_state.board):
        cols = st.columns([5, 1, 1, 1, 1, 5])
        for j, field in enumerate(row):
            cols[j + 1].button(
                square_content[field],
                key=f"{i}-{j}",
                type=f'{"primary" if check_clicked(i, j) else "secondary"}',
                on_click=human_step,
                args=(i, j),
            )

    s = score.columns([2, 2, 2])
    s[1].title(f'{st.session_state.win[-1]} : {st.session_state.win[1]}', anchor=False)
    s[1].button(
        f'{"❌" if st.session_state.player == -1 else "⭕"}\'s turn'
        if not st.session_state.winner
        else f'🏁 Game finished'
    )



if __name__ == '__main__':
    main()