-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathtictactoe.py
183 lines (139 loc) · 3.91 KB
/
tictactoe.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
"""
Tic Tac Toe Player
"""
import math
from copy import deepcopy
# Marks stored in a board cell once a player has moved there.
X, O = "X", "O"
# Value of a board cell that no player has taken yet.
EMPTY = None
def initial_state():
    """
    Returns starting state of the board.

    The board is a 3x3 list of lists in which every cell is EMPTY. Each
    row is a distinct list object, so rows can be modified independently.
    """
    return [[EMPTY] * 3 for _ in range(3)]
def player(board):
    """
    Returns player who has the next turn on a board.

    X moves whenever an even number of cells is occupied (this includes
    the empty board); O moves when the count is odd.
    """
    occupied = non_free_cells(board)
    if occupied % 2:
        return O
    return X
def actions(board):
    """
    Returns set of all possible actions (i, j) available on the board.

    An action is the (row, column) pair of a cell that still holds EMPTY.
    The column count is taken from the first row of the board.
    """
    return {
        (row, col)
        for row in range(len(board))
        for col in range(len(board[0]))
        if board[row][col] is EMPTY
    }
def result(board, action):
    """
    Returns the board that results from making move (i, j) on the board.

    The input board is left untouched: a deep copy is made, the mark of
    the player whose turn it is gets written into cell (i, j) of the copy,
    and the copy is returned.

    Raises:
        IndexError: if (i, j) lies outside the board. Negative indices are
            rejected as well, because Python would otherwise wrap them
            around to the opposite edge and silently accept the move.
        ValueError: if the target cell is already occupied.
    """
    i, j = action
    # Explicit bounds check: plain indexing would accept e.g. (-1, -1).
    if not (0 <= i < len(board) and 0 <= j < len(board[i])):
        raise IndexError("action {!r} is outside the board".format(action))
    if board[i][j] is not EMPTY:
        raise ValueError("cell {!r} is already occupied".format(action))
    new_board = deepcopy(board)
    new_board[i][j] = player(board)
    return new_board
def winner(board):
    """
    Returns the winner of the game, if there is one, or None.

    The eight winning lines are checked in a fixed order: the three rows,
    then the three columns, then the main diagonal and the anti-diagonal.
    The mark of the first line whose three cells are equal and not EMPTY
    is returned.
    """
    size = 3
    rows = [[(r, c) for c in range(size)] for r in range(size)]
    columns = [[(r, c) for r in range(size)] for c in range(size)]
    diagonals = [
        [(k, k) for k in range(size)],
        [(k, size - 1 - k) for k in range(size)],
    ]

    def mark_at(cell):
        return board[cell[0]][cell[1]]

    for first, second, third in rows + columns + diagonals:
        mark = mark_at(first)
        if mark is EMPTY:
            continue
        if mark == mark_at(second) and mark == mark_at(third):
            return mark
    return None
def terminal(board):
    """
    Returns True if game is over, False otherwise.

    The game is over as soon as winner() reports a winner, or when all
    nine cells are occupied.
    """
    return winner(board) is not None or non_free_cells(board) == 9
def utility(board):
    """
    Given a terminal board, returns 1 if X has won the game, -1 if O has won, 0 otherwise.

    Raises:
        ValueError: if the board is not terminal.
    """
    if not terminal(board):
        raise ValueError("utility() is only defined for terminal boards")
    champion = winner(board)
    if champion == X:
        return 1
    if champion == O:
        return -1
    # Explicit fall-through so the function never returns None implicitly.
    return 0
def minimax(board):
    """
    Returns the optimal action for the current player on the board.

    Returns None for a terminal board. Otherwise every available action is
    scored by the opponent's best reply: X picks the action with the
    highest min_value, O the action with the lowest max_value. When
    several actions share the best score, the first one encountered while
    iterating actions(board) is kept. An empty tuple is returned if there
    is no action to choose from.
    """
    if terminal(board):
        return None

    moves = actions(board)
    if player(board) == X:
        # X wants to maximize the value O can hold it to.
        return max(
            moves,
            key=lambda move: min_value(result(board, move)),
            default=(),
        )
    # O wants to minimize the value X can reach.
    return min(
        moves,
        key=lambda move: max_value(result(board, move)),
        default=(),
    )
# Cache of min_value results, keyed by repr(board).
min_value_memo = {}


def min_value(board):
    """
    Current player: O.

    Returns the lowest value O can reach from this board, where each
    candidate move is scored with max_value on the resulting board.
    Terminal boards are scored directly with utility() and are not cached;
    every other result is stored in min_value_memo.
    """
    if terminal(board):
        return utility(board)

    cache_key = repr(board)
    try:
        return min_value_memo[cache_key]
    except KeyError:
        pass

    lowest = min(
        (max_value(result(board, move)) for move in actions(board)),
        default=math.inf,
    )
    min_value_memo[cache_key] = lowest
    return lowest
# Cache of max_value results, keyed by repr(board).
max_value_memo = {}


def max_value(board):
    """
    Current player: X.

    Returns the highest value X can reach from this board, where each
    candidate move is scored with min_value on the resulting board.
    Terminal boards are scored directly with utility() and are not cached;
    every other result is stored in max_value_memo.
    """
    if terminal(board):
        return utility(board)

    cache_key = repr(board)
    try:
        return max_value_memo[cache_key]
    except KeyError:
        pass

    highest = max(
        (min_value(result(board, move)) for move in actions(board)),
        default=-math.inf,
    )
    max_value_memo[cache_key] = highest
    return highest
def non_free_cells(board):
    """
    Returns the quantity of non empty cells on board.

    A cell counts as occupied when it holds anything other than EMPTY.
    The column count is taken from the first row of the board.
    """
    return sum(
        1
        for row in range(len(board))
        for col in range(len(board[0]))
        if board[row][col] is not EMPTY
    )