-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgameState.py
360 lines (305 loc) · 14.1 KB
/
gameState.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
import util
import copy
class GameState():
"""
This class contains information of the state of a Gomoku game.
Normally it is 5 in a row. We extend the game to N in a row.
Parameter:
N: N in a row
boardSize: The board will be boardSize x boardSize
numPlayers: How many total players in this game (including computers)
Instance variables:
N: N in a row
boardSize: The board will be boardSize x boardSize
numPlayers: How many total players in this game (including computers)
board: A dictionary of (position => player index)
gameOver: Whether the game is over or not
winner: The index of the winner, -1 if the game is not over
features: A dictionary of ((agentIndex, description) => number)
Ex. (agentIndex, 'open 3') => 2
(agentIndex, 'blocked 4') => 1
"""
def __init__(self, N, boardSize, numPlayers, prevState = None):
self.N = N
self.boardSize = boardSize
self.numPlayers = numPlayers
if prevState == None:
self.board = {}
self.legalActions = set()
self.currentPlayer = 0
self.gameOver = False
self.winner = -1
self.features = {}
self.positionToFeatures = dict()
self.previousAction = None #(player, action)
else:
self.board = dict(prevState.board)
self.legalActions = set(prevState.legalActions)
self.currentPlayer = prevState.currentPlayer
self.gameOver = prevState.gameOver
self.winner = prevState.winner
self.features = dict(prevState.features)
self.positionToFeatures = copy.deepcopy(prevState.positionToFeatures)
self.previousAction = prevState.previousAction
def getLegalActions(self):
"""
If there are no pieces on the board, legal action is the middle of the board.
Otherwise, the legal actions are the positions around the current pieces
"""
if len(self.board) == 0:
return [((self.boardSize + 1) / 2, (self.boardSize + 1) / 2)]
return list(self.legalActions)
def gameEnded(self):
"""
Return True if game has ended. False otherwise.
"""
return self.gameOver
def getWinner(self):
"""
Returns the winner's number.
If the game is a tie or hasn't ended, return -1
"""
if self.gameOver:
return self.winner
return -1
def moveIsValid(self, playerIndex, move):
"""
Check if a move is valid.
"""
if playerIndex < 0 or playerIndex >= self.numPlayers:
print "Agent index " + str(playerIndex) + " is invalid."
return False
# Out of bounds or that position already has a piece
if not self.withinBounds(move) or move in self.board:
return False
return True
def generateSuccessor(self, player, move):
"""
Make a copy of the current state, and simulate the move, and return that copy.
"""
state = GameState(self.N, self.boardSize, self.numPlayers, prevState = self)
state.previousAction = (player, move)
state.makeMove(player, move)
return state
def makeMove(self, player, move):
"""
Player makes a move.
"""
if not self.moveIsValid(player, move):
return
# Update self.features
self.board[move] = player
self.updateFeaturesForMove(player, move)
if self.checkTie():
self.gameOver = True
self.currentPlayer = (self.currentPlayer + 1) % self.numPlayers
# Update self.legalActions
x, y = move
if move in self.legalActions:
self.legalActions.remove(move)
for i in range(x - 1, x + 1 + 1):
for j in range(y - 1, y + 1 + 1):
if self.withinBounds((i, j)) and (i, j) not in self.board:
self.legalActions.add((i, j))
def getFeatures(self, index):
# Return the features that we need for evaluationFunction
# (not the features in state.features)
result = []
for feature in self.features:
num = self.features[feature]
agentIndex = feature[0]
description = feature[1]
newFeature = (description, num, index == agentIndex, self.currentPlayer == index)
result.append(newFeature)
return result
def __str__(self):
s = ' |'
for i in range(self.boardSize):
if i < 10:
s += ' ' + str(i) + ' |'
else:
s += ' ' + str(i) + '|'
s += "\n" + (4 * (self.boardSize + 1) * "-") +'\n'
for y in range(self.boardSize):
if y < 10:
s += ' ' + str(y) + '|'
else:
s += ' ' + str(y) + '|'
for x in range(self.boardSize):
if (x, y) not in self.board:
s += ' |'
else:
s += ' ' + str(self.board[(x,y)]) + ' |'
s += "\n" + (4 * (self.boardSize + 1) * "-") +'\n'
return s
def withinBounds(self, move):
return move[0] >= 0 and move[0] < self.boardSize and move[1] >= 0 and move[1] < self.boardSize
def checkTie(self):
if len(self.board.keys()) == self.boardSize**2 :
return True
else:
return False
def updateFeaturesForMove(self, player, move):
"""
Update the features when a player makes a move.
There are 4 directions (Horizontal, Vertical, Diagonal /, Diagonal \).
"""
# import pdb; pdb.set_trace();
x, y = move
# print move
# print str(self)
############ Horizontal ############
neighbors1 = self.checkNeighboringRows(move, [(i, y) for i in range(x + 1, self.boardSize + 1)])
# print neighbors1
neighbors2 = self.checkNeighboringRows(move, [(i, y) for i in range(x - 1, -2, -1)])
self.updateFeature(player, move, neighbors1, neighbors2)
############ Vertical ############
neighbors1 = self.checkNeighboringRows(move, [(x, j) for j in range(y + 1, self.boardSize + 1)])
neighbors2 = self.checkNeighboringRows(move, [(x, j) for j in range(y - 1, -2, -1)])
self.updateFeature(player, move, neighbors1, neighbors2)
############ Diagonal / ############
neighbors1 = self.checkNeighboringRows(move, [(x + i, y + i) for i in range(1, self.boardSize + 1)])
neighbors2 = self.checkNeighboringRows(move, [(x - i, y - i) for i in range(1, self.boardSize + 1)])
self.updateFeature(player, move, neighbors1, neighbors2)
############ Diagonal \ ############
neighbors1 = self.checkNeighboringRows(move, [(x + i, y - i) for i in range(1, self.boardSize + 1)])
neighbors2 = self.checkNeighboringRows(move, [(x - i, y + i) for i in range(1, self.boardSize + 1)])
self.updateFeature(player, move, neighbors1, neighbors2)
def checkNeighboringRows(self, move, piecesRange):
"""
Return (player, num in a row, blocked or not)
This logic is complicated...
"""
# Hit boundary (no neighbors)
if len(piecesRange) == 0 or not self.withinBounds(piecesRange[0]):
return (-1, 0, 1, set())
# Open end (no neighbors)
if piecesRange[0] not in self.board:
return (-1, 0, 0, set())
piecesInFeature = set()
player = self.board[piecesRange[0]]
num = 0
blocked = 0
for piece in piecesRange:
if not self.withinBounds(piece) or (piece in self.board and self.board[piece] != player):
blocked = 1
break
if piece not in self.board:
break
# print piece
piecesInFeature.add(piece)
# print piecesInFeature
num += 1
return (player, num, blocked, piecesInFeature)
#Delete an instance of a feature from a set of pieces
def deleteFeatureFromDict(self, dict, featureToDelete, move, setOfPiecesToDeleteFeatureFrom):
for piece in setOfPiecesToDeleteFeatureFrom:
if not piece in self.positionToFeatures:
# self.positionToFeatures[move] = {featureToDelete:set()}
continue
if not featureToDelete in self.positionToFeatures[piece]:
# self.positionToFeatures[move][featureToDelete] = set()
continue
# print piece
self.positionToFeatures[piece][featureToDelete].discard(frozenset(setOfPiecesToDeleteFeatureFrom))
if len(self.positionToFeatures[piece][featureToDelete]) == 0:
del self.positionToFeatures[piece][featureToDelete]
if len(self.positionToFeatures[piece]) == 0:
del self.positionToFeatures[piece]
#Add an instance of a feature for a set of pieces
#The structure of the positionToFeatures is:
#positionToFeatures - Dict of move : Dict(player index,feature) key,value pairs
#Dict(player index, feature) is a dict of (player index, feature) : Set of frozen sets
#The set contains frozen sets, where the frozen sets are the pieces that are in one instance of the feature
#So the overall structure is dict:dict:set:set of (x,y) coordinates
def addPiecesToFeatureInDict(self, dict, move, feature, piecesList):
# print "Adding feature: ", feature, "| For move: ", move, "| Pieces: ", piecesList
for piece in piecesList:
if not piece in self.positionToFeatures:
self.positionToFeatures[piece] = {feature:set()}
if not feature in self.positionToFeatures[piece]:
self.positionToFeatures[piece][feature] = set()
self.positionToFeatures[piece][feature].update([frozenset(piecesList)])
# self.positionToFeatures[move][feature].append(piecesInFeature)
def updateFeature(self, player, move, neighbors1, neighbors2):
"""
Delete/Update the features of the neighbors.
For example, if neighbor is an open 3 from a different player,
then update it to be a blocked 3.
Then, add a new feature according to the given move and its neighbors.
Parameters: neighbors: (playerIndex, num, blocked, piecesInFeature)
"""
if neighbors1[1] == 0 and neighbors2[1] == 0:
return
# Delete/Update the features of the neighbors
for neighbor in [neighbors1, neighbors2]:
num = neighbor[1]
if neighbor[0] == -1:
# no neighbor
continue
if neighbor[0] != player:
# neighbor is a different player, so delete or update the feature
if num >= 2:
if neighbor[2] == 0: # not blocked
featureToDelete = (neighbor[0], 'open ' + str(num))
#Delete feature from
self.deleteFeatureFromDict(self.positionToFeatures, featureToDelete, move, neighbor[3])
util.deleteItemFromDict(self.features, featureToDelete)
featureToAdd = (neighbor[0], 'blocked ' + str(num))
piecesInFeature = neighbor[3]
self.addPiecesToFeatureInDict(self.positionToFeatures, move, featureToAdd, piecesInFeature)
util.addItemToDict(self.features, featureToAdd)
else: # blocked
featureToDelete = (neighbor[0], 'blocked ' + str(num))
self.deleteFeatureFromDict(self.positionToFeatures, featureToDelete, move, neighbor[3])
util.deleteItemFromDict(self.features, featureToDelete)
else:
# neighbor is the same player, so delete the feature
if num >= 2:
if neighbor[2] == 0: # not blocked
featureToDelete = (neighbor[0], 'open ' + str(num))
self.deleteFeatureFromDict(self.positionToFeatures, featureToDelete, move, neighbor[3])
util.deleteItemFromDict(self.features, featureToDelete)
else: # blocked
featureToDelete = (neighbor[0], 'blocked ' + str(num))
self.deleteFeatureFromDict(self.positionToFeatures, featureToDelete, move, neighbor[3])
util.deleteItemFromDict(self.features, featureToDelete)
# Add a new feature according to the given move and its neighbors.
num = 1
blocked = 0
piecesInFeature = set([move])
# import pdb; pdb.set_trace();
# print "Neighbor 1", neighbors1
for neighbor in [neighbors1]:
if neighbor[0] != player:
break
piecesInFeature.update(neighbor[3])
# print "Neighbor 2", neighbors2
for neighbor in [neighbors2]:
if neighbor[0] != player:
break
piecesInFeature.update(neighbor[3])
# print "Move:", move, "| Pieces In Feature", piecesInFeature
for neighbor in [neighbors1, neighbors2]:
if neighbor[0] == -1:
blocked += neighbor[2]
elif neighbor[0] == player:
num += neighbor[1]
blocked += neighbor[2]
else:
blocked += 1
# Game ends if num >= self.N
if num >= self.N:
self.gameOver = True
self.winner = player
s = ''
if blocked >= 2 or num <= 1:
return
if blocked == 0:
s = 'open ' + str(num)
elif blocked == 1:
s = 'blocked ' + str(num)
feature = (player, s)
util.addItemToDict(self.features, feature)
self.addPiecesToFeatureInDict(self.positionToFeatures, move, feature, piecesInFeature)
# print "Pieces in feature with: ", move, self.positionToFeatures[move][feature]