-
Notifications
You must be signed in to change notification settings - Fork 71
/
Copy pathpokertrees.py
396 lines (358 loc) · 19.3 KB
/
pokertrees.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
from itertools import combinations
from itertools import permutations
from itertools import product
from collections import Counter
from hand_evaluator import HandEvaluator
from copy import deepcopy
from functools import partial
# Action codes accepted by ActionNode.valid() / ActionNode.get_child() to
# select the fold, call/check and raise children of an action node.
FOLD = 0
CALL = 1
RAISE = 2
def overlap(t1, t2):
    """Return True if at least one element of t1 is also contained in t2."""
    return any(item in t2 for item in t1)
def all_unique(hc):
    """Return True if no two entries of hc have an element in common.

    hc is a sequence of collections (e.g. one tuple of cards per player);
    every distinct pair of entries is compared with overlap().
    """
    return not any(overlap(first, second) for first, second in combinations(hc, 2))
def default_infoset_format(player, holecards, board, bet_history):
    """Build the default information-set key for a player's view.

    The key is the string form of every hole card, then every board card,
    a colon, the bet history and a trailing colon. The player argument is
    accepted to match the infoset_format call signature but is not used.
    """
    hole_text = "".join(str(card) for card in holecards)
    board_text = "".join(str(card) for card in board)
    return "{0}{1}:{2}:".format(hole_text, board_text, bet_history)
class GameRules(object):
    """Static description of the poker variant a game tree is built from."""

    def __init__(self, players, deck, rounds, ante, blinds, handeval = HandEvaluator.evaluate_hand, infoset_format=default_infoset_format):
        """Validate and store the rules.

        players        -- number of players; must be at least 2.
        deck           -- collection of cards; must contain more than one card.
        rounds         -- non-empty sequence of round descriptions; each one
                          must expose a maxbets sequence with one entry per
                          player.
        ante           -- non-negative amount every player commits up front.
        blinds         -- None, a single number (wrapped into a one-element
                          list) or a sequence of blind amounts.
        handeval       -- callable invoked as handeval(holecards, board) at
                          showdown.
        infoset_format -- callable invoked as
                          infoset_format(player, holecards, board, bet_history).

        Raises AssertionError when any of the constraints above is violated.
        """
        assert(players >= 2)
        assert(ante >= 0)
        assert(rounds is not None)
        assert(deck is not None)
        assert(len(rounds) > 0)
        assert(len(deck) > 1)
        # A bare number is shorthand for a single blind. isinstance (unlike an
        # exact type() comparison) also accepts int/float subclasses; None is
        # not a number and passes through untouched.
        if isinstance(blinds, (int, float)):
            blinds = [blinds]
        for r in rounds:
            assert(len(r.maxbets) == players)
        self.players = players
        self.deck = deck
        self.roundinfo = rounds
        self.ante = ante
        self.blinds = blinds
        self.handeval = handeval
        self.infoset_format = infoset_format
class RoundInfo(object):
    """Settings for a single round of the game."""

    def __init__(self, holecards, boardcards, betsize, maxbets):
        """Store the round parameters unchanged.

        holecards  -- number of hole cards dealt to each active player this
                      round (falsy when none are dealt).
        boardcards -- number of board cards dealt this round (falsy when none).
        betsize    -- amount committed per bet level in this round.
        maxbets    -- per-player maximum bet level for this round.
        """
        self.maxbets = maxbets
        self.betsize = betsize
        self.boardcards = boardcards
        self.holecards = holecards
class GameTree(object):
    """Builds the complete tree of a poker game described by a GameRules object.

    Arguments shared by the build_* / add_*_child / showdown methods:

    root                   -- parent node that newly created nodes attach to
                              (None for the root of the tree).
    players_in             -- list of booleans, one per player; False once
                              that player has folded.
    committed              -- list with the amount each player has put in the
                              pot.
    holes                  -- list indexed by player with that player's hole
                              cards (a tuple).
    board                  -- tuple of board cards dealt so far.
    deck                   -- cards still available to be dealt.
    bet_history            -- string of actions so far: "/" starts a round,
                              "f", "c" and "r" are fold, call and raise.
    round_idx              -- index into rules.roundinfo.
    min_actions_this_round -- number of actions that must occur before the
                              round may end.
    actions_this_round     -- number of actions taken so far this round.
    bets / bets_this_round -- list with each player's bet level this round.

    The lists players_in, committed and bets_this_round are mutated in place
    while a subtree is built and restored afterwards; nodes keep their own
    deep copies.
    """

    def __init__(self, rules):
        """Store a private deep copy of rules; the tree is empty until build()."""
        self.rules = deepcopy(rules)
        # Maps a player_view key to the list of ActionNodes sharing that view.
        self.information_sets = {}
        self.root = None

    def build(self):
        """Build the whole tree and store its root in self.root."""
        # Assume everyone is in
        players_in = [True] * self.rules.players
        # Collect antes
        committed = [self.rules.ante] * self.rules.players
        bets = [0] * self.rules.players
        # Collect blinds
        next_player = self.collect_blinds(committed, bets, 0)
        holes = [()] * self.rules.players
        board = ()
        bet_history = ""
        self.root = self.build_rounds(None, players_in, committed, holes, board, self.rules.deck, bet_history, 0, bets, next_player)

    def collect_blinds(self, committed, bets, next_player):
        """Post the blinds in seat order starting at next_player.

        Updates committed and bets in place and returns the player who acts
        after the last blind. Without blinds, next_player is returned as is.
        """
        if self.rules.blinds is not None:
            for blind in self.rules.blinds:
                committed[next_player] += blind
                # Express the blind as a bet level of the first round.
                bets[next_player] = int((committed[next_player] - self.rules.ante) / self.rules.roundinfo[0].betsize)
                next_player = (next_player + 1) % self.rules.players
        return next_player

    def deal_holecards(self, deck, holecards, players):
        """Return every way to deal `holecards` cards from deck to `players` players.

        Each result is a tuple with one hand (a tuple of cards) per player and
        no card shared between hands. A list is returned so the result can be
        iterated more than once on every Python version.
        """
        hands = combinations(deck, holecards)
        return [deal for deal in permutations(hands, players) if all_unique(deal)]

    def build_rounds(self, root, players_in, committed, holes, board, deck, bet_history, round_idx, bets = None, next_player = 0):
        """Start round round_idx, or go to showdown when no rounds are left.

        Returns the node created for the start of the round (or the terminal
        showdown node).
        """
        if round_idx == len(self.rules.roundinfo):
            return self.showdown(root, players_in, committed, holes, board, deck, bet_history)
        bet_history += "/"
        cur_round = self.rules.roundinfo[round_idx]
        # Skip over players who have already folded.
        while not players_in[next_player]:
            next_player = (next_player + 1) % self.rules.players
        if bets is None:
            bets = [0] * self.rules.players
        min_actions_this_round = players_in.count(True)
        actions_this_round = 0
        if cur_round.holecards:
            return self.build_holecards(root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets)
        if cur_round.boardcards:
            return self.build_boardcards(root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets)
        return self.build_bets(root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets)

    def get_next_player(self, cur_player, players_in):
        """Return the next player after cur_player (wrapping) who has not folded."""
        next_player = (cur_player + 1) % self.rules.players
        while not players_in[next_player]:
            next_player = (next_player + 1) % self.rules.players
        return next_player

    def build_holecards(self, root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets):
        """Create the hole-card chance node with one subtree per possible deal.

        Returns the HolecardChanceNode.
        """
        cur_round = self.rules.roundinfo[round_idx]
        # NOTE(review): the chance node records the full rules deck and an
        # empty bet history rather than the current deck/bet_history; kept as
        # in the original -- confirm whether that is intentional.
        hnode = HolecardChanceNode(root, committed, holes, board, self.rules.deck, "", cur_round.holecards)
        # Deal holecards
        all_hc = self.deal_holecards(deck, cur_round.holecards, players_in.count(True))
        # Create a child node for every possible distribution
        for dealt in all_hc:
            new_cards = iter(dealt)
            cur_holes = []
            for i, hc in enumerate(holes):
                if players_in[i]:
                    # Only deal cards to players who are still in
                    cur_holes.append(hc + next(new_cards))
                else:
                    # Folded players keep their slot so the list stays indexed
                    # by player, as ActionNode and showdown() expect.
                    cur_holes.append(hc)
            dealt_cards = ()
            for hc in cur_holes:
                dealt_cards += hc
            # A real list (not a lazy filter) because the deck is iterated
            # again further down the tree.
            cur_deck = [card for card in deck if card not in dealt_cards]
            if cur_round.boardcards:
                self.build_boardcards(hnode, next_player, players_in, committed, cur_holes, board, cur_deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets)
            else:
                self.build_bets(hnode, next_player, players_in, committed, cur_holes, board, cur_deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets)
        return hnode

    def build_boardcards(self, root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets):
        """Create the board-card chance node with one subtree per possible board.

        Returns the BoardcardChanceNode.
        """
        cur_round = self.rules.roundinfo[round_idx]
        bnode = BoardcardChanceNode(root, committed, holes, board, deck, bet_history, cur_round.boardcards)
        for bc in combinations(deck, cur_round.boardcards):
            cur_board = board + bc
            # A real list (not a lazy filter) because the deck is iterated
            # again further down the tree.
            cur_deck = [card for card in deck if card not in bc]
            self.build_bets(bnode, next_player, players_in, committed, holes, cur_board, cur_deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets)
        return bnode

    def build_bets(self, root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets_this_round):
        """Build the betting subtree in which next_player is to act.

        Returns the node that was attached to root: a terminal node when only
        one player is left, the start of the next round when betting is
        closed, otherwise the new ActionNode.
        """
        # if everyone else folded, end the hand
        if players_in.count(True) == 1:
            return self.showdown(root, players_in, committed, holes, board, deck, bet_history)
        # if everyone checked or the last raisor has been called, end the round
        if actions_this_round >= min_actions_this_round and self.all_called_last_raisor_or_folded(players_in, bets_this_round):
            return self.build_rounds(root, players_in, committed, holes, board, deck, bet_history, round_idx + 1)
        cur_round = self.rules.roundinfo[round_idx]
        anode = ActionNode(root, committed, holes, board, deck, bet_history, next_player, self.rules.infoset_format)
        # add the node to the information set
        self.information_sets.setdefault(anode.player_view, []).append(anode)
        # get the next player to act
        next_player = self.get_next_player(next_player, players_in)
        # add a folding option if someone has bet more than this player
        if committed[anode.player] < max(committed):
            self.add_fold_child(anode, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets_this_round)
        # add a calling/checking option
        self.add_call_child(anode, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets_this_round)
        # add a raising option if this player has not reached their max bet level
        if cur_round.maxbets[anode.player] > max(bets_this_round):
            self.add_raise_child(anode, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets_this_round)
        return anode

    def all_called_last_raisor_or_folded(self, players_in, bets):
        """Return True if every player still in has matched the highest bet level."""
        betlevel = max(bets)
        return not any(still_in and bet < betlevel for still_in, bet in zip(players_in, bets))

    def add_fold_child(self, root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets_this_round):
        """Attach the subtree reached when root.player folds as root.fold_action."""
        players_in[root.player] = False
        bet_history += 'f'
        self.build_bets(root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round + 1, bets_this_round)
        root.fold_action = root.children[-1]
        # Undo the fold so sibling subtrees see the unmodified state.
        players_in[root.player] = True

    def add_call_child(self, root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets_this_round):
        """Attach the subtree reached when root.player calls/checks as root.call_action."""
        player_commit = committed[root.player]
        player_bets = bets_this_round[root.player]
        # Calling matches the largest commitment and bet level at the table.
        committed[root.player] = max(committed)
        bets_this_round[root.player] = max(bets_this_round)
        bet_history += 'c'
        self.build_bets(root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round + 1, bets_this_round)
        root.call_action = root.children[-1]
        # Undo the call so sibling subtrees see the unmodified state.
        committed[root.player] = player_commit
        bets_this_round[root.player] = player_bets

    def add_raise_child(self, root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets_this_round):
        """Attach the subtree reached when root.player raises as root.raise_action."""
        cur_round = self.rules.roundinfo[round_idx]
        prev_betlevel = bets_this_round[root.player]
        prev_commit = committed[root.player]
        # Raising goes one bet level above the current maximum.
        bets_this_round[root.player] = max(bets_this_round) + 1
        committed[root.player] += (bets_this_round[root.player] - prev_betlevel) * cur_round.betsize
        bet_history += 'r'
        self.build_bets(root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round + 1, bets_this_round)
        root.raise_action = root.children[-1]
        # Undo the raise so sibling subtrees see the unmodified state.
        bets_this_round[root.player] = prev_betlevel
        committed[root.player] = prev_commit

    def showdown(self, root, players_in, committed, holes, board, deck, bet_history):
        """Create the terminal node for the end of a hand.

        With a single player left that player wins the pot; otherwise the pot
        is split evenly between the remaining players with the highest
        rules.handeval(holecards, board) score. Each payoff is the player's
        share of the pot minus what they committed.
        """
        if players_in.count(True) == 1:
            winners = [i for i, still_in in enumerate(players_in) if still_in]
        else:
            winners = []
            maxscore = -1
            for i, hc in enumerate(holes):
                # Folded players cannot win, so their hands are not evaluated.
                if not players_in[i]:
                    continue
                s = self.rules.handeval(hc, board)
                if len(winners) == 0 or s > maxscore:
                    maxscore = s
                    winners = [i]
                elif s == maxscore:
                    winners.append(i)
        pot = sum(committed)
        payoff = pot / float(len(winners))
        payoffs = [-x for x in committed]
        for w in winners:
            payoffs[w] += payoff
        return TerminalNode(root, committed, holes, board, deck, bet_history, payoffs, players_in)

    def holecard_distributions(self):
        """Return a list of (holecard combination, probability) pairs."""
        # NOTE(review): self.holecards is never assigned anywhere in this
        # class, so this raises AttributeError unless a caller sets it first.
        # The intended source of the card count is not evident from this
        # file -- confirm before relying on this method.
        x = Counter(combinations(self.rules.deck, self.holecards))
        d = float(sum(x.values()))
        # list() so the result is a reusable sequence on every Python version.
        return list(zip(x.keys(), [y / d for y in x.values()]))
def multi_infoset_format(base_infoset_format, player, holecards, board, bet_history):
    """Apply base_infoset_format to each candidate hand and return the keys as a tuple.

    holecards is an iterable of hands; every hand is formatted with the same
    player, board and bet_history.
    """
    views = (base_infoset_format(player, hand, board, bet_history) for hand in holecards)
    return tuple(views)
class PublicTree(GameTree):
    """Game tree in which hole cards are tracked as sets of possibilities.

    Instead of one subtree per concrete deal, every node stores for each
    player the list of hole-card hands that player could hold. Terminal
    payoffs are dictionaries keyed by a tuple with one hand per player.
    """

    def __init__(self, rules):
        """Copy rules, wrapping infoset_format so it is applied to every candidate hand."""
        GameTree.__init__(self, GameRules(rules.players, rules.deck, rules.roundinfo, rules.ante, rules.blinds, rules.handeval, partial(multi_infoset_format, rules.infoset_format)))

    def build(self):
        """Build the whole tree and store its root in self.root."""
        # Assume everyone is in
        players_in = [True] * self.rules.players
        # Collect antes
        committed = [self.rules.ante] * self.rules.players
        bets = [0] * self.rules.players
        # Collect blinds
        next_player = self.collect_blinds(committed, bets, 0)
        # One independent list per player, each holding the single empty hand
        # (list multiplication would make every player share one list object).
        holes = [[()] for _ in range(self.rules.players)]
        board = ()
        bet_history = ""
        self.root = self.build_rounds(None, players_in, committed, holes, board, self.rules.deck, bet_history, 0, bets, next_player)

    def build_holecards(self, root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets):
        """Create the hole-card chance node and extend every player's candidate hands.

        Returns the HolecardChanceNode.
        """
        cur_round = self.rules.roundinfo[round_idx]
        # NOTE(review): the chance node records the full rules deck and an
        # empty bet history rather than the current deck/bet_history; kept as
        # in the original -- confirm whether that is intentional.
        hnode = HolecardChanceNode(root, committed, holes, board, self.rules.deck, "", cur_round.holecards)
        # Deal holecards
        all_hc = list(combinations(deck, cur_round.holecards))
        updated_holes = []
        for player in range(self.rules.players):
            if not players_in[player]:
                # Only deal to players who are still in the hand
                updated_holes.append(list(holes[player]))
            elif not holes[player]:
                # If this player has no cards, just set their holecards to be the newly dealt ones
                updated_holes.append(list(all_hc))
            else:
                # Filter holecards to valid combinations
                # TODO: Speed this up by removing duplicate holecard combinations
                updated_holes.append([
                    old_hc + new_hc
                    for new_hc in all_hc
                    for old_hc in holes[player]
                    if not overlap(old_hc, new_hc)
                ])
        if cur_round.boardcards:
            self.build_boardcards(hnode, next_player, players_in, committed, updated_holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets)
        else:
            self.build_bets(hnode, next_player, players_in, committed, updated_holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets)
        return hnode

    def build_boardcards(self, root, next_player, players_in, committed, holes, board, deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets):
        """Create the board-card chance node with one subtree per possible board.

        Candidate hands that contain a newly dealt board card are dropped.
        Returns the BoardcardChanceNode.
        """
        cur_round = self.rules.roundinfo[round_idx]
        bnode = BoardcardChanceNode(root, committed, holes, board, deck, bet_history, cur_round.boardcards)
        for bc in combinations(deck, cur_round.boardcards):
            cur_board = board + bc
            # A real list (not a lazy filter) because the deck is iterated
            # again further down the tree.
            cur_deck = [card for card in deck if card not in bc]
            # Filter any holecards that are now impossible
            updated_holes = [
                [hc for hc in holes[player] if not overlap(hc, bc)]
                for player in range(self.rules.players)
            ]
            self.build_bets(bnode, next_player, players_in, committed, updated_holes, cur_board, cur_deck, bet_history, round_idx, min_actions_this_round, actions_this_round, bets)
        return bnode

    def showdown(self, root, players_in, committed, holes, board, deck, bet_history):
        """Create the terminal node with payoffs for every possible hand matchup.

        The node's payoffs map each matchup (a tuple with one hand per player)
        to the list of per-player payoffs.
        """
        # TODO: Speedup
        # - Pre-order list of hands
        pot = sum(committed)
        showdowns_possible = self.showdown_combinations(holes)
        if players_in.count(True) == 1:
            fold_payoffs = [-x for x in committed]
            fold_payoffs[players_in.index(True)] += pot
            # The outcome does not depend on the cards, so every matchup maps
            # to the same (shared) payoff list.
            payoffs = { hands: fold_payoffs for hands in showdowns_possible }
        else:
            # Score each distinct hand of the remaining players once.
            scores = {}
            for i in range(self.rules.players):
                if players_in[i]:
                    for hc in holes[i]:
                        if hc not in scores:
                            scores[hc] = self.rules.handeval(hc, board)
            payoffs = { hands: self.calc_payoffs(hands, scores, players_in, committed, pot) for hands in showdowns_possible }
        return TerminalNode(root, committed, holes, board, deck, bet_history, payoffs, players_in)

    def showdown_combinations(self, holes):
        """Return the list of all hand matchups in which no card appears twice."""
        # Get all the possible holecard matchups for a given showdown.
        # Every card must be unique because two players cannot have the same holecard.
        return [matchup for matchup in product(*holes) if all_unique(matchup)]

    def calc_payoffs(self, hands, scores, players_in, committed, pot):
        """Return the per-player payoffs for one matchup.

        hands holds one hand per player and scores maps a hand to its value.
        The pot is split evenly between the remaining players with the highest
        score; each payoff is the share won minus the amount committed.
        """
        winners = []
        maxscore = -1
        for i, hand in enumerate(hands):
            if players_in[i]:
                s = scores[hand]
                if len(winners) == 0 or s > maxscore:
                    maxscore = s
                    winners = [i]
                elif s == maxscore:
                    winners.append(i)
        payoff = pot / float(len(winners))
        payoffs = [-x for x in committed]
        for w in winners:
            payoffs[w] += payoff
        return payoffs
class Node(object):
    """Base class of all game-tree nodes; stores a snapshot of the game state."""

    def __init__(self, parent, committed, holecards, board, deck, bet_history):
        """Deep-copy the given state and register this node with its parent.

        parent      -- node this one hangs under, or None for the root.
        committed   -- amount each player has put in the pot.
        holecards   -- hole cards per player.
        board       -- board cards dealt so far.
        deck        -- cards still available to deal.
        bet_history -- string of betting actions so far.
        """
        self.committed = deepcopy(committed)
        self.holecards = deepcopy(holecards)
        self.board = deepcopy(board)
        self.deck = deepcopy(deck)
        self.bet_history = deepcopy(bet_history)
        # Always define parent so the root can be recognised by parent is None
        # instead of raising AttributeError.
        self.parent = parent
        if parent is not None:
            parent.add_child(self)

    def add_child(self, child):
        """Append child to this node's children, creating the list if needed."""
        # Subclasses create self.children in their own __init__; nodes that
        # never did (or set it to None) get the list created on first use.
        if getattr(self, "children", None) is None:
            self.children = [child]
        else:
            self.children.append(child)
class TerminalNode(Node):
    """Leaf of the game tree: the hand is over and payoffs are known."""

    def __init__(self, parent, committed, holecards, board, deck, bet_history, payoffs, players_in):
        """Record the final state, the payoffs and a copy of who was still in."""
        super(TerminalNode, self).__init__(parent, committed, holecards, board, deck, bet_history)
        # players_in is copied because the tree builder keeps mutating its list;
        # payoffs is stored by reference.
        self.players_in = deepcopy(players_in)
        self.payoffs = payoffs
class HolecardChanceNode(Node):
    """Chance node at which hole cards are dealt."""

    def __init__(self, parent, committed, holecards, board, deck, bet_history, todeal):
        """Record the state before the deal; todeal is the number of cards to deal."""
        super(HolecardChanceNode, self).__init__(parent, committed, holecards, board, deck, bet_history)
        # Children are appended by Node.add_child as the subtrees are built.
        self.children = []
        self.todeal = todeal
class BoardcardChanceNode(Node):
    """Chance node at which board cards are dealt."""

    def __init__(self, parent, committed, holecards, board, deck, bet_history, todeal):
        """Record the state before the deal; todeal is the number of cards to deal."""
        super(BoardcardChanceNode, self).__init__(parent, committed, holecards, board, deck, bet_history)
        # Children are appended by Node.add_child as the subtrees are built.
        self.children = []
        self.todeal = todeal
class ActionNode(Node):
    """Decision node at which one player folds, calls/checks or raises."""

    def __init__(self, parent, committed, holecards, board, deck, bet_history, player, infoset_format):
        """Record the state and compute the acting player's view of it.

        player         -- index of the player to act.
        infoset_format -- callable producing the information-set key from
                          (player, that player's hole cards, board, bet_history).
        """
        super(ActionNode, self).__init__(parent, committed, holecards, board, deck, bet_history)
        self.player = player
        self.children = []
        # Filled in by the tree builder for the actions that are available.
        self.raise_action = self.call_action = self.fold_action = None
        self.player_view = infoset_format(player, holecards[player], board, bet_history)

    def valid(self, action):
        """Return the child reached by action, or None if it is unavailable.

        Raises Exception when action is not FOLD, CALL or RAISE.
        """
        options = (
            (FOLD, self.fold_action),
            (CALL, self.call_action),
            (RAISE, self.raise_action),
        )
        for code, child in options:
            if action == code:
                return child
        raise Exception("Unknown action {0}. Action must be FOLD, CALL, or RAISE".format(action))

    def get_child(self, action):
        """Return the child reached by action; same contract as valid()."""
        return self.valid(action)