-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathhog.py
534 lines (432 loc) · 16 KB
/
hog.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
"""The Game of Hog."""
from dice import four_sided, six_sided, make_test_dice
from ucb import main, trace, log_current_line, interact
GOAL_SCORE = 100 # The goal of Hog is to score 100 points.
######################
# Phase 1: Simulator #
######################
def roll_dice(num_rolls, dice=six_sided):
"""Roll DICE for NUM_ROLLS times. Return either the sum of the outcomes,
or 1 if a 1 is rolled (Pig out). This calls DICE exactly NUM_ROLLS times.
num_rolls: The number of dice rolls that will be made; at least 1.
dice: A zero-argument function that returns an integer outcome.
"""
# These assert statements ensure that num_rolls is a positive integer.
assert type(num_rolls) == int, 'num_rolls must be an integer.'
assert num_rolls > 0, 'Must roll at least once.'
"*** YOUR CODE HERE ***"
total=0
sensor=False
while num_rolls>0:
a=dice()
if a!=1:
total=total+a
num_rolls=num_rolls-1
else:
sensor=True
num_rolls=num_rolls-1
if sensor==True:
return 1
else:
return total
def take_turn(num_rolls, opponent_score, dice=six_sided):
"""Simulate a turn rolling NUM_ROLLS dice, which may be 0 (Free bacon).
num_rolls: The number of dice rolls that will be made.
opponent_score: The total score of the opponent.
dice: A function of no args that returns an integer outcome.
"""
assert type(num_rolls) == int, 'num_rolls must be an integer.'
assert num_rolls >= 0, 'Cannot roll a negative number of dice.'
assert num_rolls <= 10, 'Cannot roll more than 10 dice.'
assert opponent_score < 100, 'The game should be over.'
"*** YOUR CODE HERE ***"
score=0
sensor=False
if num_rolls==0:
if opponent_score>=10:
score=score+abs(opponent_score//10-opponent_score%10)+1
else:
score=score+(1+opponent_score)
return score
elif num_rolls>0:
while num_rolls>0:
a=dice()
if a!=1:
score=score+a
num_rolls=num_rolls-1
else:
sensor=True
num_rolls=num_rolls-1
if sensor==True:
return 1
else:
return score
def select_dice(score, opponent_score):
"""Select six-sided dice unless the sum of SCORE and OPPONENT_SCORE is a
multiple of 7, in which case select four-sided dice (Hog wild).
"""
"*** YOUR CODE HERE ***"
if (score+opponent_score)%7==0:
return four_sided
else:
return six_sided
def bid_for_start(bid0, bid1, goal=GOAL_SCORE):
"""Given the bids BID0 and BID1 of each player, returns three values:
- the starting score of player 0
- the starting score of player 1
- the number of the player who rolls first (0 or 1)
"""
assert bid0 >= 0 and bid1 >= 0, "Bids should be non-negative!"
assert type(bid0) == int and type(bid1) == int, "Bids should be integers!"
# The buggy code is below:
if bid0 == bid1:
return goal,goal,0
elif bid0 == bid1 + 5:
return 10, 0, 0
elif bid1 == bid0 + 5:
return 0, 10, 1
elif bid1 > bid0:
return bid1, bid0, 1
else:
return bid1, bid0, 0
def other(who):
"""Return the other player, for a player WHO numbered 0 or 1.
>>> other(0)
1
>>> other(1)
0
"""
return 1 - who
def play(strategy0, strategy1, score0=0, score1=0, goal=GOAL_SCORE):
"""Simulate a game and return the final scores of both players, with
Player 0's score first, and Player 1's score second.
A strategy is a function that takes two total scores as arguments
(the current player's score, and the opponent's score), and returns a
number of dice that the current player will roll this turn.
strategy0: The strategy function for Player 0, who plays first
strategy1: The strategy function for Player 1, who plays second
score0 : The starting score for Player 0
score1 : The starting score for Player 1
"""
who = 0 # Which player is about to take a turn, 0 (first) or 1 (second)
"*** YOUR CODE HERE ***"
while score0<100 and score1<100:
if who==0:
score_this_round=take_turn(strategy0(score0,score1),score1,select_dice(score0,score1))
score0=score0+score_this_round
who=other(who)
elif who==1:
score_this_round=take_turn(strategy1(score1,score0),score0,select_dice(score0,score1))
score1=score1+score_this_round
who=other(who)
score0,score1=swine_swap(score0,score1)
return score0, score1 # You may want to change this line.
#######################
# Phase 2: Strategies #
#######################
def always_roll(n):
"""Return a strategy that always rolls N dice.
A strategy is a function that takes two total scores as arguments
(the current player's score, and the opponent's score), and returns a
number of dice that the current player will roll this turn.
>>> strategy = always_roll(5)
>>> strategy(0, 0)
5
>>> strategy(99, 99)
5
"""
def strategy(score, opponent_score):
return n
return strategy
# Experiments
def make_averaged(fn, num_samples=10000):
"""Return a function that returns the average_value of FN when called.
To implement this function, you will have to use *args syntax, a new Python
feature introduced in this project. See the project description.
>>> dice = make_test_dice(3, 1, 5, 6)
>>> averaged_dice = make_averaged(dice, 1000)
>>> averaged_dice()
3.75
>>> make_averaged(roll_dice, 1000)(2, dice)
6.0
In this last example, two different turn scenarios are averaged.
- In the first, the player rolls a 3 then a 1, receiving a score of 1.
- In the other, the player rolls a 5 and 6, scoring 11.
Thus, the average value is 6.0.
"""
"*** YOUR CODE HERE ***"
def average_value(*args):
total=0
n=num_samples
while n>0:
result=fn(*args)
total=total+result
n=n-1
return total/num_samples
return average_value
def max_scoring_num_rolls(dice=six_sided):
"""Return the number of dice (1 to 10) that gives the highest average turn
score by calling roll_dice with the provided DICE. Assume that dice always
return positive outcomes.
>>> dice = make_test_dice(3)
>>> max_scoring_num_rolls(dice)
10
"""
"*** YOUR CODE HERE ***"
n=1
average=0
average_score=0
while n<=10:
average_score=make_averaged(roll_dice,10000)(n,dice)
if average_score>average:
average=average_score
n=n+1
else:
n=n+1
n=1
while n<=10:
average_score=make_averaged(roll_dice,10000)(n,dice)
if average_score==average:
return n
else:
n=n+1
def winner(strategy0, strategy1):
"""Return 0 if strategy0 wins against strategy1, and 1 otherwise."""
score0, score1 = play(strategy0, strategy1)
if score0 > score1:
return 0
else:
return 1
def average_win_rate(strategy, baseline=always_roll(5)):
"""Return the average win rate (0 to 1) of STRATEGY against BASELINE."""
win_rate_as_player_0 = 1 - make_averaged(winner)(strategy, baseline)
win_rate_as_player_1 = make_averaged(winner)(baseline, strategy)
return (win_rate_as_player_0 + win_rate_as_player_1) / 2 # Average results
def run_experiments():
"""Run a series of strategy experiments and report results."""
if False: # Change to False when done finding max_scoring_num_rolls
six_sided_max = max_scoring_num_rolls(six_sided)
print('Max scoring num rolls for six-sided dice:', six_sided_max)
four_sided_max = max_scoring_num_rolls(four_sided)
print('Max scoring num rolls for four-sided dice:', four_sided_max)
if False: # Change to True to test always_roll(8)
print('always_roll(8) win rate:', average_win_rate(always_roll(8)))
if False: # Change to True to test bacon_strategy
print('bacon_strategy win rate:', average_win_rate(bacon_strategy))
if False: # Change to True to test swap_strategy
print('swap_strategy win rate:', average_win_rate(swap_strategy))
if True: # Change to True to test final_strategy
print('final_strategy win rate:', average_win_rate(final_strategy))
if False:
print('baseline always_roll(5) win rate:', average_win_rate(always_roll(5)))
"*** You may add additional experiments as you wish ***"
if False:
print('always_roll(6) win rate:',average_win_rate(always_roll(6)))
if False:
print('always_roll(3) win rate:',average_win_rate(always_roll(3)))
if False:
print('always_roll(4) win rate:',average_win_rate(always_roll(4)))
if False:
print('always_roll(7) win rate:',average_win_rate(always_roll(7)))
if False:
print('always_roll(9) win rate:',average_win_rate(always_roll(9)))
# Strategies
def bacon_strategy(score, opponent_score, margin=8, num_rolls=5):
"""This strategy rolls 0 dice if that gives at least MARGIN points,
and rolls NUM_ROLLS otherwise.
"""
"*** YOUR CODE HERE ***"
score_difference=0
if opponent_score>=10:
score_difference=abs(opponent_score//10-opponent_score%10)+1
else:
score_difference=1+opponent_score
if score_difference>=margin:
return 0
else:
return num_rolls
def swap_strategy(score, opponent_score, margin=8, num_rolls=5):
"""This strategy rolls 0 dice when it would result in a beneficial swap and
rolls NUM_ROLLS if it would result in a harmful swap. It also rolls
0 dice if that gives at least MARGIN points and rolls
NUM_ROLLS otherwise.
"""
"*** YOUR CODE HERE ***"
score_difference=0
if opponent_score>=10:
score_difference=abs(opponent_score//10-opponent_score%10)+1
else:
score_difference=1+opponent_score
if (score+score_difference)==opponent_score/2:
return 0
elif(score+score_difference)==opponent_score*2:
return num_rolls
elif score_difference>=margin:
return 0
else:
return num_rolls
def final_strategy(score, opponent_score):
"""Write a brief description of your final strategy.
1. if your score is less than your opponent's score, you want to play boldly.
Therefore you play swap_strategy and you roll more dices
2. if your score is more than your opponent_score,you want to play safe.
So play bacon_strategy and roll less dices
3. In the beginning of each roll, see if you can make your opponent play with
a four-sided dice. If so, call hog wild
4. If your_score is higher than 70, decreases the number of dices you roll to
play safe
5. You play more dices with a six_sided dice and less with a four_sided dice
*** YOUR DESCRIPTION HERE ***
"""
"*** YOUR CODE HERE ***"
if score<opponent_score and score<70:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return swap_strategy(score,opponent_score,9,5)
elif n==six_sided:
return swap_strategy(score,opponent_score,9,7)
elif score<opponent_score and score<90:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return bacon_strategy(score,opponent_score,9,4)
elif n==six_sided:
return bacon_strategy(score,opponent_score,9,5)
elif score<opponent_score and score>=90:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return bacon_strategy(score,opponent_score,8,2)
elif n==six_sided:
return bacon_strategy(score,opponent_score,8,3)
elif score>opponent_score and score<70:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return bacon_strategy(score,opponent_score,9,4)
elif n==six_sided:
return bacon_strategy(score,opponent_score,9,6)
elif score>opponent_score and score<90:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return bacon_strategy(score,opponent_score,8,3)
elif n==six_sided:
return bacon_strategy(score,opponent_score,8,4)
elif score>opponent_score and score>=90:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return bacon_strategy(score,opponent_score,8,2)
elif n==six_sided:
return bacon_strategy(score,opponent_score,8,3)
elif score==opponent_score and score<50:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return bacon_strategy(score,opponent_score,9,3)
elif n==six_sided:
return bacon_strategy(score,opponent_score,9,5)
elif score==opponent_score and score<70:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return bacon_strategy(score,opponent_score,9,3)
elif n==six_sided:
return bacon_strategy(score,opponent_score,9,4)
elif score==opponent_score and score<90:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return bacon_strategy(score,opponent_score,9,2)
elif n==six_sided:
return bacon_strategy(score,opponent_score,9,3)
elif score==opponent_score and score>=90:
a=hog_wild(score,opponent_score)
if a==0:
return a
else:
pass
n=select_dice(score,opponent_score)
if n==four_sided:
return bacon_strategy(score,opponent_score,8,2)
elif n==six_sided:
return bacon_strategy(score,opponent_score,8,3)
final_bid=0
def swine_swap(your_score, opponent_score):
if your_score==2*opponent_score:
store=opponent_score
opponent_score=your_score
your_score=store
return your_score, opponent_score
elif opponent_score==2*your_score:
store=opponent_score
opponent_score=your_score
your_score=store
return your_score, opponent_score
else:
return your_score, opponent_score
def hog_wild(score,opponent_score,num_rolls=5,margin=8):
difference=0
if opponent_score>=10:
score_difference=abs(opponent_score//10-opponent_score%10)+1
else:
score_difference=1+opponent_score
if (score+score_difference+opponent_score)%7==0 and score_difference>=margin:
return 0
else:
return num_rolls
##########################
# Command Line Interface #
##########################
# Note: Functions in this section do not need to be changed. They use features
# of Python not yet covered in the course.
@main
def run(*args):
"""Read in the command-line argument and calls corresponding functions.
This function uses Python syntax/techniques not yet covered in this course.
"""
import argparse
parser = argparse.ArgumentParser(description="Play Hog")
parser.add_argument('--run_experiments', '-r', action='store_true',
help='Runs strategy experiments')
args = parser.parse_args()
if args.run_experiments:
run_experiments()