forked from sandiegocsp/prisoners
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathprisoners_dilemma.py
382 lines (350 loc) · 15.8 KB
/
prisoners_dilemma.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
from __future__ import print_function
#####
# Computer Science and Software Engineering
# PLTW AP CS Principles
# (c)2014 Project Lead The Way, Inc.
#
# Activity 1.3.9 Tools for Collaboration
# Project 1.3.10 Collaborating on a Project
#
# To run a tournament, execute this file.
# Place each team's strategy in a file in the same directory as this file.
# Tournament results saved to tournament.txt in this directory.
#
# prisoners_dilemma.py automates competition among different strategies
# for the Iterative Prisoners Dilemma, the canonical game of game-theory.
# Each strategy is pitted against each other strategy for 100 to 200 rounds.
# The results of all previous rounds within a 100-200 round stretch are known
# to both players.
#
# play_tournament([team0, team1, team2]) executes a tournament and writes to tournament.txt
#
# Each team's strategy should be coded in their assigned Python file, called a module.
# Each player should have their own .py file containing
# three strings team_name, strategy_name, and strategy_description
# and a function move(my_history, their_history, my_score, their_score)
#
# By default, when executing this file, [example0, example1, example2, example3]
# play a tournament. To run the tournament of [team, team1, team1, example1]:
# scores, moves, reports = main_play([team1]*3+[example1])
# section0, section1, section2, section3 = reports
#######
import random
import os.path
import example0, example1, example2, example3
import example4, example5, example6, example7
import team0, team1, team2, team3, team4
import team5, team6, team7, team8, team9
import team10, team11, team12, team13, team14
betray = example1
collude = example0
modules = [example0, example1, example2, example3, example4, example5, example6, example7,
team0, team1, team2, team3, team4, team5, team6, team7, team8, team9, team10,
team11, team12, team13, team14]
for module in modules:
reload(module)
print ('reloaded',module)
for required_variable in ['team_name', 'strategy_name', 'strategy_description']:
if not hasattr(module, required_variable):
setattr(module, required_variable, 'missing assignment')
def main_play(modules):
'''main_play plays a tournament and outputs results to screen and file.
This function is called once when this file is executed.
modules: a list of modules such as [team1, team2]
Returns:
scores:
moves:
sections: a list of [str, str, str, list of str]
'''
scores, moves = play_tournament(modules)
section0, section1, section2, section3 = make_reports(modules, scores, moves)
code = make_code_string(modules)
# On screen, include the first three out of four sections of the report.
print(section0+section1+section2)
# To file output, store all teams' code and all teams' section 3 reports.
post_to_file(section0+section1+section2 + code + ''.join(section3))
return scores, moves, [section0, section1, section2, section3]
def play_tournament(modules):
'''Each argument is a module name
Each module must contain
team_name: a string
strategy_name: a string
strategy_description: a string
move: A function that returns 'c' or 'b'
'''
zeros_list = [0]*len(modules) # to initialize each player's head-to-head scores
scores = [zeros_list[:] for module in modules] # Copy it or it's only 1 list
moves = [zeros_list[:] for module in modules] # Copy it or it's only 1 list
for first_team_index in range(len(modules)):
for second_team_index in range(first_team_index):
player1 = modules[first_team_index]
player2 = modules[second_team_index]
score1, score2, moves1, moves2 = play_iterative_rounds(player1, player2)
capitalize(moves1, moves2)
scores[first_team_index][second_team_index] = score1/len(moves1) # int division not an issue
moves[first_team_index][second_team_index] = moves1
# Redundant, but record this for the other player, from their perspective
scores[second_team_index][first_team_index] = score2/len(moves2)
moves[second_team_index][first_team_index] = moves2
# Playing yourself doesn't do anything
scores[first_team_index][first_team_index] = 0
moves[first_team_index][first_team_index] = ''
return scores, moves
def play_iterative_rounds(player1, player2):
'''
Plays a random number of rounds (between 100 and 200 rounds)
of the iterative prisoners' dilemma between two strategies.
player1 and player2 are modules.
Returns 4-tuple, for example ('cc', 'bb', -200, 600)
but with much longer strings
'''
number_of_rounds = random.randint(100, 200)
moves1 = ''
moves2 = ''
score1 = 0
score2 = 0
for round in range(number_of_rounds):
score1, score2, moves1, moves2 = play_round(player1, player2, score1, score2, moves1, moves2)
return (score1, score2, moves1, moves2)
def play_round(player1, player2, score1, score2, moves1, moves2):
'''
Calls the move() function from each module which return
'c' or 'b' for collude or betray for each player.
The history is provided in a string, e.g. 'ccb' indicates the player
colluded in the first two rounds and betrayed in the most recent round.
Returns a 2-tuple with score1 and score2 incremented by this round
'''
RELEASE = 0 # (R, "reward" in literature) when both players collude
TREAT = 100 # (T, "temptation" in literature) when you betray your partner
SEVERE_PUNISHMENT = -500 # (S, "sucker" in literature) when your partner betrays you
PUNISHMENT = -250 # (P) when both players betray each other
# Keep T > R > P > S to be a Prisoner's Dilemma
# Keep 2R > T + S to be an Iterative Prisoner's Dilemma
ERROR = -250
# Get the two players' actions and remember them.
action1 = player1.move(moves1, moves2, score1, score2)
action2 = player2.move(moves2, moves1, score2, score1)
if (type(action1) != str) or (len(action1) != 1):
action1=' '
if (type(action2) != str) or (len(action2) != 1):
action2=' '
# Change scores based upon player actions.
actions = action1 + action2
if actions == 'cc':
# Both players collude; get reward.
score1 += RELEASE
score2 += RELEASE
elif actions == 'cb':
# Player 1 colludes, player 2 betrays; get severe, treat.
score1 += SEVERE_PUNISHMENT
score2 += TREAT
elif actions == 'bc':
# Player 1 betrays, player 2 colludes; get treat, severe.
score1 += TREAT
score2 += SEVERE_PUNISHMENT
elif actions == 'bb':
# Both players betray; get punishment.
score1 += PUNISHMENT
score2 += PUNISHMENT
else:
# Both players get the "error score" if someone's code returns an improper action.
score1 += ERROR
score2 += ERROR
# Append the actions to the previous histories.
if action1 in 'bc':
moves1 += action1
else:
moves1 += ' '
if action2 in 'bc':
moves2 += action2
else:
moves2 += ' '
# Return scores incremented by this round's results.
return (score1, score2, moves1, moves2)
def make_reports(modules, scores, moves):
section0 = make_section0(modules, scores)
section1 = make_section1(modules, scores)
section2 = make_section2(modules, scores)
section3 = []
for index in range(len(modules)):
section3.append(make_section3(modules, moves, scores, index))
return section0, section1, section2, section3
def make_section0(modules, scores):
'''
Produce the following string:
----------------------------------------------------------------------------
Section 0 - Line up
----------------------------------------------------------------------------
Player 0 (P0): Team name 0, Strategy name 0,
Strategy 0 description
Player 1 (P1): Team name 1, Strategy name 1,
Strategy 1 description
'''
section0 = '-'*80+'\n'
section0 += 'Section 0 - Line up\n'
section0 += '-'*80+'\n'
for index in range(len(modules)):
section0 += 'Player ' + str(index) + ' (P' + str(index) + '): '
section0 += str(modules[index].team_name) + ', ' + str(modules[index].strategy_name) + '\n'
strategy_description = str(modules[index].strategy_description)
# Format with 8 space indent 80 char wide
while len(strategy_description) > 1:
newline = strategy_description[:72].find('\n')
if newline> -1:
section0 += ' '*8 + strategy_description[:newline+1]
strategy_description = strategy_description[newline+1:]
else:
section0 += ' '*8 + strategy_description[:72] + '\n'
strategy_description = strategy_description[72:]
return section0
def make_section1(modules, scores):
'''
----------------------------------------------------------------------------
Section 1 - Player vs. Player
----------------------------------------------------------------------------
A column shows pts/round earned against each other player:
P0 P1
vs. P0 : 0 100
vs. P1 : -500 0
TOTAL : -500 100
'''
# First line
section1 = '-'*80+'\nSection 1 - Player vs. Player\n'+'-'*80+'\n'
section1 += 'Each column shows pts/round earned against each other player:\n'
# Second line
section1 += ' '
for i in range(len(modules)):
section1 += '{:>7}'.format('P'+str(i))
section1 += '\n'
# Add one line per team
for index in range(len(modules)):
section1 += 'vs. P' + str(index) + ' :'
for i in range(len(modules)):
section1 += '{:>7}'.format(scores[i][index])
section1 += '\n'
# Last line
section1 += 'TOTAL :'
for index in range(len(modules)):
section1 += '{:>7}'.format(sum(scores[index]))
return section1+'\n'
def make_section2(modules, scores):
'''
----------------------------------------------------------------------------
Section 2 - Leaderboard
----------------------------------------------------------------------------
Average points per round:
Team name (P#): Score with strategy name
Champ10nz (P0): 100 points with Loyal
Rockettes (P1): -500 points with Backstabber
'''
section2 = '-'*80+'\nSection 2 - Leaderboard\n'+'-'*80+'\n'
section2 += 'Average points per round:\n'
section2 += 'Team name (P#): Score with strategy name\n'
# Make a list of teams' 4-tuples
section2_list = []
for index in range(len(modules)):
section2_list.append((modules[index].team_name,
'P'+str(index),
str(sum(scores[index])/len(modules)),
str(modules[index].strategy_name)))
section2_list.sort(key=lambda x: int(x[2]), reverse=True)
# Generate one string per team
# Rockettes (P1): -500 points with Backstabber
for team in section2_list:
team_name, Pn, n_points, strategy_name = team
section2 += '{:<10}({}): {:>10} points with {:<40}\n'.format(team_name[:10], Pn, n_points, strategy_name[:40])
return section2
def make_section3(modules, moves, scores, index):
'''Return a string with information for the player at index, like:
----------------------------------------------------------------------------
Section 3 - Game Data for Team Colloid c=-500 b=-250 C=0 B=+100
----------------------------------------------------------------------------
-133 pt/round: Colloid (P6) "Collude every 3rd round"
-233 pt/round: 2PwnU (P8) "Betray, then alternate"
bBcBbCbBcBbCbBcBbCbBcBbCbBcBbCbBcBbCbBcBbCbBcBbCbBcBbCbBcBbCbBcBbCbBcBbCbBcB
bcBcbCbcbcbCBcbcbCBcbcbCBcbcbCBcbcbCBcbcbCBcbcbCBcbcbCBcbcbCBcbcbCBcbcbCBcbc
'''
section3 = '-'*80+'\nSection 3 - Game Data for Team '
section3 += modules[index].team_name + '\n'
section3 += '-'*80+'\n'
# Make 4 lines per opponent
for opponent_index in range(len(modules)):
if opponent_index != index:
# Line 1
section3 += str(scores[index][opponent_index])
section3 += ' pt/round: ' + modules[index].team_name +'(P'
section3 += str(index)+') "'+modules[index].strategy_name + '"\n'
# Line 2
section3 += str(scores[opponent_index][index])
section3 += ' pt/round: ' + modules[opponent_index].team_name +'(P'
section3 += str(opponent_index)+') "'+modules[opponent_index].strategy_name + '"\n'
# Lines 3-4
hist1, hist2 = capitalize(moves[index][opponent_index], moves[opponent_index][index])
while len(hist1) > 1:
section3 += hist1[:80] + '\n'
section3 += hist2[:80] + '\n\n'
hist1 = hist1[80:]
hist2 = hist2[80:]
section3 += '-'*80 + '\n'
return section3
def capitalize(history1, history2):
'''Accept two strings of equal length.
Return the same two strings but capitalizing the opponent of 'c' each round.
'''
caphistory1, caphistory2 = '', ''
for i in range(len(history1)):
p1 = history1[i]
p2 = history2[i]
if p1 == 'c':
p2 = p2.upper()
if p2 in 'cC':
p1 = p1.upper()
caphistory1 += p1
caphistory2 += p2
return caphistory1, caphistory2
def make_code_string(modules):
'''Returns a string of the code from each file.
'''
code = '-'*80 + '\n'
code += 'Code of each player\'s algorithm\n'
code = '-'*80 + '\n'
for index in range(len(modules)):
players_code_filename = str(modules[index]).split(' ')[1].replace('\'','')
directory = os.path.dirname(os.path.abspath(__file__))
filename = os.path.join(directory, players_code_filename)
players_code_file = open(filename+'.py', 'r')
code += '-'*80 + '\n'
code += players_code_filename
code +='-'*80 + '\n'
code += ''.join(players_code_file.readlines())
return code
def copy_template():
'''Transfer code in team0.py to team1.py though team14.py
'''
directory = os.path.dirname(os.path.abspath(__file__))
with open(os.path.join(directory, 'team0.py'), 'r') as sourcefile:
source = sourcefile.readlines()
for i in range(1, 15):
target = 'team'+str(i)+'.py'
filename = os.path.join(directory, target)
with open(filename, 'w') as target_file:
target_file.write(''.join(source))
def post_to_api():
pass
def post_to_local_html():
pass
def post_to_file(string, filename='tournament.txt', directory=''):
'''Write output in a txt file.
'''
# Use the same directory as the python script
if directory=='':
directory = os.path.dirname(os.path.abspath(__file__))
# Name the file tournament.txt
filename = os.path.join(directory, filename)
# Create the file for the round-by-round results
filehandle = open(filename,'w')
filehandle.write(string)
### Call main_play() if this file is executed
if __name__ == '__main__':
scores, moves, reports = main_play(modules[0:4])
section0, section1, section2, section3 = reports