-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathwl_ranking.py
executable file
·168 lines (150 loc) · 6.52 KB
/
wl_ranking.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
#!/usr/bin/env python3
import argparse
import json
import math
import sys
from collections import Counter, namedtuple
import utility
# Rating given to a player with no previous rating: mean MU, deviation SIGMA.
MU = 25.
SIGMA = MU / 3
# BETA**2 is added once per participating player to the variance term used
# by the update rules below.
BETA = SIGMA / 2
# A player's rating as a (mu, sigma) pair; sigma**2 is treated as a variance
# by the update rules.
Rating = namedtuple("Rating", ("mu", "sigma"))
"""
Rating system from the paper "A Bayesian Approximation Method for Online Ranking"
by Ruby Weng and Chih-Jen Lin
paper and original code found at
http://www.csie.ntu.edu.tw/~cjlin/papers/online_ranking/
"""
def wl_bt_ratings(game_results, last_ratings=None):
    """Weng-Lin Bradley-Terry Full Pair update rule ratings.

    Args:
        game_results: Re-iterable sequence of games (it is traversed twice).
            Each game is a mapping of player identifier to finishing rank,
            where a numerically lower rank beats a higher one and equal
            ranks count as a tie.
        last_ratings: Optional mapping of player identifier to a previous
            Rating. Players missing from it start at Rating(MU, SIGMA).

    Returns:
        A dict mapping every player that appears in game_results to its
        updated Rating. Players that only appear in last_ratings are not
        included. An empty game_results yields an empty dict.
    """
    if last_ratings is None:
        last_ratings = {}
    players = list(set(p for game in game_results for p in game))
    first = Rating(MU, SIGMA)
    mu = {p: last_ratings.get(p, first).mu for p in players}
    sigma = {p: last_ratings.get(p, first).sigma for p in players}

    # Bound up front so the progress summary after the loop cannot hit an
    # unbound name when game_results is empty.
    gnum = 0
    for gnum, game in enumerate(game_results, start=1):
        omega = {}
        delta = {}
        # Accumulate every player's adjustment from the pre-game ratings;
        # mu/sigma are only modified once the whole game has been processed.
        for player, prank in game.items():
            sigma_sq = sigma[player]**2
            omega[player] = 0.
            delta[player] = 0.
            for opp, orank in game.items():
                if opp == player:
                    continue
                ciq = math.sqrt(sigma_sq + sigma[opp]**2 + (2*BETA**2))
                # Expected score of `player` against `opp`.
                piq = 1. / (1. + math.exp((mu[opp] - mu[player]) / ciq))
                # Actual score: 1 for a win, 0.5 for a tie, 0 for a loss.
                if orank > prank:
                    s = 1
                elif orank == prank:
                    s = 0.5
                else:
                    s = 0
                omega[player] += (sigma_sq / ciq) * (s - piq)
                gamma = sigma[player] / ciq
                delta[player] += gamma * (sigma_sq / ciq) / ciq * piq * (1 - piq)
        for player in game:
            mu[player] += omega[player]
            # Floor the shrink factor so sigma always stays positive.
            sigma[player] *= math.sqrt(max(1 - delta[player], 0.0001))
        if gnum % 10000 == 0:
            # "\r" without a newline keeps the progress counter on one line.
            print("\rRated %d games" % (gnum,), end="")
    if gnum >= 10000:
        # Return to the start of the progress line before the final summary.
        print("\r", end="")
    if gnum > 5000:
        print("Rated %d games" % (gnum,))
    return {player: Rating(mu[player], sigma[player]) for player in players}
def wl_pl_ratings(game_results, last_ratings=None):
    """Weng-Lin Plackett-Luce update rule ratings.

    Args:
        game_results: Re-iterable sequence of games (it is traversed twice).
            Each game is a mapping of player identifier to finishing rank,
            where a numerically lower rank is the better result.
        last_ratings: Optional mapping of player identifier to a previous
            Rating. Players missing from it start at Rating(MU, SIGMA).

    Returns:
        A dict mapping every player that appears in game_results to its
        updated Rating. Players that only appear in last_ratings are not
        included. An empty game_results yields an empty dict.

    Prints "Found tied ranks" once for each game in which two or more
    players share a rank.
    """
    if last_ratings is None:
        last_ratings = {}
    players = list(set(p for game in game_results for p in game))
    first = Rating(MU, SIGMA)
    mu = {p: last_ratings.get(p, first).mu for p in players}
    sigma = {p: last_ratings.get(p, first).sigma for p in players}

    # Bound up front so the progress summary after the loop cannot hit an
    # unbound name when game_results is empty.
    gnum = 0
    for gnum, game in enumerate(game_results, start=1):
        c = math.sqrt(sum(sigma[p]**2 + BETA**2 for p in game))
        # Aq[rank] is the number of players that finished with that rank.
        Aq = Counter(game.values())
        # A tie exists when some rank is held by more than one player, so
        # inspect the counts rather than the rank values themselves.
        if any(count > 1 for count in Aq.values()):
            print("Found tied ranks")
        # For each player q: total strength of everyone ranked no better
        # than q (q included).
        sumCq = {q: sum(math.exp(mu[i] / c) for i in game if game[i] >= game[q])
                 for q in game}
        omega = {}
        delta = {}
        # Accumulate every player's adjustment from the pre-game ratings;
        # mu/sigma are only modified once the whole game has been processed.
        for player, prank in game.items():
            omega[player] = 0.
            delta[player] = 0.
            gamma = sigma[player] / c
            sigma_sq = sigma[player]**2
            strength = math.exp(mu[player] / c)
            for opp, orank in game.items():
                # Only entries ranked at or ahead of `player` contribute;
                # this includes the player itself.
                if orank > prank:
                    continue
                PiCq = strength / sumCq[opp]
                if player == opp:
                    mf = 1 - PiCq
                else:
                    mf = 0 - PiCq
                omega[player] += mf * (sigma_sq / (c * Aq[orank]))
                etaq = (gamma * sigma_sq) / (c**2 * Aq[orank])
                etaq *= PiCq * (1 - PiCq)
                delta[player] += etaq
        for player in game:
            mu[player] += omega[player]
            # Floor the shrink factor so sigma always stays positive.
            sigma[player] *= math.sqrt(max(1 - delta[player], 0.0001))
        if gnum % 10000 == 0:
            # "\r" without a newline keeps the progress counter on one line.
            print("\rRated %d games" % (gnum,), end="")
    if gnum >= 10000:
        # Return to the start of the progress line before the final summary.
        print("\r", end="")
    if gnum > 5000:
        print("Rated %d games" % (gnum,))
    return {player: Rating(mu[player], sigma[player]) for player in players}
def _conservative_score(rating):
    """Return the ranking score of a Rating: mu minus three sigma."""
    return rating.mu - (rating.sigma * 3)


def main(args=None):
    """Load game data, compute Weng-Lin ratings and report the ranking.

    Args:
        args: Command-line argument strings to parse. When None, argparse
            reads sys.argv[1:] at call time.

    The ranking is ordered by mu - 3 * sigma, best first. With --out-file
    the full ranking is written as "rank,player,score,mu,sigma" lines; the
    top --display entries (all when 0) are printed to standard output.
    """
    # The text must be passed as `description`; the first positional
    # parameter of ArgumentParser is `prog`, which replaces the program name
    # in the usage line.
    parser = argparse.ArgumentParser(
        description="Create Weng-Lin ratings from game data.")
    parser.add_argument("game_files", nargs="+",
                        help="Json files containing game data.")
    parser.add_argument("-d", "--display", type=int, default=40,
                        help="Limit display of rating to top N (0 for all)")
    parser.add_argument("-n", "--num-games", type=int,
                        help="Limit the number of games used "
                             "(positive for first, negative for last)")
    parser.add_argument("--remove-suspect", action="store_true",
                        help="Filter out suspect games based on workerID.")
    parser.add_argument("--no-error", action="store_true",
                        help="Filter out games that had bot errors.")
    parser.add_argument("-o", "--out-file",
                        help="If specified will write the full ratings to given filename")
    parser.add_argument("--plackett-luce", action="store_true",
                        help="Use Plackett-Luce update rule.")
    config = parser.parse_args(args)

    games = utility.load_games(config.game_files)
    if config.no_error:
        games = utility.filter_error_games(games)
        print("Filtered out error games, leaving %d" % (len(games),))
    if config.remove_suspect:
        start_num = len(games)
        games = utility.filter_suspect_games(games)
        print("Filtered out %d suspect games, leaving %d" % (
            start_num - len(games), len(games)))

    # One mapping per game: "username (userID)" -> integer finishing rank.
    game_results = [{"%s (%s)" % (u['username'], u['userID']): int(u['rank'])
                     for u in g['users']}
                    for g in games]
    if config.num_games:
        if config.num_games > 0:
            game_results = game_results[:config.num_games]
            print("Using first %d games." % (len(game_results),))
        else:
            # A negative count slices from the end of the list.
            game_results = game_results[config.num_games:]
            print("Using last %d games." % (len(game_results),))

    wl_ratings = wl_pl_ratings if config.plackett_luce else wl_bt_ratings
    ratings = wl_ratings(game_results)

    # Best conservative score first; the sort is stable for equal scores.
    ratings = sorted(ratings.items(),
                     key=lambda item: _conservative_score(item[1]),
                     reverse=True)
    if config.out_file:
        with open(config.out_file, 'w') as out:
            for rank, (player, rating) in enumerate(ratings, start=1):
                out.write('%d,%s,%f,%r,%r\n' % (
                    rank, player, _conservative_score(rating),
                    rating.mu, rating.sigma))

    if config.display > 0:
        ratings = ratings[:config.display]
    if not ratings:
        # Nothing to size the columns from; avoid log/max on empty input.
        print("No ratings to display.")
        return
    # Column widths: digits in the largest rank, and the longest player name.
    rwidth = len(str(len(ratings)))
    pwidth = max(len(player) for player, _ in ratings)
    for rank, (player, rating) in enumerate(ratings, start=1):
        print("%*d: %*s %.2f (%.2f, %.2f)" % (
            rwidth, rank, pwidth, player,
            _conservative_score(rating), rating.mu, rating.sigma))
# Run the command-line interface only when this file is executed as a
# script, not when it is imported as a module.
if __name__ == "__main__":
    main()