4 # Author:: Daigo Moriwaki
5 # Homepage:: http://sourceforge.jp/projects/shogi-server/
8 # Copyright (C) 2006-2012 Daigo Moriwaki <daigo at debian dot org>
10 # This program is free software; you can redistribute it and/or modify
11 # it under the terms of the GNU General Public License as published by
12 # the Free Software Foundation; either version 2 of the License, or
13 # (at your option) any later version.
15 # This program is distributed in the hope that it will be useful,
16 # but WITHOUT ANY WARRANTY; without even the implied warranty of
17 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 # GNU General Public License for more details.
20 # You should have received a copy of the GNU General Public License
21 # along with this program; if not, write to the Free Software
22 # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
27 # mk_rate reads game results files generated by the mk_game_results command,
28 # calculates rating scores of each player, and then outputs a yaml file
29 # (players.yaml) that Shogi-server can recognize.
33 # ./mk_rate [options] GAME_RESULTS_FILE [...]
38 # a path to a file listing results of games, which is generated by the
39 # mk_game_results command.
40 # In the second style above, the file content can be read from the stdin.
42 # --abnormal-threshold::
43 # n [plies] (default 30)
44 # Games that end with the 'abnormal' status are counted in win/lost games
45 # for the rating calculation if a game plays more than n plies. Otherwise
46 # (or if n is zero), abnormal games are counted out of rating games.
49 # a base time point for this calculation (default now). Ex. '2009-10-31'
52 # n [days] (default 60)
54 # --half-life-ignore::
55 # m [days] (default 7)
56 # after m days, the half-life effect works
59 # m [days] (default 365*2)
60 # old results will be ignored
62 # --fixed-rate-player::
63 # player whose rate is fixed at the rate
69 # skip draw games. [default: draw games are counted in as 0.5 win and 0.5
77 # Sample command lines that install the prerequisites will work on Debian.
79 # * Ruby 1.9.3 or 1.8.7 (including Rubygems)
81 # $ sudo aptitude install ruby1.9.1
83 # * Ruby bindings for the GNU Scientific Library (GSL[http://rb-gsl.rubyforge.org/])
85 # $ sudo aptitude install ruby-gsl
87 # * RGL: {Ruby Graph Library}[http://rubyforge.org/projects/rgl/]
89 # $ sudo gem1.9.1 install rgl
93 # $ ./mk_rate game_results.txt > players.yaml
95 # $ ./mk_game_results . | ./mk_rate > players.yaml
97 # If you do not want the file to be updated in case of errors,
99 # $ ./mk_rate game_results.txt && ./mk_rate game_results.txt > players.yaml
101 # == How players are rated
103 # Games and players are rated under the following conditions:
105 # * Rated games, which were played by both rated players.
106 # * Rated players, who logged in the server with a name followed by a trip: "name,trip".
107 # * (Rated) players, who played more than $GAMES_LIMIT [15] (rated) games.
110 $:.unshift(File.dirname(File.expand_path(__FILE__)))
111 require 'utils/csa-filter'
118 require 'rgl/adjacency'
119 require 'rgl/connected_components'
121 #################################################
125 # Count out players who play fewer games than $GAMES_LIMIT
126 $GAMES_LIMIT = $DEBUG ? 0 : 15
133 # Holds the last time when a player gamed
134 $players_time = Hash.new { Time.at(0) }
135 # Holds history of input lines to check duplicated inputs
139 #################################################
140 # Keeps the value of the lowest key
148 if @lowest.empty? || key < @lowest[0]
149 @lowest = [key, value]
162 #################################################
163 # Calculates rates of every player from a Win Loss GSL::Matrix
168 # The model of the win possibility is 1/(1 + 10^(-d/400)).
169 # The equation in this class is 1/(1 + e^(-Kd)).
170 # So, K should be calculated like this.
171 K = Math.log(10.0) / 400.0
173 # Convergence limit to stop Newton method.
175 # Stop Newton method after this many iterations.
178 # Average rate among the players
187 # Calculates the average of the vector.
189 def Rating.average(vector, mean=0.0)
190 sum = Array(vector).inject(0.0) {|sum, n| sum + n}
191 vector -= GSL::Vector[*Array.new(vector.size, sum/vector.size - mean)]
198 def initialize(win_loss_matrix)
202 when GSL::Matrix, GSL::Matrix::Int
211 attr_reader :rate, :n
215 (0...@size).collect {|k| yield k}
220 (0...@size).each {|k| yield k}
224 # The probability that player k will beat player i.
227 1.0/(1.0 + exp(@rate[i]-@rate[k]))
231 # Most possible equation
238 sum += @n[k,i] * win_rate(i,k) - @n[i,k] * win_rate(k,i)
245 # / f0/R0 f0/R1 f0/R2 ... \
246 # dfk/dRj = | f1/R0 f1/R1 f1/R2 ... |
247 # \ f2/R0 f2/R1 f2/R2 ... /
253 sum += win_rate(i,k) * win_rate(k,i) * (@n[k,i] + @n[i,k])
257 sum = 2.0 * win_rate(j,k) * win_rate(k,j) * (@n[k,j] + @n[j,k])
263 # Jacobi matrix of the func().
269 (0...@size).collect do |k|
270 (0...@size).collect do |j|
278 # The initial value of the rate, which is very important for Newton's
279 # method. This is based on my heuristics; the higher the win probability of
280 # a player is, the more points he takes.
285 v = GSL::Vector[0, 0]
288 v += GSL::Vector[@n[k,i], @n[i,k]]
290 v.nrm2 < 1 ? 0 : v[0] / (v[0] + v[1])
292 rank = possibility.sort_index
293 @rate = player_vector do |k|
294 K*500 * (rank[k]+1) / @size
300 # Resets @rate so that the higher the current win probability of a player is,
301 # the more points he takes.
304 @rate = @record.get || @rate
305 rank = @rate.sort_index
306 @rate = player_vector do |k|
307 K*@count*1.5 * (rank[k]+1) / @size
312 # mu is the deaccelrating parameter in Deaccelerated Newton method
313 def deaccelrate(mu, old_rate, a, old_f_nrm2)
314 @rate = old_rate - a * mu
315 if func_vector.nrm2 < (1 - mu / 4.0 ) * old_f_nrm2 then
319 @record.set(func_vector.nrm2, @rate)
323 $stderr.puts "mu: %f " % [mu] if $DEBUG
324 deaccelrate(mu*0.5, old_rate, a, old_f_nrm2)
328 # Main process to calculate ratings.
331 # Counter to stop the process.
332 # Calculation in Newton's method may fall into an infinite loop
337 # Solve the equation:
339 # @rate_(n+1) = @rate_(n) - a
341 # f.nrm2 should approach zero.
345 # $stderr.puts "j: %s" % [j.inspect] if $DEBUG
346 $stderr.puts "f: %s -> %f" % [f.to_a.inspect, f.nrm2] if $DEBUG
348 # GSL::Linalg::LU.solve or GSL::Linalg::HH.solve would be available instead.
349 #a = GSL::Linalg::HH.solve(j, f)
350 a, = GSL::MultiFit::linear(j, f)
351 a = self.class.average(a)
352 # $stderr.puts "a: %s -> %f" % [a.to_a.inspect, a.nrm2] if $DEBUG
354 # Deaccelerated Newton method
355 # GSL::Vector object should be immutable.
358 old_f_nrm2 = old_f.nrm2
359 deaccelrate(1.0, old_rate, a, old_f_nrm2)
360 #@rate -= a # Instead, do not deaccelerate
361 @record.set(func_vector.nrm2, @rate)
363 $stderr.printf "|error| : %5.2e\n", a.nrm2 if $DEBUG
366 if @count > COUNT_MAX
367 $stderr.puts "Values seem to oscillate. Stopped the process."
368 $stderr.puts "f: %s -> %f" % [func_vector.to_a.inspect, func_vector.nrm2]
372 end while (a.nrm2 > ERROR_LIMIT * @rate.nrm2)
375 $stderr.puts "resolved f: %s -> %f" %
376 [func_vector.to_a.inspect, func_vector.nrm2] if $DEBUG
377 $stderr.puts "Count: %d" % [@count] if $DEBUG
385 # Make the values of @rate finite.
388 @rate = @rate.collect do |a|
390 a.infinite? * AVERAGE_RATE * 100
398 # Flatten the values of @rate.
400 def average!(mean=0.0)
401 @rate = self.class.average(@rate, mean)
407 def translate!(value)
412 # Make the values of @rate integer.
415 @rate = @rate.collect do |a|
421 a.infinite? * AVERAGE_RATE * 100
427 #################################################
428 # Encapsulate a pair of keys and win loss matrix.
429 # - keys is an array of player IDs; [gps+123, foo+234, ...]
430 # - matrix holds games # where player i (row index) beats player j (column index).
431 # The row and column indexes match with the keys.
433 # This object should be immutable. If an internal state is being modified, a
434 # new object is always returned.
442 def self.mk_matrix(players)
443 keys = players.keys.sort
447 ((0...size).collect do |k|
449 p1_hash = players[p1]
450 ((0...size).collect do |j|
455 v = p1_hash[p2] || GSL::Vector[0,0]
460 return WinLossMatrix.new(keys, matrix)
463 def self.mk_win_loss_matrix(players)
464 obj = mk_matrix(players)
472 # an array of player IDs; [gps+123, foo+234, ...]
475 # matrix holds games # where player i (row index) beats player j (column index).
476 # The row and column indexes match with the keys.
479 def initialize(keys, matrix)
485 # Returns the size of the keys/matrix
496 # Removes players in the given rows, such as [1,3,5], and then returns a new
499 def delete_rows(rows)
500 rows = rows.sort.reverse
503 (0...size).each do |i|
504 next if rows.include?(i)
505 row = @matrix.row(i).clone
511 if copied_cols.size == 0
512 new_matrix = GSL::Matrix.new
514 new_matrix = GSL::Matrix[*copied_cols]
517 new_keys = @keys.clone
519 new_keys.delete_at(j)
522 return WinLossMatrix.new(new_keys, new_matrix)
526 # Removes players who do not meet the criteria to be rated, and returns a
530 $stderr.puts @keys.inspect if $DEBUG
531 $stderr.puts @matrix.inspect if $DEBUG
533 (0...size).each do |i|
538 if win < 1 || loss < 1 || win + loss < $GAMES_LIMIT
543 # The recursion ends if there is nothing to delete
544 return self if delete.empty?
546 new_obj = delete_rows(delete)
551 # Cuts self into connected groups such that each player in a group has at least
552 # one game with other players in the group. Returns them as an array.
554 def connected_subsets
555 g = RGL::AdjacencyGraph.new
556 (0...size).each do |k|
557 (0...size).each do |i|
566 g.each_connected_component do |c|
569 new_keys << keys[v.to_s.to_i]
574 subsets = subsets.sort {|a,b| b.size <=> a.size}
576 result = subsets.collect do |keys|
579 ((0...keys.size).collect do |k|
580 p1 = @keys.index(keys[k])
581 ((0...keys.size).collect do |j|
585 p2 = @keys.index(keys[j])
590 WinLossMatrix.new(keys, matrix)
597 "size : #{@keys.size}" + "\n" +
598 @keys.inspect + "\n" +
605 #################################################
610 # After "half-life" days (counted past the "half-life-ignore" period) the value is halved.
611 # 0.693 is a constant (~ ln 2), where exp(-0.693) ~ 0.5
613 if days < $options["half-life-ignore"]
616 Math::exp(-0.693/$options["half-life"]*(days-$options["half-life-ignore"]))
620 def _add_win_loss(winner, loser, time)
621 how_long_days = ($options["base-date"] - time)/(3600*24)
622 $players[winner] ||= Hash.new { GSL::Vector[0,0] }
623 $players[loser] ||= Hash.new { GSL::Vector[0,0] }
624 $players[winner][loser] += GSL::Vector[1.0*half_life(how_long_days),0]
625 $players[loser][winner] += GSL::Vector[0,1.0*half_life(how_long_days)]
628 def _add_draw(player1, player2, time)
629 how_long_days = ($options["base-date"] - time)/(3600*24)
630 $players[player1] ||= Hash.new { GSL::Vector[0,0] }
631 $players[player2] ||= Hash.new { GSL::Vector[0,0] }
632 $players[player1][player2] += GSL::Vector[0.5*half_life(how_long_days),0.5*half_life(how_long_days)]
633 $players[player2][player1] += GSL::Vector[0.5*half_life(how_long_days),0.5*half_life(how_long_days)]
636 def _add_time(player, time)
637 $players_time[player] = time if $players_time[player] < time
640 def add(black_mark, black_name, white_name, white_mark, time)
641 if black_mark == WIN_MARK && white_mark == LOSS_MARK
642 _add_win_loss(black_name, white_name, time)
643 elsif black_mark == LOSS_MARK && white_mark == WIN_MARK
644 _add_win_loss(white_name, black_name, time)
645 elsif black_mark == DRAW_MARK && white_mark == DRAW_MARK
646 if $options["skip-draw-games"]
649 _add_draw(black_name, white_name, time)
652 raise "Never reached!"
654 _add_time(black_name, time)
655 _add_time(white_name, time)
659 if /@NORATE\+/ =~ id # the player having @NORATE in the name should not be rated
662 id.gsub(/@.*?\+/,"+")
665 # Parse a game result line
668 if $history.include? line
669 $stderr.puts "[WARNING] Duplicated: #{line}"
674 time, state, black_mark, black_id, white_id, white_mark, file = line.split("\t")
675 unless time && state && black_mark && black_id &&
676 white_id && white_mark && file
677 $stderr.puts "Failed to parse the line : #{line}"
681 if state == "abnormal"
682 csa = CsaFileReader.new(file, "EUC-JP")
683 if $options["abnormal-threshold"] == 0 || csa.ply <= $options["abnormal-threshold"]
687 time = Time.parse(time)
688 return if $options["base-date"] < time
689 how_long_days = ($options["base-date"] - time)/(3600*24)
690 if (how_long_days > $options["ignore"])
694 black_id = identify_id(black_id)
695 white_id = identify_id(white_id)
697 if black_id && white_id && (black_id != white_id) &&
698 black_mark && white_mark
699 add(black_mark, black_id, white_id, white_mark, time)
704 yaml["players"].each do |group_key, group|
705 group.each do |player_key, player|
706 rate = player['rate']
708 if rate > 10000 || rate < -10000
718 USAGE: #{$0} [options] GAME_RESULTS_FILE [...]
722 a path to a file listing results of games, which is genrated by the
723 mk_game_results command.
724 In the second style above, the file content can be read from the stdin.
727 --base-date a base time point for this calicuration (default now). Ex. '2009-10-31'
728 --half-life n [days] (default 60)
729 --half-life-ignore m [days] (default 7)
730 after m days, half-life effect works
731 --ignore n [days] (default 730 [=365*2]).
732 Results older than n days from the 'base-date' are ignored.
733 --fixed-rate-player player whose rate is fixed at the rate
735 --skip-draw-games skip draw games. [default: draw games are counted in
736 as 0.5 win and 0.5 lost]
737 --help show this message
743 parser = GetoptLong.new(
744 ["--abnormal-threshold", GetoptLong::REQUIRED_ARGUMENT],
745 ["--base-date", GetoptLong::REQUIRED_ARGUMENT],
746 ["--half-life", GetoptLong::REQUIRED_ARGUMENT],
747 ["--half-life-ignore", GetoptLong::REQUIRED_ARGUMENT],
748 ["--help", "-h", GetoptLong::NO_ARGUMENT],
749 ["--ignore", GetoptLong::REQUIRED_ARGUMENT],
750 ["--fixed-rate-player", GetoptLong::REQUIRED_ARGUMENT],
751 ["--fixed-rate", GetoptLong::REQUIRED_ARGUMENT],
752 ["--skip-draw-games", GetoptLong::NO_ARGUMENT])
755 parser.each_option do |name, arg|
757 $options[name] = arg.dup
759 if ( $options["fixed-rate-player"] && !$options["fixed-rate"]) ||
760 (!$options["fixed-rate-player"] && $options["fixed-rate"]) ||
761 ( $options["fixed-rate-player"] && $options["fixed-rate"].to_i <= 0)
767 raise parser.error_message
773 if $options["base-date"]
774 $options["base-date"] = Time::parse $options["base-date"]
776 $options["base-date"] = Time.now
778 $options["abnormal-threshold"] ||= 30
779 $options["abnormal-threshold"] = $options["abnormal-threshold"].to_i
780 $options["half-life"] ||= 60
781 $options["half-life"] = $options["half-life"].to_i
782 $options["half-life-ignore"] ||= 7
783 $options["half-life-ignore"] = $options["half-life-ignore"].to_i
784 $options["ignore"] ||= 365*2
785 $options["ignore"] = $options["ignore"].to_i
786 $options["fixed-rate"] = $options["fixed-rate"].to_i if $options["fixed-rate"]
789 while line = $stdin.gets do
793 while file = ARGV.shift do
794 File.open(file) do |f|
795 f.each_line do |line|
806 obj = WinLossMatrix::mk_win_loss_matrix($players)
807 obj.connected_subsets.each do |win_loss_matrix|
808 yaml["players"][rating_group] = {}
810 rating = Rating.new(win_loss_matrix.matrix)
812 rating.average!(Rating::AVERAGE_RATE)
815 if $options["fixed-rate-player"]
816 # first, try exact match
817 index = win_loss_matrix.keys.index($options["fixed-rate-player"])
818 # second, try regular match
820 win_loss_matrix.keys.each_with_index do |p, i|
821 if %r!#{$options["fixed-rate-player"]}! =~ p
827 the_rate = rating.rate[index]
828 rating.translate!($options["fixed-rate"] - the_rate)
832 win_loss_matrix.keys.each_with_index do |p, i| # player_id, index#
833 win = win_loss_matrix.matrix.row(i).sum
834 loss = win_loss_matrix.matrix.col(i).sum
836 yaml["players"][rating_group][p] =
837 { 'name' => p.split("+")[0],
838 'rating_group' => rating_group,
839 'rate' => rating.rate[i],
840 'last_modified' => $players_time[p].dup,
848 non_rated_group = 999 # large enough
849 yaml["players"][non_rated_group] = {}
850 $players.each_key do |id|
851 # skip players who have already been rated
853 (0..rating_group).each do |i|
854 found = true if yaml["players"][i][id]
859 v = GSL::Vector[0, 0]
860 $players[id].each_value {|value| v += value}
861 next if v[0] < 1 && v[1] < 1
863 yaml["players"][non_rated_group][id] =
864 { 'name' => id.split("+")[0],
865 'rating_group' => non_rated_group,
867 'last_modified' => $players_time[id].dup,
871 unless validate(yaml)
872 $stderr.puts "Aborted. It did not result in valid ratings."
873 $stderr.puts yaml.to_yaml if $DEBUG
883 # vim: ts=2 sw=2 sts=0