rank est in bots

sanderland · Jun 27, 2020 · aaa2e81 · aaa2e81
1 parent 853e340
commit aaa2e81
Show file tree

Hide file tree

Showing 7 changed files with 144 additions and 115 deletions.
diff --git a/ai2gtp.py b/ai2gtp.py
@@ -8,6 +8,8 @@
 import traceback
 import math
 
+from rank_utils import rank_game
+
 os.environ["KCFG_KIVY_LOG_LEVEL"] = os.environ.get("KCFG_KIVY_LOG_LEVEL", "warning")
 
 
@@ -25,7 +27,7 @@
 REPORT_SCORE_THRESHOLD = 1.5
 MAX_WAIT_ANALYSIS = 10
 MAX_PASS = 3  # after opponent passes this many times, we always pass
-
+len_segment = 80
 
 logger = Logger()
 
@@ -69,6 +71,13 @@ def rank_to_string(r):
         return f"{30 - r}k"
 
 
+def format_rank(rank):
+    if rank <= 0:
+        return f"{1 - rank:.1f}d"
+    else:
+        return f"{rank:.1f}k"
+
+
 def malkovich_analysis(cn):
     start = time.time()
     while not cn.analysis_ready:
@@ -202,6 +211,15 @@ def malkovich_analysis(cn):
                 )
                 if any(gamedata["players"][p]["username"] == "katrain-dev-beta" for p in ["white", "black"]):
                     sgf_dir = "sgf_ogs_beta/"
+
+                if game.board_size == (19, 19):
+                    ranks = rank_game(game, len_segment)
+                    if ranks:
+                        for start, end, rank in ranks:
+                            print(
+                                f"DISCUSSION: Experimental Rank Estimation for moves {start:3d} to {end:3d}: B ~ {format_rank(rank['B'])}, W ~ {format_rank(rank['W'])}"
+                            )
+
             except Exception as e:
                 _, _, tb = sys.exc_info()
                 logger.log(f"error while processing gamedata: {e}\n{traceback.format_tb(tb)}", OUTPUT_ERROR)

diff --git a/analyze_rank.py b/analyze_rank.py
@@ -1,122 +1,34 @@
-import math, glob, time, os
-import numpy as np
+import glob
 
 from katrain.core.base_katrain import KaTrainBase
 from katrain.core.game import Game, KaTrainSGF
 from katrain.core.engine import KataGoEngine
+from rank_utils import rank_game
 
-def gauss(data):
-    return math.exp(-1 * (data) ** 2)
 
-def median(data):
-    sorteddata = sorted(data)
-    lendata = len(data)
-    index = (lendata - 1) // 2
-    if (lendata % 2):
-        return sorteddata[index]
+def format_rank(rank):
+    if rank <= 0:
+        return f"{1-rank:5.1f}d"
     else:
-        return (sorteddata[index] + sorteddata[index + 1])/2.0
-
-def averagemod(data):
-    sorteddata = sorted(data)
-    lendata = len(data)
-    return sum(sorteddata[int(lendata * 0.2) : int(lendata * 0.8) + 1]) / (
-        (int(lendata * 0.8) + 1) - int(lendata * 0.2)
-    )  # average without the best and worst 20% of ranks
-
-
-def calculate_rank_for_player(segment_stats, num_intersec, player):
-        non_obvious_moves = [
-            (nl, r, val)
-            for nl, r, val, pl in segment_stats
-            if nl is not None and val < (0.8 * (1 - (num_intersec - nl) / num_intersec * 0.5)) and pl == player
-        ]
-        num_legal, rank, value = zip(*non_obvious_moves)
-        rank = list(rank)
-        for (i, item) in enumerate(rank):
-            if item > num_legal[i] * 0.09:
-                rank[i] = num_legal[i] * 0.09
-        rank = tuple(rank)
-        averagemod_rank = averagemod(rank)
-        averagemod_len_legal = averagemod(num_legal)
-        norm_avemod_len_legal = averagemod_len_legal / num_intersec
-        if averagemod_rank > 0.1:
-            rank_kyu = (
-                -0.97222
-                * math.log(averagemod_rank)
-                / (0.24634 + averagemod_rank * gauss(3.3208 * (norm_avemod_len_legal)))
-                + 12.703 * (norm_avemod_len_legal)
-                + 11.198 * math.log(averagemod_rank)
-                + 12.28 * gauss(2.379 * (norm_avemod_len_legal))
-                - 16.544
-            )
-        else:
-            rank_kyu = -4
-        if rank_kyu < -4:
-            rank_kyu = -4
-        return rank_kyu  # dan rank
-
-
-def calculate_rank_for_player_alternative_try(segment_stats, num_intersec, player):
-    non_obvious_moves = [
-        (nl, r, val)
-        for nl, r, val, pl in segment_stats
-        if val < (0.8 * (1 - (num_intersec - nl) / num_intersec * 0.5)) and pl == player
-    ]
-    num_legal, rank, value = zip(*non_obvious_moves)
-    # we expect r = (ll-npicked)/(npicked+1) so naively say npicked = (ll - r)/(r+1)
-    est_n_picked = [(nl - r) / (r + 1) for nl, r in zip(num_legal, rank)]
-    n_moves = np.mean(est_n_picked)
-    rank_kyu = (
-        math.log10(n_moves * 361 / num_intersec) - 1.9482
-    ) / -0.05737  # using the calibration curve of p:pick:rank
-    return rank_kyu
-
-
-def calculate_ranks(segment_stats, num_intersec):
-    return {pl: calculate_rank_for_player(segment_stats, num_intersec, pl) for pl in "BW"}
-
-
-def rank_game(game, len_segment):
-    game.redo(999)
-    moves = game.current_node.nodes_from_root[1:]  # without root
-    while not all(m.analysis_ready for m in moves):
-        time.sleep(0.01)
-
-    parent_policy_per_move = [move.parent.policy_ranking for move in moves]
-    num_legal_moves = [sum(pv >= 0 for pv, _ in policy_ranking) for policy_ranking in parent_policy_per_move]
-    policy_stats = [
-        [(num_mv, rank, value, mv.player) for rank, (value, mv) in enumerate(policy_ranking) if mv == move.move][0]
-        for move, policy_ranking, num_mv in zip(moves, parent_policy_per_move, num_legal_moves)
-    ]
-    size = game.board_size
-    num_intersec = size[0] * size[1]
-    half_seg = len_segment // 2
-
-    ranks = [[1, len(moves), {}]]  # entire game
-    for segment_mid in range(half_seg, len(moves), half_seg):
-        bounds = (segment_mid - half_seg, min(segment_mid + half_seg, len(moves)))
-        rank = calculate_ranks(policy_stats[bounds[0] : bounds[1]], num_intersec)
-        ranks.append([bounds[0] + 1, bounds[1], rank])
-    ranks[0][2]['B'] = median([sl[2]['B'] for sl in ranks[1:]])
-    ranks[0][2]['W'] = median([sl[2]['W'] for sl in ranks[1:]])
-    return ranks
+        return f"{rank:5.1f}k"
 
 
 if __name__ == "__main__":
-    kt = KaTrainBase()
+    kt = KaTrainBase(force_package_config=True)
     e_config = kt.config("engine")
     e_config["max_visits"] = e_config["fast_visits"] = 1  # since it's just policy anyway
     engine = KataGoEngine(kt, e_config)
 
-    for filename in [
-        "sgf_ogs\katrain_tsstaff (6k) vs katrain-weighted (6k) 2020-06-09 15 52 45_W+72.9.sgf"
-    ]:  # glob.glob("sgf_ogs/*.sgf"):
+    for filename in glob.glob("sgf_ogs/*.sgf"):
         game = Game(kt, engine, move_tree=KaTrainSGF.parse_file(filename))
         size = game.board_size
-        len_segment = round(50 * size[0] * size[1] / 361)
+        len_segment = 80
 
         ranks = rank_game(game, len_segment)
+        if not ranks:
+            continue
         print("* File name: {0:s}".format(filename))
         for start, end, rank in ranks:
-            print(f"\tMove quality for moves {start:3d} to {end:3d}\tB: {rank['B']:5.1f}k\tW: {rank['W']:5.1f}k")
+            print(
+                f"\tMove quality for moves {start:3d} to {end:3d}\tB: {format_rank(rank['B'])}\tW: {format_rank(rank['W'])}"
+            )
diff --git a/engine_server.py b/engine_server.py
@@ -14,7 +14,7 @@
 ENGINE_SETTINGS = {
     "katago": "katago/katago25",
     "model": "katrain/models/g170e-b15c192-s1672170752-d466197061.bin.gz",
-    #"model": "~/Desktop/g170e-b20c256x2-s5303129600-d1228401921.bin.gz",
+    # "model": "~/Desktop/g170e-b20c256x2-s5303129600-d1228401921.bin.gz",
     "config": "katrain/KataGo/analysis_config.cfg",
     "max_visits": 50,
     "max_time": 1.0,

diff --git a/move-eval-interpolate.py b/move-eval-interpolate.py
@@ -14,10 +14,10 @@
 
 plt.xlabel("Move #")
 plt.ylabel("kyu rank")
-plt.plot(x, yB, 'ok', label='Black estimated kyu')
-plt.plot(x, yW, 'og', label='White estimated kyu')
-plt.plot(xn, yBn, label='Black estimated kyu interpolated')
-plt.plot(xn, yWn, label='White estimated kyu interpolated')
+plt.plot(x, yB, "ok", label="Black estimated kyu")
+plt.plot(x, yW, "og", label="White estimated kyu")
+plt.plot(xn, yBn, label="Black estimated kyu interpolated")
+plt.plot(xn, yWn, label="White estimated kyu interpolated")
 
 plt.legend()
 plt.show()
diff --git a/rank_utils.py b/rank_utils.py
@@ -0,0 +1,103 @@
+import math, time
+
+
+def gauss(data):
+    return math.exp(-1 * (data) ** 2)
+
+
+def median(data):
+    sorteddata = sorted(data)
+    lendata = len(data)
+    index = (lendata - 1) // 2
+    if lendata % 2:
+        return sorteddata[index]
+    else:
+        return (sorteddata[index] + sorteddata[index + 1]) / 2.0
+
+
+def averagemod(data):
+    sorteddata = sorted(data)
+    lendata = len(data)
+    return sum(sorteddata[int(lendata * 0.2) : int(lendata * 0.8) + 1]) / (
+        (int(lendata * 0.8) + 1) - int(lendata * 0.2)
+    )  # average without the best and worst 20% of ranks
+
+
+def calculate_rank_for_player(segment_stats, num_intersec, player):
+    non_obvious_moves = [
+        (nl, r, val)
+        for nl, r, val, pl in segment_stats
+        if nl is not None and val < (0.8 * (1 - (num_intersec - nl) / num_intersec * 0.5)) and pl == player
+    ]
+    num_legal, rank, value = zip(*non_obvious_moves)
+    rank = list(rank)
+    for (i, item) in enumerate(rank):
+        if item > num_legal[i] * 0.09:
+            rank[i] = num_legal[i] * 0.09
+    rank = tuple(rank)
+    averagemod_rank = averagemod(rank)
+    averagemod_len_legal = averagemod(num_legal)
+    norm_avemod_len_legal = averagemod_len_legal / num_intersec
+    if averagemod_rank > 0.1:
+        rank_kyu = (
+            -0.97222 * math.log(averagemod_rank) / (0.24634 + averagemod_rank * gauss(3.3208 * (norm_avemod_len_legal)))
+            + 12.703 * (norm_avemod_len_legal)
+            + 11.198 * math.log(averagemod_rank)
+            + 12.28 * gauss(2.379 * (norm_avemod_len_legal))
+            - 16.544
+        )
+    else:
+        rank_kyu = -4
+    if rank_kyu < -4:
+        rank_kyu = -4
+    return rank_kyu  # dan rank
+
+
+def calculate_ranks(segment_stats, num_intersec):
+    return {pl: calculate_rank_for_player(segment_stats, num_intersec, pl) for pl in "BW"}
+
+
+def rank_game(game, len_segment):
+    game.redo(999)
+    moves = game.current_node.nodes_from_root[1:]  # without root
+    if len(moves) < 1.5 * len_segment:
+        return None
+
+    while not all(m.analysis_ready for m in moves):
+        time.sleep(0.01)
+
+    parent_policy_per_move = [move.parent.policy_ranking for move in moves]
+    num_legal_moves = [sum(pv >= 0 for pv, _ in policy_ranking) for policy_ranking in parent_policy_per_move]
+    policy_stats = [
+        [(num_mv, rank, value, mv.player) for rank, (value, mv) in enumerate(policy_ranking) if mv == move.move][0]
+        for move, policy_ranking, num_mv in zip(moves, parent_policy_per_move, num_legal_moves)
+    ]
+    size = game.board_size
+    num_intersec = size[0] * size[1]
+    half_seg = len_segment // 2
+
+    ranks = [[1, len(moves), {}]]  # entire game
+    for segment_mid in range(half_seg, len(moves), half_seg):
+        bounds = (segment_mid - half_seg, min(segment_mid + half_seg, len(moves)))
+        if bounds[1] - bounds[0] >= 0.75 * len_segment:
+            rank = calculate_ranks(policy_stats[bounds[0] : bounds[1]], num_intersec)
+            ranks.append([bounds[0] + 1, bounds[1], rank])
+    ranks[0][2]["B"] = median([sl[2]["B"] for sl in ranks[1:]])
+    ranks[0][2]["W"] = median([sl[2]["W"] for sl in ranks[1:]])
+    return ranks
+
+
+# def calculate_rank_for_player_alternative_try(segment_stats, num_intersec, player):
+#    non_obvious_moves = [
+#        (nl, r, val)
+#        for nl, r, val, pl in segment_stats
+#        if val < (0.8 * (1 - (num_intersec - nl) / num_intersec * 0.5)) and pl == player
+#    ]
+#    num_legal, rank, value = zip(*non_obvious_moves)
+#    # we expect r = (ll-npicked)/(npicked+1) so naively say npicked = (ll - r)/(r+1)
+#    est_n_picked = [(nl - r) / (r + 1) for nl, r in zip(num_legal, rank)]
+#    n_moves = np.mean(est_n_picked)
+#    rank_kyu = (
+#        math.log10(n_moves * 361 / num_intersec) - 1.9482
+#    ) / -0.05737  # using the calibration curve of p:pick:rank
+#    return rank_kyu
diff --git a/selfplay.py b/selfplay.py
@@ -48,7 +48,7 @@ class AI:
     DEFAULT_ENGINE_SETTINGS = {
         "katago": "katrain/KataGo/katago",
         "model": "katrain/models/g170e-b15c192-s1672170752-d466197061.bin.gz",
-#        "config": "lowmem.cfg",
+        #        "config": "lowmem.cfg",
         "config": "kata_config.cfg",
         "max_visits": 1,
         "max_time": 300.0,
@@ -147,7 +147,7 @@ def retrieve_ais(selected_ais):
 N_GAMES = 5
 BOARDSIZE = 19
 
-ais_to_test = retrieve_ais(test_ais+reference_ais)
+ais_to_test = retrieve_ais(test_ais + reference_ais)
 
 results = defaultdict(list)
 
@@ -204,7 +204,7 @@ def fmt_score(score):
         e.shutdown()
     AI.ENGINES = []
 
-    with ThreadPoolExecutor(max_workers=4*AI.NUM_THREADS) as threadpool:
+    with ThreadPoolExecutor(max_workers=4 * AI.NUM_THREADS) as threadpool:
         for b in ais_to_test:
             for w in ais_to_test:
                 if b is not w:

diff --git a/settings.py b/settings.py
@@ -6,10 +6,6 @@
 from katrain.core.constants import *
 
 
-class PLayer(object):
-    pass
-
-
 class Logger:
     def log(self, msg, level=OUTPUT_INFO):
         if level <= OUTPUT_INFO: