forked from pnprog/goreviewpartner
-
Notifications
You must be signed in to change notification settings - Fork 0
/
leela_zero_analysis.py
340 lines (273 loc) · 10 KB
/
leela_zero_analysis.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
# -*- coding: utf-8 -*-
from gtp import gtp, GtpException
import sys
from gomill import sgf, sgf_moves
from sys import exit,argv
from Tkinter import *
import sys
import os
import ConfigParser
from time import sleep
import os
import threading
import ttk
from toolbox import *
from toolbox import _
import tkMessageBox
class LeelaZeroAnalysis():
    """Analysis behaviour that drives a Leela Zero GTP bot over an SGF game.

    The methods read attributes this class never sets itself (``move_zero``,
    ``maxvariations``, ``stop_at_first_resign``, ``g``); presumably they are
    provided by the base class it gets combined with -- confirm against the
    callers.
    """

    def run_analysis(self, current_move):
        """Ask Leela Zero for its move at ``current_move`` and annotate the game.

        The bot answer is stored on the game node as "CBM", up to
        ``self.maxvariations`` candidate sequences are added as variations and
        the win rates are stored as "BWR"/"WWR". When the bot passes or
        resigns, only a comment is added to the node.

        Returns the first answer the bot gave for this position.
        """
        game_node = go_to_move(self.move_zero, current_move)
        player_color = guess_color_to_play(self.move_zero, current_move)
        bot = self.leela_zero
        final_answers = ["pass", "resign"]
        white_to_play = player_color in ('w', "W")

        log()
        log("==============")
        log("move", str(current_move))

        comments = ""
        if white_to_play:
            log("leela Zero play white")
            answer = bot.play_white()
        else:
            log("leela Zero play black")
            answer = bot.play_black()
        best_answer = answer

        all_moves = bot.get_all_leela_zero_moves()
        if answer.lower() in final_answers:
            log('adding "' + answer.lower() + '" to the sgf file')
            comments += "\n" + _("For this position, %s would %s" % ("Leela Zero", answer.lower()))
            if answer.lower() == "pass":
                bot.undo()
            elif answer.lower() == "resign":
                if self.stop_at_first_resign:
                    log("")
                    log("The analysis will stop now")
                    log("")
                    # an empty range leaves nothing more to analyse
                    self.move_range = []
        else:
            game_node.set("CBM", answer.lower())  # Computer Best Move

            deeper_moves = all_moves[:]
            nb_undos = 1
            # making sure the first line of play is more than one move deep
            while (" " not in deeper_moves[0][1]
                   and answer.lower() not in final_answers
                   and nb_undos <= 20):
                log("going deeper for first line of play (", nb_undos, ")")
                # even count: the analysed color plays, odd count: the other color
                if white_to_play == (nb_undos % 2 == 0):
                    answer = bot.play_white()
                else:
                    answer = bot.play_black()
                nb_undos += 1
                deeper_moves = bot.get_all_leela_zero_moves()
                if answer.lower() in final_answers:
                    log()
                    log("last play on the fist of play was", answer, "so leaving")
                    continue
                # extend the first sequence with what the bot just found
                all_moves[0][1] += " " + deeper_moves[0][1]
                if nb_undos % 2 == 1 and player_color.lower() in ('b', 'w'):
                    all_moves[0][2] = deeper_moves[0][2]
                else:
                    all_moves[0][2] = 100 - deeper_moves[0][2]

            # take back every move played on the bot's board above
            for unused_index in range(nb_undos):
                bot.undo()

            best_move_pending = True
            log("Number of alternative sequences:", len(all_moves))
            for sequence_first_move, one_sequence, one_value_network, one_policy_network, one_nodes in all_moves[:self.maxvariations]:
                log("Adding sequence starting from", sequence_first_move)
                previous_move = game_node.parent
                current_color = player_color

                # the value network figure is attributed to the color to play
                mover_rate = str(one_value_network) + '%'
                other_rate = str(100 - one_value_network) + '%'
                if player_color == 'b':
                    black_win_rate, white_win_rate = mover_rate, other_rate
                else:
                    black_win_rate, white_win_rate = other_rate, mover_rate

                for depth, one_deep_move in enumerate(one_sequence.split(' ')):
                    if one_deep_move.lower() in final_answers:
                        log("Leaving the variation when encountering", one_deep_move.lower())
                        break

                    coord_i, coord_j = gtp2ij(one_deep_move)
                    new_child = previous_move.new_child()
                    new_child.set_move(current_color, (coord_i, coord_j))

                    if depth == 0:
                        # only the first move of a variation carries the statistics
                        new_child.set("BWR", black_win_rate)  # Black value network
                        new_child.set("WWR", white_win_rate)  # White value network
                        variation_comment = (
                            _("Value network black/white win probability for this move: ") + black_win_rate + '/' + white_win_rate
                            + "\n" + _("Policy network value for this move: ") + str(one_policy_network) + '%'
                            + "\n" + _("Number of playouts used to estimate this variation: ") + str(one_nodes)
                        )
                        new_child.add_comment_text(variation_comment)

                    if best_move_pending:
                        # the first variation move added also annotates the game node
                        best_move_pending = False
                        comments += "\n" + _("Value network black/white win probability for this move: ") + black_win_rate + '/' + white_win_rate
                        game_node.set("BWR", black_win_rate)  # Black value network
                        game_node.set("WWR", white_win_rate)  # White value network

                    previous_move = new_child
                    current_color = 'b' if current_color in ('w', 'W') else 'w'
            log("==== no more sequences =====")

        game_node.add_comment_text(comments)
        return best_answer

    def initialize_bot(self, profil="slow"):
        """Start Leela Zero, keep it in ``self.leela_zero`` and return it.

        ``profil`` is accepted but not used: the bot is always started with
        the "slow" profile. ``self.time_per_move`` is reset to 0.
        """
        started_bot = leela_zero_starting_procedure(self.g, "slow")  # analysis is always "slow"
        self.leela_zero = started_bot
        self.time_per_move = 0
        return started_bot
def leela_zero_starting_procedure(sgf_g, profil="slow", silentfail=False):
    """Start a Leela Zero bot and apply the configured thinking time.

    Parameters:
        sgf_g: game object forwarded as-is to ``bot_starting_procedure``.
        profil: "slow" reads the "TimePerMove" entry of the "LeelaZero"
            config section, "fast" reads "ReviewTimePerMove".
        silentfail: forwarded as-is to ``bot_starting_procedure``.

    Returns the started bot, or False when ``bot_starting_procedure``
    returned a false value.
    """
    if profil == "slow":
        timepermove_entry = "TimePerMove"
    elif profil == "fast":
        timepermove_entry = "ReviewTimePerMove"

    Config = ConfigParser.ConfigParser()
    Config.read(config_file)

    leela_zero = bot_starting_procedure("LeelaZero", "Leela Zero", Leela_Zero_gtp, sgf_g, profil, silentfail)
    if not leela_zero:
        return False

    try:
        time_per_move = Config.get("LeelaZero", timepermove_entry)
        if time_per_move:
            time_per_move = int(time_per_move)
            if time_per_move > 0:
                log("Setting time per move")
                leela_zero.set_time(main_time=0, byo_yomi_time=time_per_move, byo_yomi_stones=1)
    except Exception:
        # Best effort: an unusable value is erased from the config file.
        # "except Exception" (rather than a bare except) lets
        # KeyboardInterrupt and SystemExit go through.
        log("Wrong value for Leela thinking time:", Config.get("LeelaZero", timepermove_entry))
        log("Erasing that value in the config file")
        Config.set("LeelaZero", timepermove_entry, "")
        # the with-block closes (and so flushes) the file once written
        with open(config_file, "w") as config_handle:
            Config.write(config_handle)

    return leela_zero
class RunAnalysis(LeelaZeroAnalysis, RunAnalysisBase):
    """Leela Zero analysis combined with ``RunAnalysisBase``."""

    def __init__(self, parent, filename, move_range, intervals, variation, komi):
        """Forward every argument unchanged to ``RunAnalysisBase.__init__``."""
        RunAnalysisBase.__init__(
            self, parent, filename, move_range, intervals, variation, komi
        )
class LiveAnalysis(LeelaZeroAnalysis, LiveAnalysisBase):
    """Leela Zero analysis combined with ``LiveAnalysisBase``."""

    def __init__(self, g, filename):
        """Forward both arguments unchanged to ``LiveAnalysisBase.__init__``."""
        LiveAnalysisBase.__init__(self, g, filename)
import ntpath
import subprocess
import threading, Queue
class Leela_Zero_gtp(gtp):
    """GTP client for a Leela Zero process that also parses its stderr output.

    The lines are taken from ``self.stderr_queue``; the queue is presumably
    filled by ``consume_stderr`` (not defined in this class), which is started
    in a thread by the constructor.
    """

    def __init__(self, command):
        """Launch the process described by the argument list ``command``.

        The process is started from the directory part of ``command[0]``.
        """
        self.c = 1
        # directory part of the executable path, trailing separator included
        leela_zero_working_directory = command[0][:-len(ntpath.basename(command[0]))]
        log("Leela Zero working directory:", leela_zero_working_directory)
        self.process = subprocess.Popen(
            command,
            # A bare executable name gives an empty directory part, which is
            # not a valid cwd: None keeps the current working directory.
            cwd=leela_zero_working_directory or None,
            stdin=subprocess.PIPE,
            stdout=subprocess.PIPE,
            stderr=subprocess.PIPE,
        )
        self.size = 0

        self.stderr_queue = Queue.Queue()

        threading.Thread(target=self.consume_stderr).start()

    def get_leela_zero_final_score(self):
        """Send "final_score" and return the answer without its first word.

        Raises GtpException when the answer cannot be processed.
        """
        self.write("final_score")
        answer = self.readline()
        try:
            return " ".join(answer.split(" ")[1:])
        except Exception:
            raise GtpException("GtpException in Get_leela_zero_final_score()")

    def get_leela_zero_influence(self):
        """Send "influence" and return ``self.size`` rows of integers.

        The rows are read from the stderr lines, last line first. Each
        character of a row is mapped to 0, 1 or 2 by the replacement chain
        below before the integer conversion.
        """
        self.write("influence")
        self.readline()  # empty line
        buff = []
        # wait for the first stderr line to show up
        while self.stderr_queue.empty():
            sleep(.1)
        # then keep draining until the queue stays empty for 0.1 second
        while not self.stderr_queue.empty():
            while not self.stderr_queue.empty():
                buff.append(self.stderr_queue.get())
            sleep(.1)
        buff.reverse()

        influence = []
        for i in range(self.size):
            one_line = buff[i].strip()
            one_line = one_line.replace(".", "0").replace("x", "1").replace("o", "2").replace("O", "0").replace("X", "0").replace("w", "1").replace("b", "2")
            influence.append([int(s) for s in one_line.split(" ")])

        return influence

    def get_all_leela_zero_moves(self):
        """Return the candidate moves found in the pending stderr lines.

        Only the lines containing " ->" are considered. Each one gives a list
        ``[move, sequence, value_network, policy_network, nodes]``; the lists
        are returned in the order the lines were queued. A line that cannot
        be parsed is logged and skipped.
        """
        buff = []

        sleep(.1)
        # keep draining until the queue stays empty for 0.1 second
        while not self.stderr_queue.empty():
            while not self.stderr_queue.empty():
                buff.append(self.stderr_queue.get())
            sleep(.1)

        answers = []
        for err_line in buff:
            if " ->" not in err_line:
                continue
            try:
                one_answer = err_line.strip().split(" ")[0]
                nodes = int(err_line.strip().split("(")[0].split("->")[1].replace(" ", ""))
                value_network = float(err_line.split("(V:")[1].split('%')[0].strip())
                policy_network = float(err_line.split("(N:")[1].split('%)')[0].strip())
                sequence = err_line.split("PV: ")[1].strip()
            except (IndexError, ValueError):
                # not a move statistics line after all: ignore it
                log("Skipping unexpected Leela Zero output line:", err_line)
                continue
            answers.append([one_answer, sequence, value_network, policy_network, nodes])

        return answers
from leela_analysis import LeelaSettings
class LeelaZeroSettings(LeelaSettings):
    """Settings frame for Leela Zero, derived from ``LeelaSettings``."""

    def __init__(self, parent):
        """Build the frame inside ``parent`` under the name "LeelaZero".

        ``Frame.__init__`` is called directly, so ``LeelaSettings.__init__``
        is not run; ``initialize`` is not defined here and is presumably
        inherited from ``LeelaSettings``.
        """
        Frame.__init__(self, parent)
        self.name = "LeelaZero"
        self.initialize()
class LeelaZeroOpenMove(BotOpenMove):
    """``BotOpenMove`` specialised for Leela Zero."""

    def __init__(self, sgf_g):
        """Initialise the base class, then set the bot name and its starter."""
        BotOpenMove.__init__(self, sgf_g)
        self.name = 'Leela Zero'
        self.my_starting_procedure = leela_zero_starting_procedure
# Description of the Leela Zero bot: its names plus the classes and the
# starting function defined in this module.
LeelaZero = {
    'name': "LeelaZero",
    'gtp_name': "Leela Zero",
    'analysis': LeelaZeroAnalysis,
    'openmove': LeelaZeroOpenMove,
    'settings': LeelaZeroSettings,
    'gtp': Leela_Zero_gtp,
    'liveanalysis': LiveAnalysis,
    'runanalysis': RunAnalysis,
    'starting': leela_zero_starting_procedure,
}
import getopt
if __name__ == "__main__":
    if len(argv) == 1:
        # No command line argument: get the SGF file name from open_sgf_file,
        # then show the range selector for it.
        temp_root = Tk()
        filename = open_sgf_file(parent=temp_root)
        temp_root.destroy()
        log(filename)
        # Leave before slicing the name when no file was selected
        if not filename:
            sys.exit()
        log("gamename:", filename[:-4])
        log("filename:", filename)
        top = Tk()
        RangeSelector(top, filename, bots=[LeelaZero]).pack()
        top.mainloop()
    else:
        try:
            parameters = getopt.getopt(argv[1:], '', ['no-gui', 'range=', 'color=', 'komi=', "variation="])
        except Exception as e:
            show_error(str(e) + "\n" + usage)
            sys.exit()

        # parameters[0] holds the parsed options, parameters[1] the SGF files
        if not parameters[1]:
            show_error("SGF file missing\n" + usage)
            sys.exit()

        top = None
        batch = []

        for filename in parameters[1]:
            move_selection, intervals, variation, komi, nogui = parse_command_line(filename, parameters[0])
            if nogui:
                # analysed right away, without any window
                log("File to analyse:", filename)
                app = RunAnalysis("no-gui", filename, move_selection, intervals, variation - 1, komi)
                app.terminate_bot()
            else:
                # queued: the whole batch is handed to batch_analysis below
                if not top:
                    top = Tk()
                    top.withdraw()
                one_analysis = [RunAnalysis, filename, move_selection, intervals, variation - 1, komi]
                batch.append(one_analysis)

        if not nogui:
            top.after(1, lambda: batch_analysis(top, batch))
            top.mainloop()