Commit 8cb5bfd0 by songxinkai

Enable to run on MLUs, and add some analysis tools.

parent e3cc7fb5
#!/usr/bin/python
# coding=utf-8
import os import os
from PK import pk from PK import pk
import time import time
import random import random
import re import re
import sys
commdir='share' #共享目录 commdir='share' #共享目录
def cd(path): def cd(path):
...@@ -12,11 +15,9 @@ def choose_game(): ...@@ -12,11 +15,9 @@ def choose_game():
dir=os.listdir(cd('comm')) dir=os.listdir(cd('comm'))
random.shuffle(dir) random.shuffle(dir)
for d in dir: for d in dir:
res=re.match(r'(\d+)_(\d+)\.init',d) if d.endswith('.init'):
if res: black, white = d.replace('.init', '').split('-')[0:2]
black=res.group(1) name=black+'-'+white
white=res.group(2)
name=black+'_'+white
try: try:
src=cd('comm/'+d) src=cd('comm/'+d)
dst=cd('comm/'+name+'.running') dst=cd('comm/'+name+'.running')
...@@ -28,21 +29,23 @@ def choose_game(): ...@@ -28,21 +29,23 @@ def choose_game():
return None return None
def main(): def main():
time.sleep(random.uniform(3,6)) mlu_id = int(sys.argv[1])
assert(mlu_id < 4 and mlu_id >= 0)
# time.sleep(random.uniform(3,6))
while not os.path.exists(cd('stop.txt')): while not os.path.exists(cd('stop.txt')):
if os.path.exists(cd('pause.txt')): if os.path.exists(cd('pause.txt')):
time.sleep(10) time.sleep(0.1)
continue continue
game=choose_game() game=choose_game()
if game: if game:
winrate=pk(game[0],game[1]) winrate=pk(game[0],game[1], 1, mlu_id)
name='comm/'+'_'.join([game[0],game[1],str(winrate)])+'.finish' name='comm/'+'-'.join([game[0],game[1],str(winrate)])+'.finish'
os.system('touch '+cd(name)) os.system('touch '+cd(name))
os.remove(cd('comm/'+game[0]+'_'+game[1]+'.running')) try:
os.remove(cd('comm/'+game[0]+'-'+game[1]+'.running'))
except:
continue
else: else:
time.sleep(1) time.sleep(0.1)
if __name__ == '__main__': if __name__ == '__main__':
main() main()
# coding=utf-8
from elorating import EloRatingSystem from elorating import EloRatingSystem
import numpy as np import numpy as np
import random import random
...@@ -8,13 +9,13 @@ import time ...@@ -8,13 +9,13 @@ import time
commdir='share' #共享目录 commdir='share' #共享目录
def cd(path): def cd(path):
return os.path.join(commdir,path) return os.path.join(commdir,path)
elo=EloRatingSystem(recordSaveFile='gameRecord.txt') #初始化 elo=EloRatingSystem(recordSaveFile='gameRecord.txt') #初始化
save_step = 1000
def askYes(str): def askYes(str):
ans='' ans=''
while True: while True:
ans=input(str) ans=raw_input(str)
ans=ans.lower() ans=ans.lower()
if ans=='y' or ans=='yes': if ans=='y' or ans=='yes':
return True return True
...@@ -52,7 +53,7 @@ def main(): ...@@ -52,7 +53,7 @@ def main():
commandList=[r'play (\d+)','summary','stop','save'] commandList=[r'play (\d+)','summary','stop','save']
print('commandList:\n '+'\n '.join(commandList)) print('commandList:\n '+'\n '.join(commandList))
ans=input('>>') ans=raw_input('>>')
while True: while True:
if ans=='stop': if ans=='stop':
os.system('touch '+cd('stop.txt')) os.system('touch '+cd('stop.txt'))
...@@ -60,18 +61,17 @@ def main(): ...@@ -60,18 +61,17 @@ def main():
elif ans=='summary': elif ans=='summary':
elo.summary() elo.summary()
elif ans=='save': elif ans=='save':
elo.save(saveFile='output.txt',sortByRank=False) elo.save(saveFile='output.txt',sortByRank=True)
else: else:
matchRes=re.match(r'play (\d+)',ans) matchRes=re.match(r'play (\d+)',ans)
if matchRes: if matchRes:
num=matchRes.group(1) num=matchRes.group(1)
play(int(num)) play(int(num))
print('commandList:\n '+'\n '.join(commandList)) print('commandList:\n '+'\n '.join(commandList))
ans=input('>>') ans=raw_input('>>')
def play(total_game): def play(total_game):
max_game=500 max_game=800
complete_game=0 complete_game=0
pause_flag='pause.txt' pause_flag='pause.txt'
if os.path.exists(cd(pause_flag)): if os.path.exists(cd(pause_flag)):
...@@ -95,58 +95,63 @@ def play(total_game): ...@@ -95,58 +95,63 @@ def play(total_game):
i=0 i=0
while i<num: while i<num:
black,white=choose() black,white=choose()
name=black+'_'+white name=black+'-'+white
if os.path.exists(cd('comm/'+name+'.init')) or os.path.exists(cd('comm/'+name+'.running')) or os.path.exists(cd('comm/'+name+'.complete')): if os.path.exists(cd('comm/'+name+'.init')) or os.path.exists(cd('comm/'+name+'.running')) or os.path.exists(cd('comm/'+name+'.complete')):
continue continue
os.system('touch '+cd('comm/'+name+'.init')) os.system('touch '+cd('comm/'+name+'.init'))
i+=1 i+=1
def read(): def read(dir):
#读取完成的比赛记录 #读取完成的比赛记录
count=0 count=0
dir=os.listdir(cd('comm'))
for d in dir: for d in dir:
res=re.match(r'(\d+)_(\d+)_(\d+)\.finish',d) # res=re.match(r'(\d+)-(\d+)-(\d+)\.finish',d)
if res: if d.endswith('.finish'):
black=res.group(1) black, white, winrate = d.replace(".finish", '').split('-')[0:3]
white=res.group(2) winrate = int(float(winrate))
winrate=int(res.group(3)) # black=res.group(1)
# white=res.group(2)
# winrate=int(res.group(3))
elo.playgame(black,white,winrate) elo.playgame(black,white,winrate)
os.remove(cd(os.path.join('comm',d))) os.remove(cd(os.path.join('comm',d)))
count+=1 count+=1
return count return count
def exist_game(): def exist_game(dir):
count=0 count=0
dir=os.listdir(cd('comm'))
for d in dir: for d in dir:
res=re.match(r'(\d+)_(\d+)\.running',d) if d.endswith('running') or d.endswith('init'):
if res: count += 1
count+=1
continue
res=re.match(r'(\d+)_(\d+)\.init',d)
if res:
count+=1
continue continue
# res=re.match(r'(\d+)-(\d+)\.running',d)
# if res:
# count+=1
# continue
# res=re.match(r'(\d+)-(\d+)\.init',d)
# if res:
# count+=1
# continue
return count return count
idx=0 idx=0
while complete_game<total_game: elo.save(saveFile='output.txt',sortByRank=True)
complete_game+=read() tstart = time.time()
num=exist_game() save_step_id = 0
create_game(min(max_game-num,total_game-complete_game-num+10)) while True:
if idx==5: dir=os.listdir(cd('comm'))
print('{}/{}'.format(complete_game,total_game)) complete_game += read(dir)
idx=0 num = exist_game(dir)
if complete_game < total_game:
create_game(min(max_game - num, total_game - complete_game - num + 10))
elif num == 0:
break
if (complete_game >= save_step_id * save_step):
print('{}/{} games completed, taking {}s'.format(complete_game,total_game, time.time() - tstart))
if (save_step_id > 0):
elo.save(saveFile='output.txt',sortByRank=True)
save_step_id = complete_game / save_step + 1
idx+=1 idx+=1
elo.save(saveFile='output.txt',sortByRank=True)
time.sleep(1)
os.system('touch '+cd('pause.txt')) #通知client先暂停行动 os.system('touch '+cd('pause.txt')) #通知client先暂停行动
if __name__ == '__main__': if __name__ == '__main__':
main() main()
# coding=utf-8
import random import random
import time import time
import os
import commands as cmd
pj_dir = "/share/sxk_mlu_alphago"
data_dir = "/share/data_sxk"
model_dir = "/share/elo-rating/models/"
def get_cmd(num_games, mlu, model1, model2, rollout, c_puct):
cmd_str = ""
cmd_str += "%s " % (os.path.join(pj_dir, "build", "pk"))
cmd_str += "--eval_game_num %d " %(num_games)
cmd_str += "--mlu_list_0 %d "%(mlu)
cmd_str += "--mlu_list_1 %d "%(mlu)
cmd_str += "--config_path_0 %s "%(os.path.join(pj_dir, "etc", "9_pk_offline.conf"))
cmd_str += "--config_path_1 %s "%(os.path.join(pj_dir, "etc", "9_pk_offline.conf"))
cmd_str += "--model_path_0 %s "%(model1)
cmd_str += "--model_path_1 %s "%(model2)
cmd_str += "--rollout_0 %d "%(rollout)
cmd_str += "--rollout_1 %d "%(rollout)
cmd_str += "--rollouts_0 %s "%("-1")
cmd_str += "--rollouts_1 %s "%("-1")
cmd_str += "--c_puct_0 %f "%(c_puct)
cmd_str += "--c_puct_1 %f "%(c_puct)
# TODO: check this
# cmd_str += "--result_path %s "%("-1")
return cmd_str
def pk(model1, model2, num_games = 1, mlu_id = 0):
rollout = 400
c_puct = 0.8
model1 = model_dir + model1
model2 = model_dir + model2
cmd_str = get_cmd(num_games, mlu_id, model1, model2, rollout, c_puct)
s, o = cmd.getstatusoutput(cmd_str)
win = 0
assert(s == 0)
win = 1 - float(o.strip().split(":")[-1])
print("%s vs %s, win_rate = %f" % (model1.split('/')[-1], model2.split('/')[-1], win))
return win
if __name__ == "__main__":
model1 = "R1600_M1600_600000"
model2 = "R400_M400_180000"
res = pk(model1, model2, 100, 3)
#测试用pk函数 #测试用pk函数
def pk(model1,model2,num_games=1): # def pk(model1,model2,num_games=1):
time.sleep(random.uniform(2,4)) # time.sleep(random.uniform(2,4))
winrate=1-0.5**(abs(int(model1)-int(model2))/1) #假设新模型以一定概率战胜旧模型 # winrate=1-0.5**(abs(int(model1)-int(model2))/1) #假设新模型以一定概率战胜旧模型
res=random.choices([1,0.5,0],weights=[winrate,0,1-winrate],k=1) # res=random.choices([1,0.5,0],weights=[winrate,0,1-winrate],k=1)
if int(model1)>int(model2): # if int(model1)>int(model2):
return res[0] # return res[0]
else: # else:
return 1-res[0] # return 1-res[0]
\ No newline at end of file
# coding=utf-8
import os import os
import time import time
for i in range(200): for i in range(200):
os.system('nohup python ELO_client.py &') os.system('nohup python ELO_client.py &')
time.sleep(0.1) time.sleep(0.1)
\ No newline at end of file
import matplotlib
matplotlib.use('Agg')
import matplotlib.pyplot as plt
model={}
with open('bak/output.txt_bak', 'r') as f:
lines = f.readlines()
for l in lines:
if l.startswith('R'):
l = l.strip()
model[l.split()[0]] = float(l.split()[1])
def getInfo(k):
ks = k.split('_')
r = int(ks[0].lstrip('R'))
m = int(ks[1].lstrip('M'))
i = int(ks[2])
return r, m, i
def cmpKey(k1, k2):
k1 = k1[0]
k2 = k2[0]
r1, m1, i1 = getInfo(k1)
r2, m2, i2 = getInfo(k2)
if (r1 != r2):
return r1 - r2
elif (m1 != m2):
return m1 - m2
else:
return i1 - i2
smodel = model.items()
smodel.sort(cmp = cmpKey)
print(smodel)
def getPlot(mp, r, m):
x = []
y = []
for k, v in mp:
kr, km, ki = getInfo(k)
if km == m and kr == r:
x.append(ki)
y.append(v)
return x, y
def getStr(r, m):
return "R%d_M%d" % (r, m)
routines = [[400, 400],[400, 1600],[1600,400],[1600, 1600]]
colors = ['red', 'blue', 'black', 'yellow', 'green', 'cyan', 'slateblue', 'peru', 'slategrey']
for i in range(len(routines)):
plt.plot(*getPlot(smodel, *routines[i]), color = colors[i], linestyle='--', label=getStr(*routines[i]))
# plt.plot(*getPlot(smodel, *routines[0]), color = colors[0], linestyle='--', label=getStr(*routines[0]))
# plt.plot(*getPlot(smodel, *routines[1]), color = colors[1], linestyle='--', label=getStr(*routines[1]))
# plt.plot(*getPlot(smodel, *routines[2]), color = colors[2], linestyle='--', label=getStr(*routines[2]))
# plt.plot(*getPlot(smodel, *routines[3]), color = colors[3], linestyle='--', label=getStr(*routines[3]))
plt.legend()
plt.show()
plt.savefig('figure.png')
# x_data = ['2011','2012','2013','2014','2015','2016','2017']
# y_data = [58000,60200,63000,71000,84000,90500,107000]
# y_data2 = [52000,54200,51500,58300,56800,59500,62700]
#
# plt.plot(x_data,y_data,color='red',linewidth=2.0,linestyle='--')
# plt.plot(x_data,y_data2,color='blue',linewidth=3.0,linestyle='-.')
# plt.show()
# table = Texttable()
# table.add_rows()
# print(table.draw())
# def getRoutine(k):
# k = k[0]
# return k.split('_')[0] + '_' + k.split('_')[1]
# rm = {}
# for k in smodel:
# krm = getRoutine(k)
# if krm not in rm:
# rm[krm] = list()
# rm[krm].append(k[1])
# print(rm)
# print(max_iter)
rm -rf share/*
mkdir share/comm
#!/usr/bin/env python3 #!/usr/bin/env python3
# coding=utf-8
# -*- coding: utf-8 -*- # -*- coding: utf-8 -*-
#---------------------------------------------- #----------------------------------------------
...@@ -20,6 +21,7 @@ ...@@ -20,6 +21,7 @@
import numpy as np import numpy as np
import random import random
import os import os
from PK import pk
def main(): def main():
models=[str(i) for i in range (0,50000,1000)] models=[str(i) for i in range (0,50000,1000)]
...@@ -39,24 +41,25 @@ def play(models,total_game=5000): ...@@ -39,24 +41,25 @@ def play(models,total_game=5000):
players=elo.getPlayers(sortByRank=True) #选择分数相近的作为比赛对手 players=elo.getPlayers(sortByRank=True) #选择分数相近的作为比赛对手
black=random.choice(players).name black=random.choice(players).name
matchList=elo.getNearPlayer(black) matchList=elo.getNearPlayer(black)
white = []
if matchList: if matchList:
white=random.choice(matchList) white=random.choice(matchList)
else: else:
continue #找不到对手,谁都打不过,或者谁都打不过 continue #找不到对手,谁都打不过,或者谁都打不过
num=1 #比赛局数 num=4 #比赛局数
winrate=pk(black,white,num) winrate=pk(black,white,num)
elo.playgame(black,white,winrate,numgames=num) #得到胜率后时用elo.playgame elo.playgame(black,white,winrate,numgames=num) #得到胜率后时用elo.playgame
elo.summary() elo.summary()
#测试用pk函数 #测试用pk函数
def pk(model1,model2,num_games): # def pk(model1,model2,num_games):
winrate=1-0.5**(abs(int(model1)-int(model2))/1000) #假设新模型以一定概率战胜旧模型 # winrate=1-0.5**(abs(int(model1)-int(model2))/1000) #假设新模型以一定概率战胜旧模型
res=random.choices([1,0.5,0],weights=[winrate,0,1-winrate],k=1) # res=random.choices([1,0.5,0],weights=[winrate,0,1-winrate],k=1)
if int(model1)>int(model2): # if int(model1)>int(model2):
return res[0] # return res[0]
else: # else:
return 1-res[0] # return 1-res[0]
#以上是测试代码 #以上是测试代码
...@@ -76,7 +79,7 @@ class EloRatingSystem: ...@@ -76,7 +79,7 @@ class EloRatingSystem:
WIN=1 WIN=1
LOSS=0 LOSS=0
DRAW=0.5 DRAW=0.5
def __init__(self,base_rating=1500,recordSaveFile='gameRecord.txt'): def __init__(self,base_rating=1500.0,recordSaveFile='gameRecord.txt'):
self.base_rating=base_rating self.base_rating=base_rating
self.players={} self.players={}
...@@ -100,7 +103,6 @@ class EloRatingSystem: ...@@ -100,7 +103,6 @@ class EloRatingSystem:
print('{} not in player list,please use <addmodel> to add it'.format(name)) print('{} not in player list,please use <addmodel> to add it'.format(name))
return False return False
return True return True
def playgame(self,p1,p2,winrate,numgames=1,online=True): def playgame(self,p1,p2,winrate,numgames=1,online=True):
''' '''
...@@ -165,7 +167,7 @@ class EloRatingSystem: ...@@ -165,7 +167,7 @@ class EloRatingSystem:
player2.rating=0 player2.rating=0
if online: if online:
#print('{}\'s rating:{}->{} ; {}\'s rating:{}->{}'.format(p1,R1,player1.rating,p2,R2,player2.rating)) # print('winrate: {}. {}\'s rating:{}->{} ; {}\'s rating:{}->{}'.format(winrate, p1,R1,player1.rating,p2,R2,player2.rating))
pass pass
def readRecords(self,filename): def readRecords(self,filename):
...@@ -190,17 +192,17 @@ class EloRatingSystem: ...@@ -190,17 +192,17 @@ class EloRatingSystem:
players.sort(key=sortKey,reverse=True) players.sort(key=sortKey,reverse=True)
print('{:<20s}{:<10s}{:<10s}{:<10s}{:<10s}'.format('model','rating','games','wins','losses')) print('{:<60s}{:<10s}{:<10s}{:<10s}{:<10s}'.format('model','rating','games','wins','losses'))
for p in players: for p in players:
print('{:<20s}{:<10.2f}{:<10d}{:<10d}{:<10d}'.format(str(p.name),p.rating,p.num_game,p.wins,p.losses)) print('{:<60s}{:<10.2f}{:<10d}{:<10d}{:<10d}'.format(str(p.name),p.rating,p.num_game,p.wins,p.losses))
def save(self,saveFile='elo_rating_output.txt',sortByRank=False): def save(self,saveFile='elo_rating_output.txt',sortByRank=False):
players=self.getPlayers(sortByRank) players=self.getPlayers(sortByRank)
with open(saveFile,'w') as f: with open(saveFile,'w') as f:
f.write('{:<20s}{:<10s}{:<10s}{:<10s}{:<10s}\n'.format('model','rating','games','wins','losses')) f.write('{:<60s}{:<10s}{:<10s}{:<10s}{:<10s}\n'.format('model','rating','games','wins','losses'))
for p in players: for p in players:
f.write('{:<20s}{:<10.2f}{:<10d}{:<10d}{:<10d}\n'.format(str(p.name),p.rating,p.num_game,p.wins,p.losses)) f.write('{:<60s}{:<10.2f}{:<10d}{:<10d}{:<10d}\n'.format(str(p.name),p.rating,p.num_game,p.wins,p.losses))
def getPlayers(self,sortByRank=False): def getPlayers(self,sortByRank=False):
......
import os
step_delta = 10000
models_file = "../models.txt"
routines = ["R1600_M1600", "R400_M1600", "R400_M400", "R1600_M400", "R1600_M100"]
# pwd = "/share/go9_data/routines/R1600_M1600/test1/caffemodel/received_9b/"
# prefix = "R1600_M1600_"
def getModels(pwd, prefix):
models = []
with open(pwd + "time_record", 'r') as f:
lines = f.readlines()
for l in lines:
l = l.strip().split(':')[0]
if "cambricon" in l:
step_iter = int(l.split('.')[0].split('_')[-1])
if step_iter % step_delta == 0:
m_name = prefix + str(step_iter)
os.system("ln -s %s %s" %(pwd + l, m_name))
models.append(m_name)
with open(models_file, 'a+') as f:
for m in models:
f.write(m + "\n")
def getPwd(routine):
pwd = "/share/go9_data/routines/" + routine + "/test1/caffemodel/received_9b/"
prefix = routine + "_"
return pwd, prefix
if __name__ == "__main__":
for routine in routines:
pwd, prefix = getPwd(routine)
getModels(pwd, prefix)
cd /share/elo-rating
./ELO_client.py 0 & ./ELO_client.py 1 & ./ELO_client.py 2 & ./ELO_client.py 3
cd /share/elo-rating
python ELO_server.py
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment