tanuki- 2017-10-14 depth 10 epoch 2
- 棋譜生成
- 評価関数
- 2017-10-26-17-06-28 評価関数
- 開始局面
- 2chkifuおよびfloodgateの棋譜から選択
- 1~32手目からランダムに局面を選択
- 選択した局面から0~6手、MultiPV5の中から等確率に指し手を選択
- MultiPVで選択した指し手も教師局面に含める
- 探索深さ 12
- 自己対戦は途中で打ち切らず詰みの局面まで学習データに含める
- 入玉宣言勝ちも学習データに含める
- 生成局面数 1.3億
- 機械学習
- 学習手法 Adam ミニバッチ法
- 学習率 0.5
- ミニバッチサイズ 100万
- 元の評価関数 2017-10-26-17-06-28
- 検証データは100万局面生成したものをそのまま使っている
- 学習データ 1.3億 + epoch 2の2.6億 + floodgateの棋譜のうち入玉宣言勝ちしているもの = 3.9億局面
- 学習局面数 4.0億局面
実験結果
elmo lambda = 0.2
04:13:57.244 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-04-10-48-05\400000000 04:13:57.244 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:13:57.244 T1,b2000,481 - 53 - 466(50.79% R5.50) win black: white = 51.32% : 48.68% declaration win engine1=0 engine2=0
07:03:01.629 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-04-10-48-05\400000000 07:03:01.629 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:03:01.629 T1,b2000,670 - 13 - 317(67.88% R130.01) win black: white = 51.67% : 48.33% declaration win engine1=0 engine2=0
elmo lambda = 0.3
04:15:02.881 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-04-03-42-31\400000000 04:15:02.881 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:15:02.881 T1,b2000,517 - 45 - 438(54.14% R28.81) win black: white = 52.57% : 47.43% declaration win engine1=0 engine2=0
07:05:31.526 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-04-03-42-31\400000000 07:05:31.526 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:05:31.526 T1,b2000,662 - 15 - 323(67.21% R124.66) win black: white = 53.60% : 46.40% declaration win engine1=0 engine2=0
elmo lambda = 0.4
04:10:22.615 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-20-43-03\400000000 04:10:22.615 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:10:22.615 T1,b2000,479 - 45 - 476(50.16% R1.09) win black: white = 50.37% : 49.63% declaration win engine1=0 engine2=0
06:59:28.367 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-20-43-03\400000000 06:59:28.367 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 06:59:28.367 T1,b2000,661 - 11 - 328(66.84% R121.73) win black: white = 50.86% : 49.14% declaration win engine1=0 engine2=0
elmo lambda = 0.5
04:22:12.704 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-02-16-26-41\400000000 04:22:12.704 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:22:12.704 T1,b2000,493 - 41 - 466(51.41% R9.78) win black: white = 53.18% : 46.82% declaration win engine1=0 engine2=0
07:11:47.587 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-02-16-26-41\400000000 07:11:47.587 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:11:47.587 T1,b2000,652 - 16 - 332(66.26% R117.24) win black: white = 52.95% : 47.05% declaration win engine1=0 engine2=0
elmo lambda = 0.6
04:10:33.107 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-02-23-30-16\400000000 04:10:33.107 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:10:33.107 T1,b2000,521 - 30 - 449(53.71% R25.84) win black: white = 51.44% : 48.56% declaration win engine1=0 engine2=0
07:01:07.446 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-02-23-30-16\400000000 07:01:07.446 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:01:07.446 T1,b2000,652 - 14 - 334(66.13% R116.20) win black: white = 53.55% : 46.45% declaration win engine1=0 engine2=0
elmo lambda = 0.7
04:10:47.409 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-06-31-22\400000000 04:10:47.409 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:10:47.409 T1,b2000,461 - 42 - 497(48.12% R-13.06) win black: white = 49.58% : 50.42% declaration win engine1=0 engine2=0
07:03:08.634 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-06-31-22\400000000 07:03:08.634 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:03:08.634 T1,b2000,659 - 13 - 328(66.77% R121.20) win black: white = 51.98% : 48.02% declaration win engine1=0 engine2=0
elmo lambda = 0.8
04:12:29.005 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-13-34-32\400000000 04:12:29.005 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:12:29.005 T1,b2000,477 - 53 - 470(50.37% R2.57) win black: white = 53.33% : 46.67% declaration win engine1=0 engine2=0
07:08:30.227 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-13-34-32\400000000 07:08:30.227 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:08:30.227 T1,b2000,645 - 14 - 341(65.42% R110.72) win black: white = 52.64% : 47.36% declaration win engine1=0 engine2=0