nodchipのコンピューター将棋ブログ

コンピューター将棋ソフト「tanuki-」シリーズの実験結果を掲載しています。

tanuki- 2017-11-02 depth 12 epoch 3

tanuki- 2017-10-14 depth 10 epoch 2

  • 棋譜生成
    • 評価関数
      • 2017-10-26-17-06-28 評価関数
    • 開始局面
      • 2chkifuおよびfloodgateの棋譜から選択
      • 1~32手目からランダムに局面を選択
      • 選択した局面から0~6手、MultiPV5の中から等確率に指し手を選択
      • MultiPVで選択した指し手も教師局面に含める
    • 探索深さ 12
    • 自己対戦は途中で打ち切らず詰みの局面まで学習データに含める
    • 入玉宣言勝ちも学習データに含める
    • 生成局面数 1.3億
  • 機械学習
    • 学習手法 Adam ミニバッチ法
    • 学習率 0.5
    • ミニバッチサイズ 100万
    • 元の評価関数 2017-10-26-17-06-28
    • 検証データは100万局面生成したものをそのまま使っている
    • 学習データ 1.3億 + epoch 2の2.6億 + floodgateの棋譜のうち入玉宣言勝ちしているもの = 3.9億局面
    • 学習局面数 4.0億局面

    実験結果

    elmo lambda = 0.2

    04:13:57.244 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-04-10-48-05\400000000 04:13:57.244 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:13:57.244 T1,b2000,481 - 53 - 466(50.79% R5.50) win black: white = 51.32% : 48.68% declaration win engine1=0 engine2=0

    07:03:01.629 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-04-10-48-05\400000000 07:03:01.629 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:03:01.629 T1,b2000,670 - 13 - 317(67.88% R130.01) win black: white = 51.67% : 48.33% declaration win engine1=0 engine2=0

    elmo lambda = 0.3

    04:15:02.881 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-04-03-42-31\400000000 04:15:02.881 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:15:02.881 T1,b2000,517 - 45 - 438(54.14% R28.81) win black: white = 52.57% : 47.43% declaration win engine1=0 engine2=0

    07:05:31.526 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-04-03-42-31\400000000 07:05:31.526 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:05:31.526 T1,b2000,662 - 15 - 323(67.21% R124.66) win black: white = 53.60% : 46.40% declaration win engine1=0 engine2=0

    elmo lambda = 0.4

    04:10:22.615 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-20-43-03\400000000 04:10:22.615 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:10:22.615 T1,b2000,479 - 45 - 476(50.16% R1.09) win black: white = 50.37% : 49.63% declaration win engine1=0 engine2=0

    06:59:28.367 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-20-43-03\400000000 06:59:28.367 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 06:59:28.367 T1,b2000,661 - 11 - 328(66.84% R121.73) win black: white = 50.86% : 49.14% declaration win engine1=0 engine2=0

    elmo lambda = 0.5

    04:22:12.704 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-02-16-26-41\400000000 04:22:12.704 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:22:12.704 T1,b2000,493 - 41 - 466(51.41% R9.78) win black: white = 53.18% : 46.82% declaration win engine1=0 engine2=0

    07:11:47.587 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-02-16-26-41\400000000 07:11:47.587 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:11:47.587 T1,b2000,652 - 16 - 332(66.26% R117.24) win black: white = 52.95% : 47.05% declaration win engine1=0 engine2=0

    elmo lambda = 0.6

    04:10:33.107 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-02-23-30-16\400000000 04:10:33.107 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:10:33.107 T1,b2000,521 - 30 - 449(53.71% R25.84) win black: white = 51.44% : 48.56% declaration win engine1=0 engine2=0

    07:01:07.446 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-02-23-30-16\400000000 07:01:07.446 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:01:07.446 T1,b2000,652 - 14 - 334(66.13% R116.20) win black: white = 53.55% : 46.45% declaration win engine1=0 engine2=0

    elmo lambda = 0.7

    04:10:47.409 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-06-31-22\400000000 04:10:47.409 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:10:47.409 T1,b2000,461 - 42 - 497(48.12% R-13.06) win black: white = 49.58% : 50.42% declaration win engine1=0 engine2=0

    07:03:08.634 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-06-31-22\400000000 07:03:08.634 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:03:08.634 T1,b2000,659 - 13 - 328(66.77% R121.20) win black: white = 51.98% : 48.02% declaration win engine1=0 engine2=0

    elmo lambda = 0.8

    04:12:29.005 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-13-34-32\400000000 04:12:29.005 engine2=YaneuraOu-2017-early.exe eval2=eval\2017-10-26-17-06-28\260000000 04:12:29.005 T1,b2000,477 - 53 - 470(50.37% R2.57) win black: white = 53.33% : 46.67% declaration win engine1=0 engine2=0

    07:08:30.227 engine1=YaneuraOu-2017-early.exe eval1=eval\2017-11-03-13-34-32\400000000 07:08:30.227 engine2=YaneuraOu-2017-early.exe eval2=eval\elmo_wcsc27 07:08:30.227 T1,b2000,645 - 14 - 341(65.42% R110.72) win black: white = 52.64% : 47.36% declaration win engine1=0 engine2=0