alreadydone · alreadydone · Aug 6, 2018 · Aug 9, 2018 · Aug 10, 2018 · Aug 14, 2018
diff --git a/.gitignore b/.gitignore
@@ -8,3 +8,6 @@ training/tf/venv
 leelaz-model*
 *.orig
 leelaz_opencl_tuning
+/build-autogtp-*
+/build-validation-*
+.vs/
diff --git a/.gitmodules b/.gitmodules
@@ -1,3 +1,6 @@
 [submodule "gtest"]
 	path = gtest
 	url = https://github.com/google/googletest.git
+[submodule "src/Eigen"]
+	path = src/Eigen
+	url = https://github.com/eigenteam/eigen-git-mirror
diff --git a/.travis.yml b/.travis.yml
@@ -14,12 +14,21 @@ jobs:
       script:
       - docker build -f Dockerfiles/Dockerfile.gpu -t leela-zero:gpu .
       - docker run leela-zero:gpu
+    - script:
+      - docker build -f Dockerfiles/Dockerfile.gpu-blas -t leela-zero:gpu-blas .
+      - docker run leela-zero:gpu-blas
     - script:
       - docker build -f Dockerfiles/Dockerfile.cpu -t leela-zero:cpu .
       - docker run leela-zero:cpu
+    - script:
+      - docker build -f Dockerfiles/Dockerfile.cpu-blas -t leela-zero:cpu-blas .
+      - docker run leela-zero:cpu-blas
     - script:
       - docker build -f Dockerfiles/Dockerfile.tests -t leela-zero:tests .
       - docker run leela-zero:tests
+    - script:
+      - docker build -f Dockerfiles/Dockerfile.tests-blas -t leela-zero:tests-blas .
+      - docker run leela-zero:tests-blas
     - stage: style
       before_install:
-      script: find . -regex ".*\.\(cpp\|h\|hpp\)" -not -regex ".*moc_.*.cpp" -not -path "./gtest/*" -not -path "./training/*" -not -path "./src/half/*" -not -path "./src/CL/*" | xargs python2 scripts/cpplint.py --filter=-build/c++11,-build/include,-build/include_order,-build/include_what_you_use,-build/namespaces,-readability/braces,-readability/casting,-readability/fn_size,-readability/namespace,-readability/todo,-runtime/explicit,-runtime/indentation_namespace,-runtime/int,-runtime/references,-whitespace/blank_line,-whitespace/braces,-whitespace/comma,-whitespace/comments,-whitespace/empty_loop_body,-whitespace/line_length,-whitespace/semicolon
+      script: find . -regex ".*\.\(cpp\|h\|hpp\)" -not -regex ".*moc_.*.cpp" -not -path "./gtest/*" -not -path "./training/*" -not -path "./src/half/*" -not -path "./src/CL/*" -not -path "./src/Eigen/*" | xargs python2 scripts/cpplint.py --filter=-build/c++11,-build/include,-build/include_order,-build/include_what_you_use,-build/namespaces,-readability/braces,-readability/casting,-readability/fn_size,-readability/namespace,-readability/todo,-runtime/explicit,-runtime/indentation_namespace,-runtime/int,-runtime/references,-whitespace/blank_line,-whitespace/braces,-whitespace/comma,-whitespace/comments,-whitespace/empty_loop_body,-whitespace/line_length,-whitespace/semicolon
diff --git a/AUTHORS b/AUTHORS
@@ -1,40 +1,54 @@
-Gian-Carlo Pascutto
+Gian-Carlo Pascutto
+Henrik Forstén
 Seth Troisi
 Marco Calignano
-Henrik Forstén
-Andy Olsen
-Junhee Yoo
 TFiFiE
+Junhee Yoo
+Andy Olsen
 Bood Qian
 Peter Wen
 ywrt
+Hersmunch
 Arseny Krasutsky
 earthengine
+Mankit Pong
 michael
-Hersmunch
 Barry G Becker
+Jonathan Roy
+Junyan Xu
 Maks Kolman
+kuba97531
 Antti Korhonen
-Mankit Pong
+Chin-Chang Yang
 Xingcan LAN
+bittsitt
 tux3
 5525345551
 Alderi-Tokori
+Ancalagon
 Ashley Griffiths
+Barry Becker
 Ed Lee
 Eddh
 F. Huizinga
 FFLaguna
 Jiannan Liu
 Joe Ren
-Jonathan Roy
+LL145
+Mark Andrew Gerads
 Nate
+OmnipotentEntity
+Przemek Wesołek
+Sebastian
 Shen-Ta Hsieh(BestSteve)
 Virgile Andreani
+Ximin Luo
 afalturki
 cheshirecats
 fohristiwhirl
 gaieepo
 tterava
+wonderingabout
+zediir
 Пахотин Иван
 Google LLC
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -1,6 +1,6 @@
 # This file is part of Leela Zero.
 # Copyright (C) 2017 Marco Calignano
-# Copyright (C) 2017-2018 Gian-Carlo Pascutto and contributors
+# Copyright (C) 2017-2019 Gian-Carlo Pascutto and contributors
 # Leela Zero is free software: you can redistribute it and/or modify
 # it under the terms of the GNU General Public License as published by
 # the Free Software Foundation, either version 3 of the License, or
@@ -15,14 +15,15 @@
 cmake_minimum_required(VERSION 3.1)
 
 set(CMAKE_MODULE_PATH ${CMAKE_MODULE_PATH} "${CMAKE_SOURCE_DIR}/cmake/Modules/")
 
 project(leelaz)
+include(GNUInstallDirs) # must follow project(): the module needs an enabled language to compute the install dirs
 add_subdirectory(gtest EXCLUDE_FROM_ALL) # We don't want to install gtest, exclude it from `all`
 
 # Required Packages
 set(Boost_MIN_VERSION "1.58.0")
 set(Boost_USE_MULTITHREADED ON)
-find_package(Boost 1.58.0 REQUIRED program_options)
+find_package(Boost 1.58.0 REQUIRED program_options filesystem)
 find_package(Threads REQUIRED)
 find_package(ZLIB REQUIRED)
 find_package(OpenCL REQUIRED)
@@ -32,14 +33,20 @@ find_package(OpenCL REQUIRED)
 if(NOT APPLE)
   set(BLA_VENDOR OpenBLAS)
 endif()
-find_package(BLAS REQUIRED)
-find_path(BLAS_INCLUDE_DIRS openblas_config.h
-  /usr/include
-  /usr/local/include
-  /usr/include/openblas
-  /opt/OpenBLAS/include
-  /usr/include/x86_64-linux-gnu
-  $ENV{BLAS_HOME}/include)
+if(USE_BLAS) # opt-in: use a system BLAS; otherwise the built-in matrix library is used
+  message(STATUS "Looking for system BLAS/OpenBLAS library.")
+  find_package(BLAS REQUIRED)
+  find_path(BLAS_INCLUDE_DIRS openblas_config.h
+    /usr/include
+    /usr/local/include
+    /usr/include/openblas
+    /opt/OpenBLAS/include
+    /usr/include/x86_64-linux-gnu
+    $ENV{BLAS_HOME}/include)
+  add_definitions(-DUSE_BLAS) # lets the sources see which backend was selected
+else()
+  message(STATUS "Using built-in matrix library.")
+endif()
 find_package(Qt5Core)
 
 set(CMAKE_CXX_STANDARD 14)
@@ -79,7 +86,7 @@ if(USE_HALF)
   add_definitions(-DUSE_HALF)
 endif()
 
-set(IncludePath "${CMAKE_CURRENT_SOURCE_DIR}/src")
+set(IncludePath "${CMAKE_CURRENT_SOURCE_DIR}/src" "${CMAKE_CURRENT_SOURCE_DIR}/src/Eigen")
 set(SrcPath "${CMAKE_CURRENT_SOURCE_DIR}/src")
 
 include_directories(${IncludePath})
@@ -108,7 +115,7 @@ target_link_libraries(leelaz ${BLAS_LIBRARIES})
 target_link_libraries(leelaz ${OpenCL_LIBRARIES})
 target_link_libraries(leelaz ${ZLIB_LIBRARIES})
 target_link_libraries(leelaz ${CMAKE_THREAD_LIBS_INIT})
-install(TARGETS leelaz DESTINATION bin)
+install(TARGETS leelaz DESTINATION ${CMAKE_INSTALL_BINDIR})
 
 if(Qt5Core_FOUND)
     if(NOT Qt5Core_VERSION VERSION_LESS "5.3.0")

diff --git a/COLAB.md b/COLAB.md
diff --git a/Dockerfiles/Dockerfile.cpu-blas b/Dockerfiles/Dockerfile.cpu-blas
@@ -0,0 +1,6 @@
+FROM leela-zero:base
+
+# CPU build
+RUN CXX=g++ CC=gcc cmake -DUSE_CPU_ONLY=1 -DUSE_BLAS=1 ..
+
+CMD cmake --build . --target leelaz --config Release -- -j2
diff --git a/Dockerfiles/Dockerfile.gpu-blas b/Dockerfiles/Dockerfile.gpu-blas
@@ -0,0 +1,6 @@
+FROM leela-zero:base
+
+# GPU build
+RUN CXX=g++ CC=gcc cmake -DUSE_BLAS=1 ..
+
+CMD cmake --build . --target leelaz --config Release -- -j2
diff --git a/Dockerfiles/Dockerfile.tests-blas b/Dockerfiles/Dockerfile.tests-blas
@@ -0,0 +1,8 @@
+FROM leela-zero:base
+
+# CPU build
+RUN CXX=g++ CC=gcc cmake -DUSE_CPU_ONLY=1 -DUSE_BLAS=1 ..
+RUN cmake --build . --target tests --config Release -- -j2
+
+CMD ./tests
+
diff --git a/FAQ.md b/FAQ.md
@@ -8,17 +8,6 @@
 
 AZ also had this behavior, besides we're testing our approach right now. Please be patient.
 
-## 为什么现在训练的是5/6 block网络，而AZ用的是20block ##
-## Why the network size is only 6 blocks comparing to 20 blocks of AZ ##
-
-在项目起步阶段，较小的网络可以在短时间内得到结果，也可以尽早发现/解决问题，
-
-目前的主要目的是为了测试系统的可行性，这对今后的完整重现十分重要（为将来的大网络打好基础）。
-
-This is effectively a testing run to see if the system works, and which things are important for doing a full run. I expected 10 to 100 people to run the client, not 600.
-
-Even so, the 20 block version is 13 times more computationally expensive, and expected to make SLOWER progress early on. I think it's unwise to do such a run unless it's proven that the setup works, because you are going to be in for a very long haul.
-
 ## 为什么比较两个网络强弱时经常下十几盘就不下了 ##
 ## Why only dozens of games are played when comparing two networks ##
 
@@ -33,27 +22,6 @@ We use SPRT to decide if a newly trained network is better. A better network is
 
 The MCTS playouts of self-play games is only 3200, and with noise added (For randomness of each move thus training has something to learn from). If you load Leela Zero with Sabaki, you'll probably find it is actually not that weak.
 
-## 自对弈为什么使用1000的模拟次数，而不是AZ的1600 ##
-## For self-play, why use 3200 visits instead of 1600 playouts as AZ ##
-
-没人知道AZ的1600是怎么得到的。这里的3200是基于下面几点估计得到的：
-
-1. 对于某一个选点，MCTS需要模拟几次才能得出概率结果。在开始阶段，每个选点的概率不会差太多，所以开始的360次模拟大概会覆盖整个棋盘。所以如果要让某些选点可以做几次模拟的话，大概需要2到3 x 360次的模拟。
-
-2. 在computer-go上有人跑过7x7的实验，看到模拟次数从1000到2000的时候性能有提高。所以如果我们观察到瓶颈的时候，可能是可以考虑增加模拟次数。
-
-3. 模拟次数太多会影响得到数据的速度。
-
-Nobody knows. The Zero paper doesn't mention how they arrive at this number, and I know of no sound background to estimate the optimal. I chose it based on some observations:
-
-a) For the MCTS to feed back search probabilities to the learning, it must be able to achieve a reasonable amount of look-ahead on at least a few variations. In the beginning, when the network is untrained, the move probabilities are not very extreme, and this means that the first 360~ simulations will be spent expanding every answer at the root. So if we want to expand at least a few moves, we probably need 2 to 3 x 360 playouts.
-
-b) One person on computer-go, who ran a similar experiment on 7x7, reported that near the end of the learning, he observed increased performance from increasing the number from 1000 to 2000. So maybe this is worthwhile to try when the learning speed starts to decrease or flatten out. But it almost certainly isn't needed early on.
-
-c) Obviously, the speed of acquiring data is linearly related to this setting.
-
-So, the current number is a best guess based on these observations. To be sure what the best value is, one would have to rerun this experiment several times.
-
 ## 有些自对弈对局非常短 ##
 ## Very short self-play games ends with White win?! ##