aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--.gitignore12
-rw-r--r--README.md19
-rw-r--r--doc/Makefile17
-rw-r--r--doc/diagrams/ASTNode.pumlc12
-rw-r--r--doc/diagrams/ConvNeuralNetwork.pumlc7
-rw-r--r--doc/diagrams/DecisionAlgorithm.pumlc9
-rw-r--r--doc/diagrams/DenseNeuralNetwork.pumlc7
-rw-r--r--doc/diagrams/GameBoard.pumlc29
-rw-r--r--doc/diagrams/GameEngine.pumlc18
-rw-r--r--doc/diagrams/GameMove.pumlc25
-rw-r--r--doc/diagrams/GameState.pumlc18
-rw-r--r--doc/diagrams/GameTree.pumlc4
-rw-r--r--doc/diagrams/ImagoIO.pumlc10
-rw-r--r--doc/diagrams/Keras.pumlc12
-rw-r--r--doc/diagrams/MCTS.pumlc11
-rw-r--r--doc/diagrams/MCTSNode.pumlc18
-rw-r--r--doc/diagrams/NeuralNetwork.pumlc13
-rw-r--r--doc/diagrams/Property.pumlc10
-rw-r--r--doc/diagrams/SGF.pumlc5
-rw-r--r--doc/diagrams/analysisClasses.puml56
-rw-r--r--doc/diagrams/engineModule.puml32
-rw-r--r--doc/diagrams/fullClasses.puml16
-rw-r--r--doc/diagrams/gameModule.puml18
-rw-r--r--doc/diagrams/gameRepresentation.puml14
-rw-r--r--doc/diagrams/gtpEngine.puml29
-rw-r--r--doc/diagrams/interfaces.puml20
-rw-r--r--doc/diagrams/keras.puml13
-rw-r--r--doc/diagrams/modules.puml2
-rw-r--r--doc/diagrams/planificationWorkPlanEngine.puml46
-rw-r--r--doc/diagrams/planificationWorkPlanGame.puml30
-rw-r--r--doc/diagrams/skinparams.puml12
-rw-r--r--doc/diagrams/skinparamsGantt.puml14
-rw-r--r--doc/diagrams/trainingModule.puml20
-rw-r--r--doc/diagrams/useCase_generateAMove.puml24
-rw-r--r--doc/diagrams/useCase_playAMatch.puml20
-rw-r--r--doc/diagrams/useCase_useAsBackend.puml32
-rw-r--r--doc/diagrams/useCases.puml18
-rw-r--r--doc/listings/convModel.txt23
-rw-r--r--doc/listings/convTraining.txt40
-rw-r--r--doc/listings/denseModel.txt17
-rw-r--r--doc/listings/denseTraining.txt40
-rw-r--r--doc/listings/trainCommand.sh1
-rw-r--r--doc/tex/biber.bib156
-rw-r--r--doc/tex/conclusions.tex128
-rw-r--r--doc/tex/imago.tex178
-rw-r--r--doc/tex/implementation.tex181
-rw-r--r--doc/tex/interface.tex6
-rw-r--r--doc/tex/introduction.tex8
-rw-r--r--doc/tex/planification.tex197
-rw-r--r--doc/tex/previousWorks.tex21
-rw-r--r--doc/tex/results.tex416
-rw-r--r--doc/tex/systemAnalysis.tex892
-rw-r--r--doc/tex/systemDesign.tex324
-rw-r--r--doc/tex/tfg.tex60
-rwxr-xr-xgo.py14
-rw-r--r--imago/data/enums.py6
-rw-r--r--imago/engine/core.py39
-rw-r--r--imago/engine/createDecisionAlgorithm.py21
-rw-r--r--imago/engine/decisionAlgorithm.py18
-rw-r--r--imago/engine/imagoIO.py105
-rw-r--r--imago/engine/keras/__init__.py0
-rw-r--r--imago/engine/keras/convNeuralNetwork.py54
-rw-r--r--imago/engine/keras/denseNeuralNetwork.py40
-rw-r--r--imago/engine/keras/initialDenseNeuralNetwork.py28
-rw-r--r--imago/engine/keras/keras.py49
-rw-r--r--imago/engine/keras/neuralNetwork.py217
-rw-r--r--imago/engine/monteCarlo.py187
-rw-r--r--imago/engine/parseHelpers.py44
-rw-r--r--imago/gameLogic/gameBoard.py292
-rw-r--r--imago/gameLogic/gameMove.py142
-rw-r--r--imago/gameLogic/gameState.py90
-rw-r--r--imago/gameLogic/gameTree.py8
-rw-r--r--imago/scripts/__init__.py0
-rw-r--r--imago/scripts/monteCarloSimulation.py25
-rwxr-xr-ximago/scripts/monteCarloSimulation.sh24
-rw-r--r--imago/sgfParser/astNode.py85
-rw-r--r--imago/sgfParser/sgf.py20
-rwxr-xr-ximago/sgfParser/sgflex.py22
-rwxr-xr-ximago/sgfParser/sgfyacc.py40
-rwxr-xr-ximagocli.py22
-rw-r--r--models/testModel.h5bin0 -> 43120 bytes
-rw-r--r--results.txt41
-rwxr-xr-xsimulationMatchesPyplot.py27
-rwxr-xr-xtestSGF.py20
-rw-r--r--tests/test_enums.py15
-rw-r--r--tests/test_gameBoard.py118
-rw-r--r--tests/test_gameMove.py78
-rw-r--r--tests/test_monteCarlo.py30
-rw-r--r--tests/test_parseHelpers.py68
-rwxr-xr-xtrain.py27
90 files changed, 4807 insertions, 569 deletions
diff --git a/.gitignore b/.gitignore
index 750838b..0a4eeda 100644
--- a/.gitignore
+++ b/.gitignore
@@ -1,9 +1,15 @@
*.sgf
+# images
+*.png
+*.jpg
+*.xcf
+
# doc
*.pdf
doc/out/
doc/diagrams/*.png
+_minted-imago/
# src
__pycache__/
@@ -12,3 +18,9 @@ __pycache__/
# ply
parser.out
parsetab.py
+
+# logs
+*.log
+
+# NN models
+models/
diff --git a/README.md b/README.md
index ccd8f6c..3e6a01d 100644
--- a/README.md
+++ b/README.md
@@ -1,6 +1,6 @@
# Imago
-A Go AI.
+An AI player of the game of Go.
## The project
@@ -10,22 +10,19 @@ Software Engineering of the University of Oviedo.
## Implementation
Imago is written in Python and the source code is inside the `imago` folder. The
-implementation is on an early stage and includes core game logic, a basic GTP
-engine and a placeholder AI function which plays on random empty vertices.
+implementation includes core game logic and a GTP engine able to play using
+either Monte Carlo Tree Search or a neural network trained on human matches.
A game of go with no AI can be played by running the `go.py` script. This is
useful to test the core game logic. The GTP engine can be started by the
`imagocli.py` script. Following the GTP specification, known commands can be
listed by entering `list_commands` on the GTP engine's interface.
-Tests are stored in the `tests` folder which as of now contains an example
-tests file. The tests can be run with the `test.sh` script which uses the
-Python package `coverage` to get coverage statistics.
+Tests are stored in the `tests` folder. The tests can be run with the `test.sh`
+script which uses the Python package `coverage` to get coverage statistics.
## Documentation
-The source code for a work in progress documentation is laid out inside the
-`doc` folder, including a Makefile to compile it. This documentation compiling
-process depends on `xelatex`, `biber`, `plantuml` and some `LaTeX` packages.
-This documentation is fully subject to change in any moment of development and
-it probably already contradicts the actual implementation.
+The source code for the documentation is laid out inside the `doc` folder,
+including a Makefile to compile it. The documentation compiling process depends
+on `xelatex`, `biber`, `plantuml` and some `LaTeX` packages.
diff --git a/doc/Makefile b/doc/Makefile
index 954ae3c..284000e 100644
--- a/doc/Makefile
+++ b/doc/Makefile
@@ -1,18 +1,23 @@
.SUFFIXES: .puml .png
-docName = tfg
+docName = imago
outputFolder = out
-texFiles = tex/tfg.tex tex/introduction.tex tex/previousWorks.tex tex/interface.tex tex/implementation.tex
-diagramImgs = diagrams/gameRepresentation.png diagrams/modules.png diagrams/sgfModule.png diagrams/gtpEngine.png
+texFiles = tex/$(docName).tex tex/introduction.tex tex/planification.tex tex/systemAnalysis.tex tex/systemDesign.tex tex/implementation.tex tex/results.tex tex/conclusions.tex tex/biber.bib
+
+diagramImgs = diagrams/planificationWorkPlanEngine.png diagrams/planificationWorkPlanGame.png diagrams/useCases.png diagrams/analysisClasses.png diagrams/useCase_generateAMove.png diagrams/useCase_useAsBackend.png diagrams/useCase_playAMatch.png diagrams/interfaces.png diagrams/gameModule.png diagrams/engineModule.png diagrams/trainingModule.png diagrams/modules.png diagrams/fullClasses.png
+
+imgs = img/imago.jpg img/models/denseModel.png img/models/convModel.png
+
+listings = listings/denseModel.txt listings/convModel.txt listings/denseTraining.txt listings/convTraining.txt listings/trainCommand.sh
all: $(docName).pdf
-$(docName).pdf: $(texFiles) $(diagramImgs)
+$(docName).pdf: $(texFiles) $(diagramImgs) $(imgs) $(listings) Makefile
[ -d $(outputFolder) ] || mkdir $(outputFolder)
- xelatex -output-directory $(outputFolder) tex/$(docName).tex
+ xelatex -shell-escape -output-directory $(outputFolder) tex/$(docName).tex
biber $(outputFolder)/$(docName)
- xelatex -output-directory $(outputFolder) tex/$(docName).tex
+ xelatex -shell-escape -output-directory $(outputFolder) tex/$(docName).tex
mv $(outputFolder)/$(docName).pdf .
.puml.png:
diff --git a/doc/diagrams/ASTNode.pumlc b/doc/diagrams/ASTNode.pumlc
index 05c13ac..945b24d 100644
--- a/doc/diagrams/ASTNode.pumlc
+++ b/doc/diagrams/ASTNode.pumlc
@@ -1,10 +1,14 @@
@startuml
class ASTNode {
- ASTNode[] children
- Property properties
- void addtoSequence()
- GameTree toGameTree()
+ ASTNode[] children
+ Property[] props
+
+ addtoSequence()
+ toGameTree()
+ toGameMoveTree(previousMove)
+ hasProperty(propertyName)
+ getPropertyValue(propertyName)
}
@enduml
diff --git a/doc/diagrams/ConvNeuralNetwork.pumlc b/doc/diagrams/ConvNeuralNetwork.pumlc
new file mode 100644
index 0000000..2254e5d
--- /dev/null
+++ b/doc/diagrams/ConvNeuralNetwork.pumlc
@@ -0,0 +1,7 @@
+@startuml
+
+class ConvNeuralNetwork {
+
+}
+
+@enduml
diff --git a/doc/diagrams/DecisionAlgorithm.pumlc b/doc/diagrams/DecisionAlgorithm.pumlc
new file mode 100644
index 0000000..c3e9e8a
--- /dev/null
+++ b/doc/diagrams/DecisionAlgorithm.pumlc
@@ -0,0 +1,9 @@
+@startuml
+
+interface DecisionAlgorithm {
+ {abstract} forceNextMove(coords)
+ {abstract} pickMove()
+ {abstract} clearBoard()
+}
+
+@enduml
diff --git a/doc/diagrams/DenseNeuralNetwork.pumlc b/doc/diagrams/DenseNeuralNetwork.pumlc
new file mode 100644
index 0000000..a9e7d1c
--- /dev/null
+++ b/doc/diagrams/DenseNeuralNetwork.pumlc
@@ -0,0 +1,7 @@
+@startuml
+
+class DenseNeuralNetwork {
+
+}
+
+@enduml
diff --git a/doc/diagrams/GameBoard.pumlc b/doc/diagrams/GameBoard.pumlc
new file mode 100644
index 0000000..ebeedd7
--- /dev/null
+++ b/doc/diagrams/GameBoard.pumlc
@@ -0,0 +1,29 @@
+@startuml
+
+class GameBoard {
+ int[][] board
+ int capturesBlack
+ int capturesWhite
+
+ getBoard()
+ getBoardHeight()
+ getBoardWidth()
+ getDeepCopy()
+ getGroupLiberties(row, col)
+ getGroupLibertiesCount(row, col)
+ getGroupVertices(row, col)
+ getGroupVerticesCount(row, col)
+ moveAndCapture(row, col, player)
+ isMoveInBoardBounds(row, col)
+ isCellEmpty(row, col)
+ isCellEye(row, col)
+ isMoveSuicidal(row, col, player)
+ isMoveKoIllegal(row, col, player, prevBoards)
+ isPlayable(row, col, player, prevBoards)
+ isSensible(row, col, player, prevBoards)
+ score()
+ equals(otherBoard)
+ printBoard()
+}
+
+@enduml
diff --git a/doc/diagrams/GameEngine.pumlc b/doc/diagrams/GameEngine.pumlc
new file mode 100644
index 0000000..62b892e
--- /dev/null
+++ b/doc/diagrams/GameEngine.pumlc
@@ -0,0 +1,18 @@
+@startuml
+
+class GameEngine {
+ int komi
+ GameState gameState
+ Enum daId
+ DecisionAlgorithm da
+
+ setBoardsize(newSize)
+ clearBoard()
+ setKomi(komi)
+ setFixedHandicap(stones)
+ play(color, vertex)
+ genmove(color)
+ undo()
+}
+
+@enduml
diff --git a/doc/diagrams/GameMove.pumlc b/doc/diagrams/GameMove.pumlc
index 7dcb5e3..a1d0d73 100644
--- a/doc/diagrams/GameMove.pumlc
+++ b/doc/diagrams/GameMove.pumlc
@@ -1,13 +1,28 @@
@startuml
class GameMove {
- int player
- int row
- int col
- int[2] makesKo
- int[] board
+ GameBoard board
GameMove[] nextMoves
GameMove previousMove
+ boolean isPass
+ int[] coords
+ Player playerWhoPassed
+
+ getRow()
+ getCol()
+ getPlayer()
+ getNextPlayer()
+ getGameLength()
+ getThisAndPrevBoards()
+ getPlayableVertices()
+ getSensibleVertices()
+ addMove(row, col)
+ addMoveBcoords(coords)
+ addMoveForPlayer(row, col, player)
+ addPass()
+ addPassForPlayer()
+ getMainLineOfPlay()
+ printBoard()
}
@enduml
diff --git a/doc/diagrams/GameState.pumlc b/doc/diagrams/GameState.pumlc
index db39d8f..a913855 100644
--- a/doc/diagrams/GameState.pumlc
+++ b/doc/diagrams/GameState.pumlc
@@ -1,14 +1,18 @@
@startuml
class GameState {
- int player
- int capturesBlack
- int capturesWhite
- List board
- List prevBoards # for ko
- GameTree gameTree
+ int size
GameMove lastMove
- GameData gameData
+
+ getCurrentPlayer()
+ getPlayerCode()
+ getBoard()
+ clearBoard()
+ playMove(row, col)
+ playMoveForPlayer(row, col, player)
+ playPass()
+ playPassForPlayer(player)
+ undo()
}
@enduml
diff --git a/doc/diagrams/GameTree.pumlc b/doc/diagrams/GameTree.pumlc
index 85859d8..10b9251 100644
--- a/doc/diagrams/GameTree.pumlc
+++ b/doc/diagrams/GameTree.pumlc
@@ -1,8 +1,8 @@
@startuml
class GameTree {
- GameNode[] firstMoves
- GameData gameData
+ GameMove[] firstMoves
+ 'GameData gameData
}
@enduml
diff --git a/doc/diagrams/ImagoIO.pumlc b/doc/diagrams/ImagoIO.pumlc
new file mode 100644
index 0000000..848a173
--- /dev/null
+++ b/doc/diagrams/ImagoIO.pumlc
@@ -0,0 +1,10 @@
+@startuml
+
+class ImagoIO {
+ function[] commands_set
+ GameEngine gameEngine
+
+ start()
+}
+
+@enduml
diff --git a/doc/diagrams/Keras.pumlc b/doc/diagrams/Keras.pumlc
new file mode 100644
index 0000000..1fa40b2
--- /dev/null
+++ b/doc/diagrams/Keras.pumlc
@@ -0,0 +1,12 @@
+@startuml
+
+class Keras {
+ GameMove currentMove
+ NeuralNetwork neuralNetwork
+
+ forceNextMove(self, coords)
+ pickMove(self)
+ loadNetwork(self)
+}
+
+@enduml
diff --git a/doc/diagrams/MCTS.pumlc b/doc/diagrams/MCTS.pumlc
new file mode 100644
index 0000000..ff00c62
--- /dev/null
+++ b/doc/diagrams/MCTS.pumlc
@@ -0,0 +1,11 @@
+@startuml
+
+class MCTS {
+ MCTSNode root
+
+ forceNextMove(coords)
+ pickMove()
+ clearBoard()
+}
+
+@enduml
diff --git a/doc/diagrams/MCTSNode.pumlc b/doc/diagrams/MCTSNode.pumlc
new file mode 100644
index 0000000..6ae8f35
--- /dev/null
+++ b/doc/diagrams/MCTSNode.pumlc
@@ -0,0 +1,18 @@
+@startuml
+
+class MCTSNode {
+ int visits
+ int score
+ GameMove move
+ MCTSNode parent
+ MCTSNode[] children
+ (int, int)[] unexploredVertices
+
+ ucbForPlayer()
+ selection()
+ expansion()
+ expansionForCoords(coords)
+ simulation(nMatches, scoreDiffHeur)
+}
+
+@enduml
diff --git a/doc/diagrams/NeuralNetwork.pumlc b/doc/diagrams/NeuralNetwork.pumlc
new file mode 100644
index 0000000..f6c0e1c
--- /dev/null
+++ b/doc/diagrams/NeuralNetwork.pumlc
@@ -0,0 +1,13 @@
+@startuml
+
+class NeuralNetwork {
+ int boardSize
+ string path
+
+ trainModel(games)
+ saveModel(modelPath)
+ pickMove(gameMove, player)
+ saveModelPlot(path)
+}
+
+@enduml
diff --git a/doc/diagrams/Property.pumlc b/doc/diagrams/Property.pumlc
new file mode 100644
index 0000000..bb06b47
--- /dev/null
+++ b/doc/diagrams/Property.pumlc
@@ -0,0 +1,10 @@
+@startuml
+
+class Property {
+ string name
+ object value
+
+ addValue(value)
+}
+
+@enduml
diff --git a/doc/diagrams/SGF.pumlc b/doc/diagrams/SGF.pumlc
index 2c30202..5ab248a 100644
--- a/doc/diagrams/SGF.pumlc
+++ b/doc/diagrams/SGF.pumlc
@@ -1,8 +1,7 @@
@startuml
-class SGF {
- GameTree loadGameTree(file)
- void saveGameTree(file)
+object SGF {
+ loadGameTree(file)
}
@enduml
diff --git a/doc/diagrams/analysisClasses.puml b/doc/diagrams/analysisClasses.puml
new file mode 100644
index 0000000..7685ea1
--- /dev/null
+++ b/doc/diagrams/analysisClasses.puml
@@ -0,0 +1,56 @@
+@startuml
+
+!include skinparams.puml
+
+() Player
+package "Game module" {
+ class GameIO
+ class GameState
+ class GameBoard
+ class GameMove
+
+ Player -> GameIO
+ GameIO ..> GameState
+ GameState ..> GameMove
+ GameMove ..> GameBoard
+}
+
+() "Engine user" as EU
+() "Model files" as MF
+package "Engine module" {
+ class EngineIO
+ class EngineLogic
+ interface DecisionAlgorithm
+ class MonteCarloTreeSearch
+ class MCTSNode
+ class Keras
+ class NeuralNetwork
+
+ EU -> EngineIO
+ EngineIO ..> EngineLogic
+ EngineLogic ..> DecisionAlgorithm
+ DecisionAlgorithm <|.. MonteCarloTreeSearch
+ DecisionAlgorithm <|.. Keras
+ MonteCarloTreeSearch ..> MCTSNode
+ Keras ..> NeuralNetwork
+ NeuralNetwork --> MF
+}
+
+() "SGF files" as SGF
+package "Training module" {
+ class Trainer
+ class Parser
+ class ASTNode
+
+ Parser -> SGF
+ Trainer ..> Parser
+ Parser ..> ASTNode
+}
+
+DecisionAlgorithm .> GameMove
+
+ASTNode .> GameMove
+
+Trainer .> NeuralNetwork
+
+@enduml
diff --git a/doc/diagrams/engineModule.puml b/doc/diagrams/engineModule.puml
new file mode 100644
index 0000000..c6f3a3e
--- /dev/null
+++ b/doc/diagrams/engineModule.puml
@@ -0,0 +1,32 @@
+@startuml
+
+!include skinparams.puml
+
+package "Engine module" {
+
+ !include ImagoIO.pumlc
+ !include GameEngine.pumlc
+ !include DecisionAlgorithm.pumlc
+ !include MCTS.pumlc
+ !include MCTSNode.pumlc
+ !include Keras.pumlc
+ !include NeuralNetwork.pumlc
+ !include DenseNeuralNetwork.pumlc
+ !include ConvNeuralNetwork.pumlc
+
+ ImagoIO ..> GameEngine
+ GameEngine ..> DecisionAlgorithm
+
+ DecisionAlgorithm <|.. MCTS
+ MCTSNode <. MCTS
+ MCTSNode -> MCTSNode
+ MCTSNode o--> MCTSNode
+
+ DecisionAlgorithm <|.. Keras
+ Keras ..> NeuralNetwork
+ NeuralNetwork <|-- DenseNeuralNetwork
+ NeuralNetwork <|-- ConvNeuralNetwork
+
+}
+
+@enduml
diff --git a/doc/diagrams/fullClasses.puml b/doc/diagrams/fullClasses.puml
new file mode 100644
index 0000000..d7fe4d8
--- /dev/null
+++ b/doc/diagrams/fullClasses.puml
@@ -0,0 +1,16 @@
+@startuml
+
+!include skinparams.puml
+
+!include gameModule.puml
+!include engineModule.puml
+!include trainingModule.puml
+
+GameEngine --> GameState
+
+MCTSNode --> GameMove
+Keras --> GameMove
+
+ASTNode --> GameMove
+
+@enduml
diff --git a/doc/diagrams/gameModule.puml b/doc/diagrams/gameModule.puml
new file mode 100644
index 0000000..9a60d3f
--- /dev/null
+++ b/doc/diagrams/gameModule.puml
@@ -0,0 +1,18 @@
+@startuml
+
+!include skinparams.puml
+
+package "Game module" {
+
+ !include GameState.pumlc
+ !include GameMove.pumlc
+ !include GameBoard.pumlc
+
+ GameState ..> GameMove
+ GameMove -> GameMove : Previous move
+ GameMove o--> GameMove : Next moves
+ GameMove ..> GameBoard
+
+}
+
+@enduml
diff --git a/doc/diagrams/gameRepresentation.puml b/doc/diagrams/gameRepresentation.puml
deleted file mode 100644
index 9a869f1..0000000
--- a/doc/diagrams/gameRepresentation.puml
+++ /dev/null
@@ -1,14 +0,0 @@
-@startuml
-
-!include skinparams.puml
-
-!include GameState.pumlc
-!include GameTree.pumlc
-!include GameMove.pumlc
-
-GameState --> GameTree
-GameState --> GameMove: Current move
-GameTree *--> GameMove
-GameMove -> GameMove
-
-@enduml
diff --git a/doc/diagrams/gtpEngine.puml b/doc/diagrams/gtpEngine.puml
deleted file mode 100644
index c4caf32..0000000
--- a/doc/diagrams/gtpEngine.puml
+++ /dev/null
@@ -1,29 +0,0 @@
-@startuml
-
-!include skinparams.puml
-
-class EngineCore {
-}
-
-class IO {
- processComand()
-}
-
-!include GameState.pumlc
-
-'class EngineBoard {
-' setSize()
-' setKomi()
-' play()
-' undo()
-'}
-
-class EngineAI {
- genmove(board)
-}
-
-EngineCore --> IO
-EngineCore --> GameState
-EngineCore --> EngineAI
-
-@enduml
diff --git a/doc/diagrams/interfaces.puml b/doc/diagrams/interfaces.puml
new file mode 100644
index 0000000..3ade81e
--- /dev/null
+++ b/doc/diagrams/interfaces.puml
@@ -0,0 +1,20 @@
+@startuml
+
+!include ./skinparams.puml
+
+component Game
+component Engine
+component Trainer
+
+interface "Game text interface" as GTI
+interface "Engine text interface" as ETI
+interface "Neural network model" as NNM
+interface "SGF files" as SGF
+
+Game -- GTI
+Engine -- ETI
+Engine -- NNM
+Trainer -- NNM
+Trainer -- SGF
+
+@enduml
diff --git a/doc/diagrams/keras.puml b/doc/diagrams/keras.puml
new file mode 100644
index 0000000..98776d1
--- /dev/null
+++ b/doc/diagrams/keras.puml
@@ -0,0 +1,13 @@
+@startuml
+
+!include skinparams.puml
+
+!include DecisionAlgorithm.pumlc
+!include Keras.pumlc
+!include NeuralNetwork.pumlc
+
+DecisionAlgorithm <|.. Keras
+
+Keras -> NeuralNetwork
+
+@enduml
diff --git a/doc/diagrams/modules.puml b/doc/diagrams/modules.puml
index 064be1d..5b8d78c 100644
--- a/doc/diagrams/modules.puml
+++ b/doc/diagrams/modules.puml
@@ -1,6 +1,6 @@
@startuml
-!include ./skinparams.puml
+!include skinparams.puml
!include GameState.pumlc
!include SGF.pumlc
diff --git a/doc/diagrams/planificationWorkPlanEngine.puml b/doc/diagrams/planificationWorkPlanEngine.puml
new file mode 100644
index 0000000..9caad40
--- /dev/null
+++ b/doc/diagrams/planificationWorkPlanEngine.puml
@@ -0,0 +1,46 @@
+@startgantt
+
+!include skinparams.puml
+!include skinparamsGantt.puml
+
+printscale weekly
+Saturday are closed
+Sunday are closed
+
+Project starts 2021-01-11
+
+-- Preliminary research --
+[Previous works research] as [PWR] lasts 1 week
+[Algorithms research] as [AR] lasts 2 weeks
+
+-- Engine Implementation --
+[Engine modelling] as [EM] lasts 1 week
+[Engine implementation] as [EI] lasts 4 weeks
+
+-- Algorithms Implementations --
+[Monte Carlo implementation] as [MCI] lasts 4 weeks
+[Neural networks research] as [NNR] lasts 2 weeks
+[Neural networks implementation] as [NNI] lasts 3 weeks
+
+-- Testing --
+[Engine unit testing] as [EUT] lasts 4 weeks
+[System testing] as [ST] lasts 1 week
+
+-- Analysis --
+[Algorithms comparison] as [AC] lasts 2 weeks
+
+[PWR] -> [AR]
+[AR] -> [EM]
+
+[EM] -> [MCI]
+[EM] -> [EI]
+[EM] -> [EUT]
+
+[MCI] -> [NNR]
+[NNR] -> [NNI]
+
+[NNI] -> [ST]
+
+[ST] -> [AC]
+
+@endgantt
diff --git a/doc/diagrams/planificationWorkPlanGame.puml b/doc/diagrams/planificationWorkPlanGame.puml
new file mode 100644
index 0000000..ffaf72c
--- /dev/null
+++ b/doc/diagrams/planificationWorkPlanGame.puml
@@ -0,0 +1,30 @@
+@startgantt
+
+!include skinparams.puml
+!include skinparamsGantt.puml
+
+printscale weekly zoom 2
+Saturday are closed
+Sunday are closed
+
+Project starts 2020-11-02
+
+-- Preliminary research --
+[Previous works research] as [PWR] lasts 1 week
+
+-- Game Implementation --
+[Domain modelling] as [DM] lasts 1 week
+[Domain implementation] as [DI] lasts 6 weeks
+
+-- Testing --
+[Unit testing] as [UT] lasts 6 weeks
+[System testing] as [ST] lasts 1 week
+
+[PWR] -> [DM]
+
+[DM] -> [DI]
+[DM] -> [UT]
+
+[DI] -> [ST]
+
+@endgantt
diff --git a/doc/diagrams/skinparams.puml b/doc/diagrams/skinparams.puml
index cde3da7..d9dce03 100644
--- a/doc/diagrams/skinparams.puml
+++ b/doc/diagrams/skinparams.puml
@@ -1,9 +1,19 @@
@startuml
+'Old style
+'skin rose
+
skinparam {
- monochrome true
+ 'monochrome true
shadowing false
linetype polyline
}
+'skinparam {
+' shadowing false
+' ActorBorderColor #339933
+' ActorBackgroundColor #88FF88
+' linetype polyline
+'}
+
@enduml
diff --git a/doc/diagrams/skinparamsGantt.puml b/doc/diagrams/skinparamsGantt.puml
new file mode 100644
index 0000000..38a4b9b
--- /dev/null
+++ b/doc/diagrams/skinparamsGantt.puml
@@ -0,0 +1,14 @@
+@startuml
+
+<style>
+ganttDiagram {
+ task {
+ FontSize 10
+ }
+ separator {
+ FontSize 15
+ }
+}
+</style>
+
+@enduml
diff --git a/doc/diagrams/trainingModule.puml b/doc/diagrams/trainingModule.puml
new file mode 100644
index 0000000..81d5d72
--- /dev/null
+++ b/doc/diagrams/trainingModule.puml
@@ -0,0 +1,20 @@
+@startuml
+
+!include skinparams.puml
+
+package "Training module" {
+
+ !include SGF.pumlc
+ !include sgflex.pumlc
+ !include sgfyacc.pumlc
+ !include ASTNode.pumlc
+ !include Property.pumlc
+
+ SGF ..> sgfyacc
+ sgfyacc .> sgflex
+ sgfyacc ..> ASTNode
+ ASTNode .> Property
+
+}
+
+@enduml
diff --git a/doc/diagrams/useCase_generateAMove.puml b/doc/diagrams/useCase_generateAMove.puml
new file mode 100644
index 0000000..fa76edb
--- /dev/null
+++ b/doc/diagrams/useCase_generateAMove.puml
@@ -0,0 +1,24 @@
+@startuml
+
+!include skinparams.puml
+
+actor "GUI program / Human user" as user
+
+boundary "Engine CLI" as cli
+control "Play a stone" as playStone
+control "Think next move" as think
+entity "Board state" as state
+
+loop until desired board is set
+ user -> cli : play stone
+ cli -> playStone
+ playStone -> state
+ cli <- state
+end
+
+user -> cli : ask for move
+cli -> think
+think -> state
+cli <- state : Show move
+
+@enduml
diff --git a/doc/diagrams/useCase_playAMatch.puml b/doc/diagrams/useCase_playAMatch.puml
new file mode 100644
index 0000000..65d1517
--- /dev/null
+++ b/doc/diagrams/useCase_playAMatch.puml
@@ -0,0 +1,20 @@
+@startuml
+
+!include skinparams.puml
+
+actor "Player" as player
+
+boundary "Game CLI" as cli
+control "Play a stone" as playStone
+control "Show board" as showBoard
+entity "Board state" as state
+
+loop until game ends
+ player -> cli
+ cli -> playStone
+ playStone -> state
+ showBoard <- state
+ cli <- showBoard
+end
+
+@enduml
diff --git a/doc/diagrams/useCase_useAsBackend.puml b/doc/diagrams/useCase_useAsBackend.puml
new file mode 100644
index 0000000..9076769
--- /dev/null
+++ b/doc/diagrams/useCase_useAsBackend.puml
@@ -0,0 +1,32 @@
+@startuml
+
+!include skinparams.puml
+
+actor "Opponent" as opponent
+actor "GUI Program" as program
+
+boundary "Engine CLI" as cli
+control "Play a stone" as playStone
+control "Think next move" as think
+entity "Board state" as state
+
+loop until starting board is set
+ program -> cli : play stone
+ cli -> playStone
+ playStone -> state
+ cli <- state
+end
+
+loop until game ends
+ program -> cli : ask for move
+ cli -> think
+ think -> state
+ cli <- state : Show move
+ opponent -> program : give input
+ program -> cli : play stone
+ cli -> playStone
+ playStone -> state
+ cli <- state
+end
+
+@enduml
diff --git a/doc/diagrams/useCases.puml b/doc/diagrams/useCases.puml
new file mode 100644
index 0000000..8d4aa71
--- /dev/null
+++ b/doc/diagrams/useCases.puml
@@ -0,0 +1,18 @@
+@startuml
+
+!include skinparams.puml
+
+actor "Human Player" as player
+actor "GUI Program" as gui
+actor "Human User" as user
+
+usecase "Play a match" as play
+usecase "Use as backend for machine player" as backend
+usecase "Generate a move" as genMove
+
+player --> play
+gui --> backend
+user --> genMove
+gui --> genMove
+
+@enduml
diff --git a/doc/listings/convModel.txt b/doc/listings/convModel.txt
new file mode 100644
index 0000000..5c90975
--- /dev/null
+++ b/doc/listings/convModel.txt
@@ -0,0 +1,23 @@
+Model: "sequential"
+_________________________________________________________________
+ Layer (type) Output Shape Param #
+=================================================================
+ conv2d (Conv2D) (None, 9, 9, 32) 608
+
+ max_pooling2d (MaxPooling2D (None, 4, 4, 32) 0
+ )
+
+ conv2d_1 (Conv2D) (None, 4, 4, 64) 18496
+
+ max_pooling2d_1 (MaxPooling (None, 2, 2, 64) 0
+ 2D)
+
+ flatten (Flatten) (None, 256) 0
+
+ dense (Dense) (None, 82) 21074
+
+=================================================================
+Total params: 40,178
+Trainable params: 40,178
+Non-trainable params: 0
+_________________________________________________________________
diff --git a/doc/listings/convTraining.txt b/doc/listings/convTraining.txt
new file mode 100644
index 0000000..6108abc
--- /dev/null
+++ b/doc/listings/convTraining.txt
@@ -0,0 +1,40 @@
+Epoch 1/20
+39501/39501 - 279s - loss: 3.7391 - accuracy: 0.1064 - val_loss: 3.1316 - val_accuracy: 0.2023 - 279s/epoch - 7ms/step
+Epoch 2/20
+39501/39501 - 241s - loss: 2.6512 - accuracy: 0.3046 - val_loss: 2.0729 - val_accuracy: 0.4484 - 241s/epoch - 6ms/step
+Epoch 3/20
+39501/39501 - 214s - loss: 1.6459 - accuracy: 0.6014 - val_loss: 1.2040 - val_accuracy: 0.7143 - 214s/epoch - 5ms/step
+Epoch 4/20
+39501/39501 - 228s - loss: 0.9016 - accuracy: 0.8417 - val_loss: 0.6430 - val_accuracy: 0.8735 - 228s/epoch - 6ms/step
+Epoch 5/20
+39501/39501 - 230s - loss: 0.4704 - accuracy: 0.9380 - val_loss: 0.3520 - val_accuracy: 0.9378 - 230s/epoch - 6ms/step
+Epoch 6/20
+39501/39501 - 222s - loss: 0.2735 - accuracy: 0.9520 - val_loss: 0.2329 - val_accuracy: 0.9549 - 222s/epoch - 6ms/step
+Epoch 7/20
+39501/39501 - 215s - loss: 0.2117 - accuracy: 0.9495 - val_loss: 0.1837 - val_accuracy: 0.9583 - 215s/epoch - 5ms/step
+Epoch 8/20
+39501/39501 - 215s - loss: 0.1797 - accuracy: 0.9533 - val_loss: 0.1787 - val_accuracy: 0.9556 - 215s/epoch - 5ms/step
+Epoch 9/20
+39501/39501 - 225s - loss: 0.1607 - accuracy: 0.9553 - val_loss: 0.1952 - val_accuracy: 0.9446 - 225s/epoch - 6ms/step
+Epoch 10/20
+39501/39501 - 249s - loss: 0.1486 - accuracy: 0.9572 - val_loss: 0.1544 - val_accuracy: 0.9597 - 249s/epoch - 6ms/step
+Epoch 11/20
+39501/39501 - 208s - loss: 0.1380 - accuracy: 0.9586 - val_loss: 0.1467 - val_accuracy: 0.9651 - 208s/epoch - 5ms/step
+Epoch 12/20
+39501/39501 - 210s - loss: 0.1321 - accuracy: 0.9592 - val_loss: 0.1313 - val_accuracy: 0.9665 - 210s/epoch - 5ms/step
+Epoch 13/20
+39501/39501 - 204s - loss: 0.1276 - accuracy: 0.9598 - val_loss: 0.1282 - val_accuracy: 0.9665 - 204s/epoch - 5ms/step
+Epoch 14/20
+39501/39501 - 193s - loss: 0.1222 - accuracy: 0.9604 - val_loss: 0.1174 - val_accuracy: 0.9686 - 193s/epoch - 5ms/step
+Epoch 15/20
+39501/39501 - 183s - loss: 0.1182 - accuracy: 0.9607 - val_loss: 0.1747 - val_accuracy: 0.9433 - 183s/epoch - 5ms/step
+Epoch 16/20
+39501/39501 - 166s - loss: 0.1147 - accuracy: 0.9611 - val_loss: 0.1186 - val_accuracy: 0.9679 - 166s/epoch - 4ms/step
+Epoch 17/20
+39501/39501 - 163s - loss: 0.1119 - accuracy: 0.9616 - val_loss: 0.1112 - val_accuracy: 0.9699 - 163s/epoch - 4ms/step
+Epoch 18/20
+39501/39501 - 168s - loss: 0.1095 - accuracy: 0.9618 - val_loss: 0.1020 - val_accuracy: 0.9706 - 168s/epoch - 4ms/step
+Epoch 19/20
+39501/39501 - 161s - loss: 0.1072 - accuracy: 0.9625 - val_loss: 0.1058 - val_accuracy: 0.9699 - 161s/epoch - 4ms/step
+Epoch 20/20
+39501/39501 - 173s - loss: 0.1052 - accuracy: 0.9624 - val_loss: 0.1031 - val_accuracy: 0.9727 - 173s/epoch - 4ms/step
diff --git a/doc/listings/denseModel.txt b/doc/listings/denseModel.txt
new file mode 100644
index 0000000..006e321
--- /dev/null
+++ b/doc/listings/denseModel.txt
@@ -0,0 +1,17 @@
+Model: "sequential"
+_________________________________________________________________
+ Layer (type) Output Shape Param #
+=================================================================
+ dense (Dense) (None, 9, 9, 81) 243
+
+ dense_1 (Dense) (None, 9, 9, 81) 6642
+
+ flatten (Flatten) (None, 6561) 0
+
+ dense_2 (Dense) (None, 82) 538084
+
+=================================================================
+Total params: 544,969
+Trainable params: 544,969
+Non-trainable params: 0
+_________________________________________________________________
diff --git a/doc/listings/denseTraining.txt b/doc/listings/denseTraining.txt
new file mode 100644
index 0000000..0bfcb51
--- /dev/null
+++ b/doc/listings/denseTraining.txt
@@ -0,0 +1,40 @@
+Epoch 1/20
+148338/148338 - 1151s - loss: 1.1130 - accuracy: 0.6942 - val_loss: 0.6097 - val_accuracy: 0.8249 - 1151s/epoch - 8ms/step
+Epoch 2/20
+148338/148338 - 1084s - loss: 0.5366 - accuracy: 0.8572 - val_loss: 0.4744 - val_accuracy: 0.8617 - 1084s/epoch - 7ms/step
+Epoch 3/20
+148338/148338 - 1071s - loss: 0.4250 - accuracy: 0.8895 - val_loss: 0.4161 - val_accuracy: 0.8813 - 1071s/epoch - 7ms/step
+Epoch 4/20
+148338/148338 - 1118s - loss: 0.3678 - accuracy: 0.9066 - val_loss: 0.3493 - val_accuracy: 0.9024 - 1118s/epoch - 8ms/step
+Epoch 5/20
+148338/148338 - 1092s - loss: 0.3320 - accuracy: 0.9170 - val_loss: 0.3103 - val_accuracy: 0.9185 - 1092s/epoch - 7ms/step
+Epoch 6/20
+148338/148338 - 1097s - loss: 0.3078 - accuracy: 0.9241 - val_loss: 0.3132 - val_accuracy: 0.9145 - 1097s/epoch - 7ms/step
+Epoch 7/20
+148338/148338 - 1074s - loss: 0.2899 - accuracy: 0.9293 - val_loss: 0.2779 - val_accuracy: 0.9257 - 1074s/epoch - 7ms/step
+Epoch 8/20
+148338/148338 - 1114s - loss: 0.2762 - accuracy: 0.9330 - val_loss: 0.2709 - val_accuracy: 0.9246 - 1114s/epoch - 8ms/step
+Epoch 9/20
+148338/148338 - 1111s - loss: 0.2660 - accuracy: 0.9351 - val_loss: 0.2577 - val_accuracy: 0.9319 - 1111s/epoch - 7ms/step
+Epoch 10/20
+148338/148338 - 1104s - loss: 0.2563 - accuracy: 0.9374 - val_loss: 0.2446 - val_accuracy: 0.9388 - 1104s/epoch - 7ms/step
+Epoch 11/20
+148338/148338 - 1084s - loss: 0.2489 - accuracy: 0.9394 - val_loss: 0.2441 - val_accuracy: 0.9348 - 1084s/epoch - 7ms/step
+Epoch 12/20
+148338/148338 - 1088s - loss: 0.2419 - accuracy: 0.9407 - val_loss: 0.2538 - val_accuracy: 0.9337 - 1088s/epoch - 7ms/step
+Epoch 13/20
+148338/148338 - 1090s - loss: 0.2365 - accuracy: 0.9416 - val_loss: 0.2538 - val_accuracy: 0.9312 - 1090s/epoch - 7ms/step
+Epoch 14/20
+148338/148338 - 1063s - loss: 0.2314 - accuracy: 0.9430 - val_loss: 0.2484 - val_accuracy: 0.9308 - 1063s/epoch - 7ms/step
+Epoch 15/20
+148338/148338 - 1111s - loss: 0.2271 - accuracy: 0.9436 - val_loss: 0.2373 - val_accuracy: 0.9359 - 1111s/epoch - 7ms/step
+Epoch 16/20
+148338/148338 - 1124s - loss: 0.2235 - accuracy: 0.9443 - val_loss: 0.2542 - val_accuracy: 0.9257 - 1124s/epoch - 8ms/step
+Epoch 17/20
+148338/148338 - 1074s - loss: 0.2202 - accuracy: 0.9451 - val_loss: 0.2368 - val_accuracy: 0.9327 - 1074s/epoch - 7ms/step
+Epoch 18/20
+148338/148338 - 1120s - loss: 0.2181 - accuracy: 0.9453 - val_loss: 0.2462 - val_accuracy: 0.9286 - 1120s/epoch - 8ms/step
+Epoch 19/20
+148338/148338 - 1121s - loss: 0.2159 - accuracy: 0.9460 - val_loss: 0.2375 - val_accuracy: 0.9316 - 1121s/epoch - 8ms/step
+Epoch 20/20
+148338/148338 - 1115s - loss: 0.2154 - accuracy: 0.9458 - val_loss: 0.2273 - val_accuracy: 0.9352 - 1115s/epoch - 8ms/step
diff --git a/doc/listings/trainCommand.sh b/doc/listings/trainCommand.sh
new file mode 100644
index 0000000..a5f09c4
--- /dev/null
+++ b/doc/listings/trainCommand.sh
@@ -0,0 +1 @@
+./train.py $(ls ../collections/minigo/matches/*.sgf | shuf | head -n 50)
diff --git a/doc/tex/biber.bib b/doc/tex/biber.bib
new file mode 100644
index 0000000..d0a714e
--- /dev/null
+++ b/doc/tex/biber.bib
@@ -0,0 +1,156 @@
+@article{natureAlphaGo2016,
+ author = {David Silver and Aja Huang and Chris J. Maddison and Arthur Guez and Laurent Sifre and George van den Driessche and Julian Schrittwieser and Ioannis Antonoglou and Veda Panneershelvam and Marc Lanctot and Sander Dieleman and Dominik Grewe and John Nham and Nal Kalchbrenner and Ilya Sutskever and Timothy Lillicrap and Madeleine Leach and Koray Kavukcuoglu and Thore Graepel and Demis Hassabis},
+ title = {Mastering the game of Go with deep neural networks and tree search},
+ journaltitle = {Nature},
+ date = {2016-01-27},
+ url = {https://www.nature.com/articles/nature16961}
+}
+
+@online{gtp,
+ author = {Gunnar Farnebäck},
+ title = {GTP --- Go Text Protocol},
+ date = {2002},
+ urldate = {2021},
+ url = {https://www.lysator.liu.se/~gunnar/gtp}
+}
+
+@online{sgf,
+ author = {Arno Hollosi},
+ title = {SGF File Format FF[4]},
+ date = {2021},
+ urldate = {2022},
+ url = {https://www.red-bean.com/sgf}
+}
+
+@online{katago,
+ author = {David J Wu ("lightvector")},
+ title = {KataGo},
+ date = {2021},
+ urldate = {2021},
+ url = {https://github.com/lightvector/KataGo}
+}
+
+@online{gnugo,
+ title = {GNU Go},
+ organization = {Free Software Foundation},
+ date = {2019},
+ urldate = {2021},
+ url = {https://www.gnu.org/software/gnugo}
+}
+
+@online{sabaki,
+ author = {Yichuan Shen},
+ title = {Sabaki --- An elegant Go board and SGF editor for a more civilized age.},
+ date = {2019},
+ urldate = {2021},
+ url = {https://sabaki.yichuanshen.de}
+}
+
+@online{keras,
+ title = {Keras: the Python deep learning API},
+ urldate = {2022},
+ url = {https://keras.io}
+}
+
+@online{sl_go,
+ title = {Go},
+ organization = {Sensei's Library},
+ date = {2019},
+ urldate = {2021},
+ url = {https://senseis.xmp.net/?go}
+}
+
+@online{plantillaRedondo,
+ author = {J. M. Redondo},
+ title = {Documentos-modelo para Trabajos de Fin de Grado/Master de la Escuela de Informática de Oviedo},
+ date = {2019-06-17},
+ url = {https://www.researchgate.net/publication/327882831_Plantilla_de_Proyectos_de_Fin_de_Carrera_de_la_Escuela_de_Informatica_de_Oviedo}
+}
+
+@online{python_unittest,
+ title = {unittest --- Unit testing framework},
+ urldate = {2021},
+ url = {https://docs.python.org/3/library/unittest.html}
+}
+
+@online{python_coverage,
+ title = {Coverage.py},
+ urldate = {2021},
+ url = {https://coverage.readthedocs.io}
+}
+
+@online{matplotlib_heatmaps,
+ title = {Creating annotated heatmaps — Matplotlib 3.5.2 documentation},
+ urldate = {2022},
+ url = {https://matplotlib.org/stable/gallery/images_contours_and_fields/image_annotated_heatmap.html}
+}
+
+@online{python,
+ title = {Welcome to Python.org},
+ urldate = {2022},
+ url = {https://www.python.org}
+}
+
+@online{numpy,
+ title = {NumPy},
+ urldate = {2022},
+ url = {https://numpy.org}
+}
+
+@online{matplotlib,
+ title = {Matplotlib — Visualization with Python},
+ urldate = {2022},
+ url = {https://matplotlib.org}
+}
+
+@online{ply,
+ title = {PLY (Python Lex-Yacc)},
+ urldate = {2022},
+ url = {http://www.dabeaz.com/ply}
+}
+
+@online{vim,
+ title = {welcome home : vim online},
+ urldate = {2022},
+ url = {https://www.vim.org}
+}
+
+@online{neovim,
+ title = {Home - Neovim},
+ urldate = {2022},
+ url = {http://neovim.io}
+}
+
+@online{latex,
+ title = {LaTeX - A document preparation system},
+ urldate = {2022},
+ url = {https://www.latex-project.org}
+}
+
+@online{puml,
+ title = {Open-source tool that uses simple textual descriptions to draw beautiful UML diagrams.},
+ urldate = {2022},
+ url = {https://plantuml.com}
+}
+
+@online{sl_sword,
+ title = {9x9 Tengen Openings at Sensei's Library},
+ urldate = {2022},
+ url = {https://senseis.xmp.net/?9x9TengenOpenings}
+}
+
+@online{ogsLifeAndDeath,
+ author = {sunspark},
+ title = {Cho Chikun's Encyclopedia of Life and Death - Elementary: 1 / 900},
+ date = {2016},
+ urldate = {2022},
+ url = {https://online-go.com/puzzle/2824}
+}
+
+@online{fsf_free,
+ author = {Free Software Foundation},
+ title = {What is Free Software? - GNU Project - Free Software Foundation},
+ date = {2022},
+ urldate = {2022},
+ url = {https://www.gnu.org/philosophy/free-sw.html}
+}
diff --git a/doc/tex/conclusions.tex b/doc/tex/conclusions.tex
new file mode 100644
index 0000000..ebbf7fd
--- /dev/null
+++ b/doc/tex/conclusions.tex
@@ -0,0 +1,128 @@
+\section{Conclusions}
+
+Some problems found during the project, an evaluation of the results and what
+could be done in the future to improve the system are discussed here.
+
+\subsection{Problems with the Implementation of the Game}
+
+While Go has a simple set of rules, they lead to many borderline cases which
+must be specifically addressed. For example, the ko rule obliges to check the
+previous board positions after each move so no boards are repeated.
+
+These problems have been solved by designing the tree of moves of a match so
+each move stores the full board layout after it has been played. This of course
+increases the memory needed to run the application, but has been chosen over the
+alternative of having to recreate the board parsing the tree backwards for each
+move to check if ko is occurring, if a move makes a capture and which stones
+have already been captured, etc. It is the old problem of memory versus
+processing, which in this case has been answered with memory. Which one would be
+the best solution would require a deep analysis out of the scope of the project.
+
+\subsection{Problems with the Monte Carlo Tree Search Algorithm}
+
+The implementation Monte Carlo Tree Search algorithm was not precise by itself
+when asked for moves. This could be attributed to various factors:
+
+\begin{itemize}
+
+ \item The way the score is counted makes it difficult to evaluate who is
+ winning at the beginning or middle of the game, so the score of a move
+ has to be evaluated by running playing simulations. These simulations
+ are not precise on analyzing the result since the moves in them are
+ played at random.
+
+ \item The configuration used, 5 explorations with 10 simulations each for
+ cycle, does not allow for many good moves to be found.
+
+\end{itemize}
+
+To solve these problems, either a good score evaluation engine has to be
+implemented, which is another machine learning problem by itself, or the
+explorations and simulations of the engine tuned up to values unable to be run
+on the development hardware.
+
+\subsection{Problems with Neural Networks}
+
+Some concerns with the design and results of the neural networks are discussed
+on this section.
+
+\subsubsection{Finding the correct design}
+
+When approaching neural networks design with a basic understanding of their
+inner workings it is easy to get lost in all the different factors that can be
+tuned. The number and variant of layers, their number of nodes, their activation
+function, the learning rate; they can all be tweaked and doing so in the favour
+of the design requires a good knowledge of what is being done.
+
+The basic approach was to design the input and output shapes and then adjust the
+network based on that. At first, the desired output was a 9x9 two-dimensional
+matrix with the probabilities of playing on each move. A heatmap generated from
+a failed solution of this approach can be seen on \fref{fig:oldHM}, where the
+network distributed the probability for each row instead of the whole board. The
+fitting of shapes of input, internal layers and output has found to be tricky at
+first.
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=\textwidth]{img/matches/oldLineByLineHeatmap.png}
+ \caption{A heatmap from an old design of the dense neural network.}
+ \label{fig:oldHM}
+ Note that each row adds up to one, meaning that the engine is selecting
+ the best move for each row and not for the whole board.
+ \end{center}
+\end{figure}
+
+Finally, based on the design of classification networks where each possible
+class is mapped to a value in the one-dimensional output vector, it was decided
+that the output was not a two-dimensional matrix but a one-dimensional vector.
+This also helped address the possibility of passing, treating it as just another
+possible move that was previously left out because of not knowing how to fit it
+on the matrix of possible moves. This vector is then reshaped to a matrix
+representing the board when needed, for example to generate the heatmaps used
+for evaluation.
+
+\subsubsection{Mistakes on Networks' Play Patterns}
+
+One notable mistake made by the networks, specially the convolutional network,
+was passing to much. Passing is considered just another move, so the networks
+have no grasp that they should not pass until there are no more valuable moves
+to be made. A new design problem could be to create a specific passing policy.
+
+Another observation is that the engines seem to follow traditional openings and
+make reasonable decisions at the start of the game, with some interesting
+variations. But as the game progresses their moves make less sense. This could
+be because they have seen many examples of starting moves but complications at
+the middle and end game are much more diverse and the networks had not been
+trained on similar situations.
+
+\subsection{Viable Extensions}
+
+There are several ways this project could be improved, but were left out by lack
+of resources or time. Some interesting ones are explored on this section.
+
+\subsubsection{Joining Monte Carlo Tree Search and Neural Networks}
+
+The tree search algorithm is better at the end of the game, where the tree to
+explore is much more manageable. On the other hand, the neural networks are
+better at the beginning, where the positions are more common and patterns are
+simpler. The logical next step would be to join both: the network could select
+the best moves to be made, and the tree search algorithm could explore them to
+select the best and grow its explored tree in meaningful directions.
+
+This is also what was done by AlphaGo. By seeing the results obtained in this
+project it makes sense they made that decision.
+
+\subsubsection{Train the Engine by Itself}
+
+By training a game engine on human matches, it can at best get as good as the
+human players it has learned from.
+
+Top engines learn not from humans but by playing against themselves. This would
+be an interesting problem to tackle, if requiring a new approach to the design
+of the networks and a lot of training resources.
+
+\subsubsection{Presenting the Engine to the World}
+
+Some Go servers allow for bot players to be registered. This would provide a
+source of training against players from all around the world and also an
+evaluation over time of the engine strength.
diff --git a/doc/tex/imago.tex b/doc/tex/imago.tex
new file mode 100644
index 0000000..cc77673
--- /dev/null
+++ b/doc/tex/imago.tex
@@ -0,0 +1,178 @@
+\documentclass[12pt]{article}
+
+\usepackage{geometry}
+\usepackage{graphicx}
+\usepackage{booktabs}
+\usepackage{hyperref}
+\usepackage{csquotes}
+\usepackage{enumitem}
+\usepackage[indent=20pt]{parskip} % Space between paragraphs
+\usepackage{indentfirst} % Indent first paragraph of sections
+
+\geometry{left=3cm,top=2cm,bottom=2cm,right=3cm}
+
+\usepackage{chngcntr}
+
+\hypersetup{colorlinks=false,
+ linkcolor=black,
+ filecolor=black,
+ urlcolor=black,
+ bookmarks=true
+}
+
+\urlstyle{mono}
+
+\usepackage[backend=biber, style=numeric, sorting=none]{biblatex}
+\addbibresource{tex/biber.bib}
+
+\usepackage{minted} % Code importing and formatting
+\setminted{linenos, breaklines}
+
+\newcommand{\program}{Imago}
+
+\newcommand{\fref}[1]{Fig.~\ref{#1}}
+\newcommand{\flist}[1]{Listing~\ref{#1}}
+%\newcommand{\uurl}[1]{\underline{\url{#1}}}
+
+\newcommand{\tabitem}{~~\llap{\textbullet}~~}
+
+\begin{document}
+
+\frenchspacing
+
+\title{
+ \begin{center}
+ \includegraphics[width=0.4\textwidth]{img/logoUniovi.png}\hfill
+ \includegraphics[width=0.3\textwidth]{img/logoEII.png}
+ \end{center}~\\[10pt]
+ \program\\
+ \large An AI player of the game of Go
+}
+
+\author{Íñigo Gutiérrez Fernández}
+
+\date{}
+
+\maketitle
+
+\thispagestyle{empty}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=0.6\textwidth]{img/imago.jpg}
+ \end{center}
+\end{figure}
+
+\clearpage
+
+\begin{abstract}
+ The game of Go presents a complex problem for machine learning by virtue of
+ containing a very wide and deep decision tree. This project has tried to
+ tackle the problem by using different decision algorithms and also provides
+ a full implementation of the game. These tools could be used by players and
+ developers as a foundation for other machine learning projects or to simply
+ keep studying the game.
+\end{abstract}
+
+\clearpage
+
+\section*{Acknowledgements}
+
+To Vicente García Díaz, for helping me learning to program on my first year at
+the school and directing me in this project on my last.
+
+To José Manuel Redondo López\cite{plantillaRedondo}, for making an extensive
+template on which the structure of this documentation is extensively based.
+
+To all the people who have provided their time, support, ideas and company, all
+fundamental for this project.
+
+\clearpage
+
+\section*{Copyright notice}
+
+\begin{displayquote}
+
+ Copyright (C) 2021 \textbf{ÍÑIGO GUTIÉRREZ FERNÁNDEZ}.
+
+ \textit{Permission is granted to copy, distribute and/or modify this
+ document under the terms of the GNU Free Documentation License, Version 1.3
+ or any later version published by the Free Software Foundation; with the
+ Copyright notice as an Invariant Section, no Front-Cover Texts, and no
+ Back-Cover Texts. A copy of the license is included in the section
+ entitled ``GNU Free Documentation License''.}
+
+\end{displayquote}
+
+Although this document uses the GNU Free Documentation License to keep its
+contained information free, bear in mind that it isn't software documentation or
+a manual or guide of any kind, and serves just as the documentation for the
+author's Degree's Final Project.
+
+This document is based on a template by José Manuel Redondo López, associate
+professor of the University of Oviedo. The copyright notice he asks for
+inclusion to use this template is included here.
+
+\begin{displayquote}
+
+ Copyright (C) 2019 \textbf{JOSÉ MANUEL REDONDO
+ LÓPEZ}.\cite{plantillaRedondo}
+
+ \textit{Permission is granted to copy, distribute and/or modify this
+ document under the terms of the GNU Free Documentation License, Version 1.3
+ or any later version published by the Free Software Foundation; with no
+ Invariant Sections, no Front-Cover Texts, and no Back-Cover Texts. A copy
+ of the license is included in the section entitled ``GNU Free
+ Documentation License''.}
+
+\end{displayquote}
+
+\clearpage
+
+\setcounter{secnumdepth}{3}
+\setcounter{tocdepth}{4}
+\tableofcontents
+
+\clearpage
+
+\counterwithin{figure}{section}
+\renewcommand{\listfigurename}{Figures}
+\listoffigures
+
+\clearpage
+
+\renewcommand{\listoflistingscaption}{Listings}
+\counterwithin{listing}{section}
+\listoflistings
+
+\clearpage
+
+\input{tex/introduction.tex}
+\clearpage
+
+\input{tex/planification.tex}
+\clearpage
+
+\input{tex/systemAnalysis.tex}
+\clearpage
+
+\input{tex/systemDesign.tex}
+\clearpage
+
+\input{tex/implementation.tex}
+\clearpage
+
+\input{tex/results.tex}
+\clearpage
+
+\input{tex/conclusions.tex}
+\clearpage
+
+% References (bibliography)
+
+\setcounter{secnumdepth}{0}
+\section{References}
+\printbibliography[type=article,title={Cited articles},heading=subbibintoc]{}
+\printbibliography[type=online,title={Online resources},heading=subbibintoc]{}
+
+\end{document}
diff --git a/doc/tex/implementation.tex b/doc/tex/implementation.tex
index 9e42313..d46e805 100644
--- a/doc/tex/implementation.tex
+++ b/doc/tex/implementation.tex
@@ -1,64 +1,121 @@
\section{Implementation}
-\subsection{Engine}
-
-An engine implementing GTP.\@ It is designed to be used by a software controller
-but can also be directly run, mostly for debugging purposes. Its design is shown
-in \fref{fig:engine}
-
-\begin{figure}[h]
- \begin{center}
- \includegraphics[width=\textwidth]{diagrams/gtpEngine.png}
- \caption{Design of the GTP engine.}\label{fig:engine}
- \end{center}
-\end{figure}
-
-\subsection{Modules}
-
-One module to store the state of the game and the game tree. One module to parse
-moves. One module to read and write SGF files. Modules are shown in
-\fref{fig:modules}.
-
-\begin{figure}[h]
- \begin{center}
- \includegraphics[width=\textwidth]{diagrams/modules.png}
- \caption{Modules.}\label{fig:modules}
- \end{center}
-\end{figure}
-
-\subsection{Representation of a match}
-
-Strictly said, a match is composed of a series of moves. But since game review
-and variants exploration is an important part of Go learing, \program{} allows
-for navigation back and forth through the board states of a match and for new
-variants to be created from each of these board states. Therefore, a match is
-represented as a tree of moves. The state of the game must also be present so
-liberties, captures and legality of moves can be addressed, so it is represented
-with its own class, which holds a reference both to the game tree and the
-current move. This classes and their relationship can be seen in
-\fref{fig:gameRepresentation}.
-
-\begin{figure}[h]
- \begin{center}
- \includegraphics[width=0.7\textwidth]{diagrams/gameRepresentation.png}
- \caption{A game is represented as a tree of moves.}\label{fig:gameRepresentation}
- \end{center}
-\end{figure}
-
-\subsection{SGF}
-
-To parse SGF files a lexer and parser have been implemented using PLY.\@ The
-result of the parsing is an AST (Annotated Syntax Tree) reflecting the contents
-of the text input, each node with zero or more properties, and with the ability
-to convert themselves and their corresponding subtree into a GameTree. This is
-done for the root node, since from the SGF specification there are some
-properties only usable in the root node, like those which specify general game
-information and properties such as rank of players or komi. These components are
-shown in \fref{fig:sgfModule}.
-
-\begin{figure}[h]
- \begin{center}
- \includegraphics[width=\textwidth]{diagrams/sgfModule.png}
- \caption{Components of the SGF file parsing module.}\label{fig:sgfModule}
- \end{center}
-\end{figure}
+\subsection{Development Hardware}
+
+The development and evaluation machine is a Satellite L50-C laptop. Its
+specifications are shown as a list for readability.
+
+\begin{itemize}
+ \item \textbf{CPU}: Intel i5-6200U, 2.800GHz
+ \item \textbf{Integrated GPU}: Intel Skylake GT2
+ \item \textbf{Dedicated GPU}: Nvidia Geforce 930M
+ \item \textbf{RAM}: 8 GiB
+\end{itemize}
+
+\subsection{Development Software}
+
+The tools selected for the development of the project and the documentation are
+listed and explained on this section. All the tools used are either
+free\cite{fsf_free} or open source software. The development machine runs 64
+bits Arch Linux as its operating system.
+
+\subsubsection{Language}
+
+The programming language of choice is Python\cite{python}. The rationale behind
+this decision has been stated on Section \ref{sec:programmingLanguage}. It also
+allows easy use of the Keras library for implementing neural networks.
+
+Various python libraries have been used to easy the development process or
+assist in the analysis of results. These are:
+
+\paragraph{Keras/Tensorflow\cite{keras}}
+
+Tensorflow is a platform for machine learning which provides a diverse range of
+tools, one of which is a python library for machine learning.
+
+Keras is a high-level API for Tensorflow allowing for the easy definition of
+neural networks. It permits easily testing and comparing different network
+layouts.
+
+\paragraph{NumPy\cite{numpy}}
+
+A scientific package for python providing a lot of mathematical tools. The most
+interesting for this project are its capabilities to create and transform
+matrices.
+
+\paragraph{Matplotlib\cite{matplotlib}}
+
+A python library for creating graphs and other visualizations. It is used to
+show the likelihood of moves the neural networks of the project create from a
+board configuration.
+
+\paragraph{PLY\cite{ply}}
+
+A tool for generating compilers in Python. It is an implementation of the lex
+and yacc utilities, allowing to create lexers and parsers. It is used in the
+project to create the SGF parser which transform SGF files to internal
+representations of Go matches.
+
+\paragraph{Other utility libraries}
+
+These are some utility libraries commonly used for frequent programming tasks:
+
+\begin{itemize}
+ \item \textbf{sys}: to stop the execution of the program or access system info such
+ as primitives maximum values.
+ \item \textbf{os}: to interact with files.
+ \item \textbf{re}: to check strings with regular expressions.
+ \item \textbf{random}: to get random values, for example to obtain a random
+ item from a list.
+ \item \textbf{copy}: to obtain deep copies of multidimensional arrays.
+\end{itemize}
+
+\subsubsection{Development Tools}
+
+\paragraph{Neovim\cite{neovim}}
+
+A text editor based on Vim\cite{vim}, providing its same functionality with
+useful additions and defaults for modern computers and terminal emulators. With
+some extensions and configuration it can become a powerful development
+environment with a very fluid usage experience. That, and the fact that the
+developer considers Vim's modal editing the best writing experience possible on
+a computer, have made Neovim the editor of choice.
+
+%TODO: Write about neovim extensions
+%\begin{itemize}
+% \item FZF
+% \item Extensions
+%
+%\end{itemize}
+
+\subsubsection{Documentation Tools}
+
+\paragraph{\LaTeX\cite{latex}}
+
+A typesetting system widely used in the investigation field, among others. It
+allows for documentation like this text to be written in plain text and then
+compiled to PDF or other formats, which permits keeping the source files of the
+documentation small and organized plus other benefits of plain text such as
+being able to use version control.
+
+\paragraph{PlantUML\cite{puml}}
+
+A program which creates diagrams from plain text files. PlantUML supports syntax
+for many different sorts of diagrams, mainly but not only UML. It has been used
+to generate the diagrams used in this text.
+
+\paragraph{Make}
+
+A tool for specifying and handling dependencies on a build system. It reads a
+file, typically named ``Makefile'', containing which files are needed and on
+which other files each of them depends, and then generates those files or
+updates them if they already exist but their source files are newer than them.
+
+It has been used to generate this text from \LaTeX{} and PlantUML source files.
+The contents of the Makefile with which this document has been compiled are
+shown in \flist{code:makefile}.
+
+\begin{listing}[h]
+ \inputminted{make}{Makefile}
+ \caption{Documentation Makefile}\label{code:makefile}
+\end{listing}
diff --git a/doc/tex/interface.tex b/doc/tex/interface.tex
deleted file mode 100644
index 9caa78d..0000000
--- a/doc/tex/interface.tex
+++ /dev/null
@@ -1,6 +0,0 @@
-\section{Interface}
-
-\subsection{Importing and exporting games}
-
-The format chosen to read and write games is SGF (Smart Game Format). It is a
-widely used text format which allows for variants, comments and other metadata.
diff --git a/doc/tex/introduction.tex b/doc/tex/introduction.tex
index 6defbd9..fe5c205 100644
--- a/doc/tex/introduction.tex
+++ b/doc/tex/introduction.tex
@@ -12,5 +12,11 @@
game at heart, Go has nonetheless been interpreted as a stylized representation
of fighting a war, settling a frontier, cornering a market, thrashing out an
argument, or even of fortune-telling and prophecy. Go has always been one of the
- most played games in the world. \parencite{sl_go}
+ most played games in the world.\cite{sl_go}
\end{displayquote}
+
+As old and deep as Go is it has recently lived a revolution by the appearance of
+artificial intelligences with superhuman strength. While not expecting to
+achieve what a full team of developers and computer scientists at Google did,
+this project aims to evaluate how an engine able to play the game of Go could be
+created, implement such an engine and evaluate the results of the whole process.
diff --git a/doc/tex/planification.tex b/doc/tex/planification.tex
new file mode 100644
index 0000000..f0f7535
--- /dev/null
+++ b/doc/tex/planification.tex
@@ -0,0 +1,197 @@
+\section{Planning}
+
+\subsection{Driving Needs}
+
+As one of the deepest and most studied games in the world, Go presents a very
+interesting problem for artificial intelligence. Implementing not only the
+game's simple but subtle rules, but a system capable of playing it with a
+satisfying level of skill, is a task worth of pursuing as an exercise on
+software design, algorithmics and AI research.
+
+On the practical level, this project can be a foundation for the development of
+different Go analysis algorithms by providing an existing engine to house them,
+which can be of interest to Go players and software scientists alike.
+
+\subsection{Reach}
+
+Presented here are the ideal targets of the project.
+
+\begin{itemize}
+ \item An implementation of the game of Go, that is, a system for holding the
+ moves and variants of a match (a tree of moves) and the logic for the
+ game's rules.
+ \item An engine capable of analyzing board positions and generating strong
+ moves via various decision algorithms.
+ \item Either a GUI specifically developed for the project or an
+ implementation of an existing protocol so the engine can be used with
+ existing tools and GUIs.
+ \item A way for processing existing records of games, which are usually
+ recorded in the SGF format.
+\end{itemize}
+
+\subsection{Project Stages}
+
+The project will be organized in several stages based on the different
+components and needs.
+
+\subsubsection{Game Implementation}
+
+The rules of the game must be implemented, ideally in a way they can be tested
+by direct human play. This system will at its bare minimum represent the
+Japanese Go rules (area scoring, no superko rule, no suicide moves).
+
+\subsubsection{Engine Implementation}
+
+The key of this project is to create some kind of system able to generate strong
+moves based on any given board configuration: this will be such system. It will
+implement an existing protocol so it can be used with other compatible tools. It
+has to be able to receive game updates and configuration and to output moves for
+either player. It should also be modular enough so different algorithms can be
+selected and tested against each other as an experimental search for the best of
+them.
+
+\subsubsection{Artificial Intelligence Algorithms}
+
+Different algorithms for the engine to use should be implemented and tested. The
+results of this development and testing process should be presented as part of
+the final version of the project.
+
+\subsection{Logistics}
+
+The project will be developed by Íñigo Gutiérrez Fernández, student of the
+Computer Software Engineering Degree at the University of Oviedo, with
+supervision from Vicente García Díaz, Associate Professor in the Department of
+Computer Science at the University of Oviedo.
+
+The used material consists of a development and testing machine owned by the
+student with specifications stated later on the project plan.
+
+\subsection{Work Plan}
+
+The sole developer will be the student, who is currently working as a Junior
+Software Engineer on a 35 hour per week schedule and with no university
+responsibilities other than this project. Taking this into account, a sensible
+initial assumption is that he will be able to work 3 hours a day, Monday to
+Friday. Gantt diagrams for the planned working schedule are shown as
+\fref{fig:planificationWorkPlanGame} and
+\fref{fig:planificationWorkPlanEngine}.
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=\textwidth]{diagrams/planificationWorkPlanGame.png}
+ \caption{Initial work plan for implementing the game.
+ }\label{fig:planificationWorkPlanGame}
+ \end{center}
+\end{figure}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=\textwidth]{diagrams/planificationWorkPlanEngine.png}
+ \caption{Initial work plan for implementing the engine and algorithms.
+ }\label{fig:planificationWorkPlanEngine}
+ \end{center}
+\end{figure}
+
+\subsection{Previous Works}
+
+\subsubsection{Existing Engines}
+
+\paragraph{AlphaGo}
+
+A Go play and analysis engine developed by DeepMind Technologies, a company
+owned by Google. It revolutionized the world of Go in 2015 and 2016 when it
+respectively became the first AI to win against a professional Go player and
+then won against Lee Sedol, a Korean player of the highest professional rank and
+one of the strongest players in the world at the time. Its source code is
+closed, but a paper\cite{natureAlphaGo2016} written by the team and
+published on Nature is available on
+https://storage.googleapis.com/deepmind-media/alphago/AlphaGoNaturePaper.pdf.
+
+The unprecedented success of AlphaGo served as inspiration for many AI projects,
+including this one.
+
+\paragraph{KataGo\cite{katago}}
+
+An open source project based on the AlphaGo paper that also achieved superhuman
+strength of play. The availability of its implementation and documentation
+presents a great resource for this project.
+
+\paragraph{GnuGo\cite{gnugo}}
+
+A software capable of playing Go part of the GNU project. Although not a strong
+engine anymore, it is interesting for historic reasons as the free software
+engine for which the GTP protocol was first defined.
+
+\subsubsection{Existing Standards}
+
+\paragraph{GTP\cite{gtp}}
+
+GTP (\textit{Go Text Protocol}) is a text based protocol for
+communication with computer go programs. It is the protocol used by GNU Go and
+the more modern and powerful KataGo. By supporting GTP the engine developed for
+this project can be used with existing GUIs and other programs, making it easier
+to use it with the tools users are already familiar with.
+
+\paragraph{SGF\cite{sgf}}
+
+SGF (\textit{Smart Go Format} or, in a more general context, \textit{Smart Game
+Format}) is a text format widely used for storing records of Go matches which
+allows for variants, comments and other metadata. It was devised for Go but it
+supports other games with similar turn-based structure. Many popular playing
+tools use it. By supporting SGF vast existing collections of games, such as
+those played on online Go servers, can be used to train the decision algorithms
+based on neural networks.
+
+\subsubsection{Sabaki\cite{sabaki}}
+
+Sabaki is a go board software compatible with GTP engines. It can serve as a GUI
+for the engine developed in this project and as an example of the advantages of
+following a standardized protocol.
+
+\subsubsection{Keras\cite{keras}}
+
+Keras is a deep learning API for Python allowing for the high-level definition
+of neural networks. This permits easily testing and comparing different network
+layouts.
+
+\subsection{Technological Infrastructure}
+
+\subsubsection{Programming Language}\label{sec:programmingLanguage}
+
+The resulting product of this project will be one or more pieces of software
+able to be run locally on a personal computer. The programming language of
+choice is Python\cite{python}, for various reasons:
+
+\begin{itemize}
+
+ \item It has established a reputation on scientific fields and more
+ specifically on AI research and development.
+ \item Interpreters are available for many platforms, which allows the most
+ people possible to access the product.
+ \item Although not very deeply, it has been used by the developer student
+ during its degree including in AI and game theory contexts.
+
+\end{itemize}
+
+\subsubsection{Interface}
+
+Both the game and the engine will offer a text interface. For the game this
+allows for quick human testing. For the engine it is mandated by the protocol,
+since GTP is a text based protocol for programs using text interfaces.
+Independent programs compatible with this interface can be used as a GUI.
+
+There is also the need of an interface with SGF files so existing games can be
+processed by the trainer.
+
+Both the engine and the trainer will need to interface with the files storing
+the neural network models.
+
+The systems' interfaces are shown in \fref{fig:interfaces}.
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=\textwidth]{diagrams/interfaces.png}
+ \caption{Interfaces of the three components of the project.}
+ \label{fig:interfaces}
+ \end{center}
+\end{figure}
diff --git a/doc/tex/previousWorks.tex b/doc/tex/previousWorks.tex
deleted file mode 100644
index 6ba5dce..0000000
--- a/doc/tex/previousWorks.tex
+++ /dev/null
@@ -1,21 +0,0 @@
-\section{Previous works}
-
-\subsection{SGF}
-
-SGF (\textit{Smart Go Format} or \textit{Smart Game Format}) is a text file
-format specification for records of games or even collections of them. It was
-devised for Go but it supports other games with similar turns structure. It
-supports move variations, annotations, setups and game metadata. By supporting
-SGF, our application can be used to analyse existing games registered by other
-applications, such as those played on online Go servers.
-
-The SGF specification can be found at
-\url{https://www.red-bean.com/sgf/user_guide/index.html}
-
-\subsection{GTP}
-
-GTP (\textit{Go Text Protocol}) is a text based protocol for communication with
-computer go programs. [ref https://www.lysator.liu.se/~gunnar/gtp/] It is the
-protocol used by GNU Go and the more modern and powerful KataGo. By supporting
-GTP, our application can be used with existing GUIs and other programs, making
-it easier to use it with the tools users are already familiar with.
diff --git a/doc/tex/results.tex b/doc/tex/results.tex
new file mode 100644
index 0000000..3c586e4
--- /dev/null
+++ b/doc/tex/results.tex
@@ -0,0 +1,416 @@
+\newcommand{\boards}[5]{
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=0.4\textwidth]{#1}
+ \includegraphics[width=0.4\textwidth]{#2}
+ \caption{#3}
+ \label{#4}
+ #5
+ \end{center}
+\end{figure}
+}
+
+\newcommand{\moveHeatmap}[9]{
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=0.35\textwidth]{#1}
+ \includegraphics[width=0.5\textwidth]{#2}
+ \\[\smallskipamount]
+ \includegraphics[width=0.35\textwidth]{#3}
+ \includegraphics[width=0.5\textwidth]{#4}
+ \\[\smallskipamount]
+ \includegraphics[width=0.35\textwidth]{#5}
+ \includegraphics[width=0.5\textwidth]{#6}
+ \caption{#7}
+ \label{#8}
+ #9
+ \end{center}
+\end{figure}
+}
+
+\section{Results}
+
+\subsection{Monte Carlo Tree Search Evaluation}
+
+The Monte Carlo Algorithm tries to explore the tree of possibilities as
+efficiently as possible. With this approach, it can be expected to fail when
+alone on a problem such big as the game of Go. Nonetheless, there are some areas
+where it can be useful. It will be evaluated by its capabilities while playing
+games but also when presented with go problems.
+
+The Monte Carlo algorithm has been set to do 5 explorations with 10 simulations
+each when it is asked for a move. In the hardware used this makes it think for
+40 seconds on an empty 9x9 board.
+
+\subsubsection{Monte Carlo Tree Search against itself}
+
+\boards
+{img/matches/mctsVSmcts01.jpg}
+{img/matches/mctsVSmcts02.jpg}
+{Monte Carlo Tree Search against itself.}
+{fig:mctsVSmcts}
+{Both boards are from the same match. The first shows only the first 12 moves
+for clarity. The second shows the finished game.}
+
+When set to play against itself the algorithm shows what looks like random play.
+Some moves could be debated as sensible, but many of them are on the second or
+fist line, which so early on the game are the two worst places to play at.
+
+It seems clear that this algorithm, at least with this specific configuration,
+can't handle the size of an empty Go board, even on the 9x9 size.
+
+A record of the game is shown in \fref{fig:mctsVSmcts}.
+
+\subsubsection{Monte Carlo Tree Search against Go problems}
+
+\boards
+{img/problems/mctsProblem01.jpg}
+{img/problems/mctsProblem02.jpg}
+{Monte Carlo against the first of Cho Chikun's problems.}
+{fig:mctsProblem01}
+
+Since tree exploration on smaller boards or advanced games with little empty
+spaces should be easier the algorithm has also been tested on some Go problems.
+
+A Go problem or tsumego is a predefined layout of the board, or of a section of
+the board, for which the player must find some beneficial move. Life and death
+problems are a subset of tsumegos in which the survival of a group depends on
+finding the correct sequence to save or kill the group. One collection of such
+tsumegos is \textit{Cho Chikun's Encyclopedia of Life and Death}, part of which
+are available on OGS\cite{ogsLifeAndDeath}, an online go server.
+
+The first of these problems and what the algorithm suggested as moves is shown
+in \fref{fig:mctsProblem01}.
+
+Black makes the first move, which means the solution is to find some favorable
+outcome for black, which in this case is killing the white group. The white
+group has a critical point on B1. If white plays on B1 they make two eyes and
+live, but if black plays there first white can't make two eyes and dies, so B1
+is the solution to the tsumego. This is one of the easiest Go problems.
+
+The algorithm neglects this solution. While asked five times to generate a move
+for the starting position it suggested B1 only once.
+
+But notably, after making another move, it consistently suggested B1 for white,
+which is the solution now that white has to play. So in the end it was able to
+solve the tsumego, probably because after making a move it had already explored
+part of the tree but it was difficult that it explored the solution for the
+first move.
+
+The engine was tested against other tsumegos but it was not able to solve them,
+so no more are shown here.
+
+\subsection{Neural Network Training}
+
+Each network has been training by receiving batches of SGF files which are first
+converted to lists of moves by the Training System and then provided to the
+train function of the networks. This has been executed with the following
+command:
+
+\inputminted[fontsize=\small]{bash}{listings/trainCommand.sh}
+
+Which lists the contents of a folder containing multiple SGF files, shuffles the
+list, takes some of them and passes them to train.py as arguments. The combined
+list of game positions and moves made from them in all the games selected make
+up the sample of the training. The number of files selected can of course be
+adapted to the situation.
+
+The networks were configured to train for 20 epochs, that is, processing the
+full batch and updating the weights on the network 20 times. 10\% of the sample
+were used as validation. This means they were not used for training but to
+check the accuracy and loss of the network after training with the rest of
+the batch. This technique of validation can help detect overfitting, which
+happens when a network does a very good job on the population it has been
+trained on but it fails when receiving unseen data.
+
+The training shows loss decrementing and accuracy incrementing on each epoch for
+both training and validation samples, which suggests there is learning happening
+and no overfitting occurring.
+
+The number of files to train on has been selected by trying to keep the
+resulting training time manageable for the developer. It was found that
+incrementing the files per batch did not increment the training time linearly,
+as with batches of 10 games an epoch of training could be completed in one
+minute, in three minutes batches of 20 games, and in up to an hour with batches
+of 100 games.
+
+The outputs from this training process can be seen on \flist{code:denseTraining}
+and \flist{code:convTraining} for the dense network and the convolutional
+network respectively.
+
+\begin{listing}[h]
+ \inputminted[fontsize=\scriptsize]{text}{listings/denseTraining.txt}
+ \caption{Dense neural network training log.}
+ \label{code:denseTraining}
+\end{listing}
+
+\begin{listing}[h]
+ \inputminted[fontsize=\scriptsize]{text}{listings/convTraining.txt}
+ \caption{Convolutional neural network training log.}
+ \label{code:convTraining}
+\end{listing}
+
+\subsection{Neural Network Evaluation}
+
+One way of studying the results of the training could be to programmatically
+test if the network is able to predict human moves when provided with a game
+file. This has the drawback of not directly testing the strength of the network,
+since it would be tested on predicting the moves of some human player, whose
+level could greatly vary, and not on its playing capabilities alone. This also
+has already been tested to some extent by the validation portion of the samples
+providing for training, and the results show the network increasing its accuracy
+of predicting human moves through the training epochs.
+
+Another way is to make the network play either against itself, another network,
+or a human player, and analyze the score it provides to each possible play. The
+output of the network is a vector with the likelihood of making each move, so
+we can take this values as how strongly the engine suggests each of them.
+
+\subsection{Neural Networks Against Themselves}
+
+The case of neural networks playing against themselves is interesting in that it
+shows moves with high certainty, that is, the network strongly suggests a
+specific move. It can be thought that this would be the most common line of play
+the engine has seen, with one certain move leading into another.
+
+This happened for both the dense neural network and the convolutional network.
+
+\subsubsection{Dense network Against Itself}
+
+The initial moves of a match of the dense network against itself, along with
+heatmaps showing the output from the network (which chance it gives for each
+move), can be seen on Figs.~\ref{fig:denseVSdense01}, \ref{fig:denseVSdense02},
+\ref{fig:denseVSdense03} and \ref{fig:denseVSdense04}.
+
+The dense network starts on the center of the board, which is one of the
+standard openings in the 9x9 board. It starts on a very good track, but we must
+acknowledge that the empty board is a position present on every go match it has
+trained on and so it should know it well. It probably means the center was the
+most played opening in the sample. It is interesting to check the heatmap of
+this move, since the selected move has only a score of 0.27. Other common
+openings on the 9x9 are represented on the vertices with some significant score.
+
+The heatmap of the response to the center play is also interesting. The four
+highest scored moves are equivalent, since the first move has not broken any
+symmetry. The move they represent, two spaces from the first stone, is also the
+consensual response. The three moves following in score are also equivalent
+between them.
+
+The first white stone has broken the symmetry in one direction, and so the
+second black move is suggested with more likelihood than the previous one. This
+is also a very common sequence of play.
+
+The following moves are a white attack followed by black's sensible response,
+and a strong white extension (arguably to the wrong side, but the minutia of why
+the other side would be better is probably not grasped by the engine). The
+following moves could be called looking for complication, which is a strategy.
+
+Overall some moves could be criticised but the engine is showing at least a
+basic knowledge of the game's strategy.
+
+\subsubsection{Convolutional Network Against Itself}
+
+The same information on a match of the convolutional network against itself can
+be seen on Figs.~\ref{fig:convVSconv01}, \ref{fig:convVSconv02},
+\ref{fig:convVSconv03} and \ref{fig:convVSconv04}.
+
+The convolutional network also likes to start on the center of the board and is
+more certain of the move than the dense network. Its next two plays are also the
+same, but the match starts to diverge from the fourth move.
+
+Instead of attacking the black stone on the side, white plays directly under at
+B5, keeping the edge of symmetry. This is strategically important because while
+symmetry is present playing on either side makes no difference, while playing
+after the opponent has broken symmetry gives the opportunity to respond and
+capitalize on the now better side to play.
+
+Black responds to the white stone by attacking it at B4 and white then extends
+to the more open side with F7.
+
+The match up to this point is discussed on Sensei's Library as an interesting
+sequence deriving from the center first stone\cite{sl_sword}. The discussion
+there states that white should have extended to the other side.
+
+The following moves are some sensible continuations, with approaches and
+responses on each side. They are probably not the best moves, but the idea
+behind them can be read from the board.
+
+\subsubsection{Dense Network Against Convolutional}
+
+The first 12 and the last 6 moves of a match of the dense network against the
+convolutional network can be seen on be seen on Figs.~\ref{fig:denseVSconv01},
+\ref{fig:denseVSconv02}, \ref{fig:denseVSconv03}, \ref{fig:denseVSconv04},
+\ref{fig:denseVSconv05} and \ref{fig:denseVSconv06}.
+
+The dense network is given black. The convolutional network plays then as white.
+
+The first three moves are known territory for both networks, since both play the
+same sequence when matched against themselves.
+
+After white plays under the black stone as the fourth move, black makes a maybe
+too careful extension, but it seemed very sure about it. Now white has some
+doubts. It seems to like the extensions to both sides, if a bit more to the more
+open side, a preference both engines have previously shown at this point of the
+match. The move it prefers the most, though, would be to play again under black.
+So, as this move is impossible, it defers to the extension to the open side with
+F3.
+
+Black now makes the mistake of overattacking the lone white stone on B5 with B6,
+and white capitalizes on it by keeping extending with D3. B5 is still a move
+with a not negligible score, but it is no longer the highest.
+
+The following moves are questionable, with black keeping building a very tight
+group and getting no territory and white attacking too directly with a lone
+stone into that strong group.
+
+In the final moves of the game we see that black has built a living group on the
+right side and things are looking good for it on the rest of the board. White
+has passed a bunch of times, starting too early, which means it gives too high
+an importance to passing. Since the networks learned only by seeing moves in
+response to boards, it has not learnt that it should not pass until there is no
+more to gain. But it is also important to note that passing was not the most
+likely move for the engine to make, it just happens that the move it would like
+to make is already taken and the highest chance available move is to pass.
+
+\moveHeatmap
+{img/matches/denseVSdense_board_01.jpg}
+{img/matches/denseVSdense_heatmap_01.png}
+{img/matches/denseVSdense_board_02.jpg}
+{img/matches/denseVSdense_heatmap_02.png}
+{img/matches/denseVSdense_board_03.jpg}
+{img/matches/denseVSdense_heatmap_03.png}
+{Dense network against itself, moves 1 through 3.}
+{fig:denseVSdense01}
+
+\moveHeatmap
+{img/matches/denseVSdense_board_04.jpg}
+{img/matches/denseVSdense_heatmap_04.png}
+{img/matches/denseVSdense_board_05.jpg}
+{img/matches/denseVSdense_heatmap_05.png}
+{img/matches/denseVSdense_board_06.jpg}
+{img/matches/denseVSdense_heatmap_06.png}
+{Dense network against itself, moves 4 through 6.}
+{fig:denseVSdense02}
+
+\moveHeatmap
+{img/matches/denseVSdense_board_07.jpg}
+{img/matches/denseVSdense_heatmap_07.png}
+{img/matches/denseVSdense_board_08.jpg}
+{img/matches/denseVSdense_heatmap_08.png}
+{img/matches/denseVSdense_board_09.jpg}
+{img/matches/denseVSdense_heatmap_09.png}
+{Dense network against itself, moves 7 through 9.}
+{fig:denseVSdense03}
+
+\moveHeatmap
+{img/matches/denseVSdense_board_10.jpg}
+{img/matches/denseVSdense_heatmap_10.png}
+{img/matches/denseVSdense_board_11.jpg}
+{img/matches/denseVSdense_heatmap_11.png}
+{img/matches/denseVSdense_board_12.jpg}
+{img/matches/denseVSdense_heatmap_12.png}
+{Dense network against itself, moves 10 through 12.}
+{fig:denseVSdense04}
+
+\moveHeatmap
+{img/matches/convVSconv_board_01.jpg}
+{img/matches/convVSconv_heatmap_01.png}
+{img/matches/convVSconv_board_02.jpg}
+{img/matches/convVSconv_heatmap_02.png}
+{img/matches/convVSconv_board_03.jpg}
+{img/matches/convVSconv_heatmap_03.png}
+{Convolutional network against itself, moves 1 through 3.}
+{fig:convVSconv01}
+
+\moveHeatmap
+{img/matches/convVSconv_board_04.jpg}
+{img/matches/convVSconv_heatmap_04.png}
+{img/matches/convVSconv_board_05.jpg}
+{img/matches/convVSconv_heatmap_05.png}
+{img/matches/convVSconv_board_06.jpg}
+{img/matches/convVSconv_heatmap_06.png}
+{Convolutional network against itself, moves 4 through 6.}
+{fig:convVSconv02}
+
+\moveHeatmap
+{img/matches/convVSconv_board_07.jpg}
+{img/matches/convVSconv_heatmap_07.png}
+{img/matches/convVSconv_board_08.jpg}
+{img/matches/convVSconv_heatmap_08.png}
+{img/matches/convVSconv_board_09.jpg}
+{img/matches/convVSconv_heatmap_09.png}
+{Convolutional network against itself, moves 7 through 9.}
+{fig:convVSconv03}
+
+\moveHeatmap
+{img/matches/convVSconv_board_10.jpg}
+{img/matches/convVSconv_heatmap_10.png}
+{img/matches/convVSconv_board_11.jpg}
+{img/matches/convVSconv_heatmap_11.png}
+{img/matches/convVSconv_board_12.jpg}
+{img/matches/convVSconv_heatmap_12.png}
+{Convolutional network against itself, moves 10 through 12.}
+{fig:convVSconv04}
+
+\moveHeatmap
+{img/matches/denseVSconv_board_01.jpg}
+{img/matches/denseVSconv_heatmap_01.png}
+{img/matches/denseVSconv_board_02.jpg}
+{img/matches/denseVSconv_heatmap_02.png}
+{img/matches/denseVSconv_board_03.jpg}
+{img/matches/denseVSconv_heatmap_03.png}
+{Dense network against convolutional, moves 1 through 3.}
+{fig:denseVSconv01}
+{The dense network plays as black.}
+
+\moveHeatmap
+{img/matches/denseVSconv_board_04.jpg}
+{img/matches/denseVSconv_heatmap_04.png}
+{img/matches/denseVSconv_board_05.jpg}
+{img/matches/denseVSconv_heatmap_05.png}
+{img/matches/denseVSconv_board_06.jpg}
+{img/matches/denseVSconv_heatmap_06.png}
+{Dense network against convolutional, moves 4 through 6.}
+{fig:denseVSconv02}
+
+\moveHeatmap
+{img/matches/denseVSconv_board_07.jpg}
+{img/matches/denseVSconv_heatmap_07.png}
+{img/matches/denseVSconv_board_08.jpg}
+{img/matches/denseVSconv_heatmap_08.png}
+{img/matches/denseVSconv_board_09.jpg}
+{img/matches/denseVSconv_heatmap_09.png}
+{Dense network against convolutional, moves 7 through 9.}
+{fig:denseVSconv03}
+
+\moveHeatmap
+{img/matches/denseVSconv_board_10.jpg}
+{img/matches/denseVSconv_heatmap_10.png}
+{img/matches/denseVSconv_board_11.jpg}
+{img/matches/denseVSconv_heatmap_11.png}
+{img/matches/denseVSconv_board_12.jpg}
+{img/matches/denseVSconv_heatmap_12.png}
+{Dense network against convolutional, moves 10 through 12.}
+{fig:denseVSconv04}
+
+\moveHeatmap
+{img/matches/denseVSconv_board_72.jpg}
+{img/matches/denseVSconv_heatmap_72.png}
+{img/matches/denseVSconv_board_73.jpg}
+{img/matches/denseVSconv_heatmap_73.png}
+{img/matches/denseVSconv_board_74.jpg}
+{img/matches/denseVSconv_heatmap_74.png}
+{Dense network against convolutional, moves 72 through 74.}
+{fig:denseVSconv05}
+
+\moveHeatmap
+{img/matches/denseVSconv_board_75.jpg}
+{img/matches/denseVSconv_heatmap_75.png}
+{img/matches/denseVSconv_board_76.jpg}
+{img/matches/denseVSconv_heatmap_76.png}
+{img/matches/denseVSconv_board_77.jpg}
+{img/matches/denseVSconv_heatmap_77.png}
+{Dense network against convolutional, moves 75 through 77.}
+{fig:denseVSconv06}
+
+% Needed line so the processing of the last command doesn't find an EOF
diff --git a/doc/tex/systemAnalysis.tex b/doc/tex/systemAnalysis.tex
new file mode 100644
index 0000000..c3c6aa8
--- /dev/null
+++ b/doc/tex/systemAnalysis.tex
@@ -0,0 +1,892 @@
+\section{System Analysis}
+
+\subsection{System Reach Determination}
+
+These are the main goals the final product must reach.
+
+\begin{enumerate}
+
+ \item The implementation, analysis and comparison of different decision
+ algorithms for genarating moves. This is the main goal and the following
+ ones are derived from the need of reaching it.
+
+ \item A library for representing the game of Go. It can be used for the
+ decision algorithms to keep the state of the game and can also be used
+ in an interactive application for a user to play the game and test the
+ code.
+
+ \item An engine program as a way of presenting an interface for using these
+ algorithms. The engine will use the GTP so it can be used with an
+ existing GUI or other tools.
+
+ \item A parser for SGF files so they can be processed in the training of
+ neural networks.
+
+\end{enumerate}
+
+\subsection{System Requirements}
+
+The requirements for the system are expressed here in a nested list way, each of
+them with a textual and numeric reference for them to be traceable. The
+functional requirements are exposed first, followed by the other kinds of
+requisites needed for the system.
+
+\setlist[enumerate,2]{label*=\arabic*.}
+\setlist[enumerate,3]{label*=\arabic*.}
+
+\subsubsection{Functional Requirements}
+
+\paragraph{Game Requirements}
+
+\setlist[enumerate,1]{label=FRG \arabic*.}
+
+\begin{enumerate}
+
+ \item The game program is interactive.
+
+ \item Movements can be introduced to be played on the board.
+ \begin{enumerate}
+ \item A move is introduced as the textual representation of the
+ coordinates of the vertex to play on or as ``pass''.
+ \begin{enumerate}
+ \item The text introduced for the move must follow the
+ regular expression \texttt{([A-Z][0-9]+|pass)}
+ \item If the move is not valid it must be notified to the
+ user and another move asked for.
+ \end{enumerate}
+ \end{enumerate}
+
+ \item The state of the board can be shown to the user.
+ \begin{enumerate}
+ \item A text representation of each cell is printed.
+ \begin{enumerate}
+ \item A different character is used for each different state
+ of a cell.
+ \end{enumerate}
+ \item The coordinates system is shown around the board.
+ \begin{enumerate}
+ \item Columns are shown as capital letters left to right
+ starting with ``A'' and skipping ``I''.
+ \item Rows are shown as numbers starting with 1 on the
+ lowest row and increasing upwards.
+ \end{enumerate}
+ \end{enumerate}
+
+ \item The board will behave according to the Japanese rules of Go.
+
+\end{enumerate}
+
+\paragraph{Engine Requirements}
+
+\setlist[enumerate,1]{label=FRE \arabic*.}
+
+\begin{enumerate}
+
+ \item The engine program is interactive.
+
+ \item The engine implements the GTP (\textit{Go Text Protocol}) for its
+ interface.
+ \begin{enumerate}
+ \item Commands are read from standard input.
+ \item Responses are provided via standard output.
+ \item There exist commands to set up the conditions of the match.
+ \begin{enumerate}
+ \item The size of the board can be set.
+ \item The komi can be set.
+ \end{enumerate}
+ \item There exist commands to manipulate the internal representation
+ of the match.
+ \begin{enumerate}
+ \item It is possible to indicate a move being played.
+ \item It is possible to clear the board.
+ \end{enumerate}
+ \item There exists a command to generate a move.
+ \begin{enumerate}
+ \item The generated move must be a playable move.
+ \item Generating a move does not change the internal
+ representation of the match.
+ \end{enumerate}
+ \item There exist commands to ask for information about the engine.
+ \begin{enumerate}
+ \item It is possible to ask for the protocol version
+ implemented.
+ \item It is possible to ask for the name of the engine.
+ \item It is possible to ask for the version of the engine.
+ \item It is possible to ask whether a specific command is
+ known to the engine.
+ \item It is possible to ask for a list of the known commands.
+ \end{enumerate}
+ \item There exists a command to stop the engine.
+ \end{enumerate}
+
+ \item The engine can be executed from the command line.
+ \begin{enumerate}
+ \item The engine can be executed directly from an interactive shell.
+ \item The engine can be executed by another program to be used as
+ backend.
+ \end{enumerate}
+
+\end{enumerate}
+
+\paragraph{Trainer Requirements}
+
+\setlist[enumerate,1]{label=FRT \arabic*.}
+
+\begin{enumerate}
+
+ \item The trainer program is non-interactive.
+
+ \item The trainer can be executed from the command line.
+ \begin{enumerate}
+ \item The trainer can be executed directly from an interactive shell.
+ \end{enumerate}
+
+ \item The trainer can interact with stored neural network models.
+ \begin{enumerate}
+ \item The trainer can read stored models to continue training them.
+ \item The trainer can store model files after their training.
+ \end{enumerate}
+
+ \item The trainer can import existing games.
+ \begin{enumerate}
+ \item Records of games stored as SGF can be imported.
+ \item Files containing records of games are provided as arguments to
+ the trainer.
+ \end{enumerate}
+
+\end{enumerate}
+
+%\subsubsection{Security Requirements}
+%
+%\setlist[enumerate,1]{label=SR \arabic*.}
+
+\subsubsection{Usability Requirements}
+
+\setlist[enumerate,1]{label=UR \arabic*.}
+
+\begin{enumerate}
+
+ %TODO: Implement this
+ \item The engine executable will include a help option with the different
+ modes of execution.
+
+\end{enumerate}
+
+\subsubsection{User Requirements}
+
+\setlist[enumerate,1]{label=USR \arabic*.}
+
+\begin{enumerate}
+
+ \item For understanding the workings of the application the user needs to be
+ familiar with the basics of the game of Go.
+
+ \item For directly using the engine the user needs to be familiar with
+ command line interfaces.
+
+ \item For directly using the trainer the user needs to know the different
+ network models available.
+
+\end{enumerate}
+
+\subsubsection{Technological Requirements}
+
+\setlist[enumerate,1]{label=TR \arabic*.}
+
+\begin{enumerate}
+
+ \item The game program will be a python file able to be executed by the
+ python interpreter.
+
+ \item The game program will make use of standard input and standard output
+ for communication.
+ \begin{enumerate}
+ \item Standard input will be used for reading moves.
+ \item Standard output will be used for showing the board.
+ \item Standard output will be used for messages directed to the user.
+ \end{enumerate}
+
+ \item The engine program will be a python file able to be executed by the
+ python interpreter.
+
+ \item The engine program will make use of standard input and standard output
+ for communication.
+ \begin{enumerate}
+ \item Standard input will be used for reading commands.
+ \item Standard output will be used for showing the result of
+ commands.
+ \end{enumerate}
+
+ \item The trainer program will be a python file able to be executed by the
+ python interpreter.
+
+ \item The engine program will make use of standard input and standard output
+ for communication.
+ \begin{enumerate}
+ \item Standard input will be used for reading commands.
+ \item Standard output will be used for showing the result of
+ commands.
+ \end{enumerate}
+
+\end{enumerate}
+
+\subsubsection{Response Time Requirements}
+
+\setlist[enumerate,1]{label=RTR \arabic*.}
+
+\begin{enumerate}
+
+%TODO: Check and update this to something feasible
+ \item The maximum thinking time of the engine will be configurable.
+ \begin{enumerate}
+ \item It will be possible to pass the maximum time as a launch
+ argument.
+ \item It will be possible to store the maximum time as a setting
+ in a configuration file.
+ \end{enumerate}
+
+\end{enumerate}
+
+\setlist[enumerate,1]{label=\arabic*.}
+
+\subsection{Subsystems}
+
+There will be three main subsystems.
+
+\subsubsection{Game System}
+
+The Game System will be in charge of storing all the state information regarding
+a Go match, such as the history of moves, the possible variations, the state of
+the board at any given time or the current number of captured stones.
+
+This system will include a command-line interface with which to play Go matches
+between human players to show and test its capabilities.
+
+\subsubsection{Engine System}
+
+The Engine System will implement the GTP interface and use the Game System to
+analyse positions and generate moves via decision algorithms.
+
+This system can be directly called to manually set up game states and ask for
+moves or can be called by other programs which use GTP to be used as backend for
+playing matches against a computer player.
+
+\subsubsection{Training System}
+
+The Training System will process SGF files storing records of games, train the
+neural network models over those games and store the result. These models can
+then be imported by the engine and be used to generate moves.
+
+\subsubsection{Interface Between Subsystems}
+
+The Training System depends on the NeuralNetwork interface of the Engine System
+and uses it to train and store the neural network models.
+
+Both the Engine and Training systems depend on the GameMove class of the Game
+System. The Engine System uses it to store the state of a game and provide it
+to the decision algorithms. The Training System uses it to create the internal
+representation of a game resulting from the processing of an SGF file.
+
+\subsection{Class Analysis}
+
+\subsubsection{Class Diagram}
+
+The classes resulting from the analysis phase are shown in
+\fref{fig:analysisClasses}.
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=\textwidth]{diagrams/analysisClasses.png}
+ \caption{General classes obtained from the analysis
+ phase.}\label{fig:analysisClasses}
+ \end{center}
+\end{figure}
+
+\subsubsection{Class Description}
+
+\newcommand{\interclassSpace}{30pt}
+
+\paragraph{Engine System}
+\indent \\
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{EngineIO} \\
+ \midrule
+ \textbf{Description} \\
+ Offers the interface with the engine. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Read input.} \\
+ \tabitem{Do some preprocessing.} \\
+ \tabitem{Forward commands to the engine logic component.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \tabitem{\textbf{start()}: Starts reading standard input in a loop.} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{EngineLogic} \\
+ \midrule
+ \textbf{Description} \\
+ Does the core logic and connects the different components of the engine. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Processes the commands and arguments forwarded by the IO
+ component.} \\
+ \tabitem{Handles the logic of the game by using components from the game
+ module.} \\
+ \tabitem{Calls a decision algorithm to generate moves.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\newcommand{\decisionAlgorithmMethods}{
+ \tabitem{\textbf{pickMove()}: Gives a move to play.} \\
+ \tabitem{\textbf{forceNextMove(coords)}: Notifies the system of a played
+ move so it can update its state accordingly.} \\
+ \tabitem{\textbf{clearBoard()}: Empties the move history. The algorithm will
+ now generate moves as from a new game.} \\
+}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{DecisionAlgorithm} \\
+ \midrule
+ \textbf{Description} \\
+ Interface for the decision algorithms to be used by the engine. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Analyzing game states and generating moves.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \textit{(Depends on the algorithm.)} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \decisionAlgorithmMethods
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{MonteCarloTreeSearch} \\
+ \midrule
+ \textbf{Description} \\
+ Implements the Monte Carlo Tree Search algorithm for exploring the tree of
+ the game and deciding on a move. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Analyzing game states and generating moves.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \tabitem{\textbf{root}: The root node of a tree representing of the current
+ game state and the explored possible moves from it.} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \decisionAlgorithmMethods
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{MCTSNode} \\
+ \midrule
+ \textbf{Description} \\
+ A node of the tree used by the Monte Carlo Tree Search algorithm. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Storing a specific state of a match.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \tabitem{\textbf{visits}: How many times the node has been visited.} \\
+ \tabitem{\textbf{score}: The number of explorations of the node resulting in
+ victory.} \\
+ \tabitem{\textbf{move}: A GameMove for accessing game state and logic.} \\
+ \tabitem{\textbf{parent}: This node's parent in the tree.} \\
+ \tabitem{\textbf{children}: The nodes following from this node in the tree.}
+ \\
+ \tabitem{\textbf{unexploredVertices}: The plays which could be explored from
+ this node.} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \tabitem{\textbf{ucbForPlayer()}: Computes the Upper Confidence Bound of the
+ node from the perspective of the player making the move stored in the node.}
+ \\
+ \tabitem{\textbf{selection()}: Monte Carlo Tree Search selection step.
+ Selects the most promising node which still has some unexplored children.}
+ \\
+ \tabitem{\textbf{expansion()}: Monte Carlo Tree Search expansion step. Picks
+ an unexplored vertex from the node and adds it as a new MCTSNode.} \\
+ \tabitem{\textbf{expansionForCoords()}: Performs an expansion for the given
+ coordinates. This represents forcing a move on the algorithm.} \\
+ \tabitem{\textbf{simulation()}: Play random matches to accumulate reward
+ information on the node.} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{Keras} \\
+ \midrule
+ \textbf{Description} \\
+ Implements the DecisionAlgorithm interface to give access to a neural
+ network. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Analyzing game states and generating moves.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \tabitem{\textbf{currentMove}: A GameMove for accessing game state and
+ logic.} \\
+ \tabitem{\textbf{neuralNetwork}: A NeuralNetwork instance for generating
+ moves.} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \decisionAlgorithmMethods
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{NeuralNetwork} \\
+ \midrule
+ \textbf{Description} \\
+ Manages the neural networks used by the engine. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Analyzing game states and generating moves.} \\
+ \tabitem{Generating a new neural network.} \\
+ \tabitem{Loading a model file to use an existing trained neural network.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \tabitem{\textbf{currentMove}: A GameMove for accessing game state and
+ logic.} \\
+ \tabitem{\textbf{neuralNetwork}: A NeuralNetwork instance for generating
+ moves.} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \tabitem{\textbf{pickMove()}: Uses the current internal model to pick a move
+ given a game state.} \\
+ \tabitem{\textbf{trainModel()}: Receives a list of games, with each game
+ being a list of moves, and trains the network on them.} \\
+ \tabitem{\textbf{saveModel()}: Saves the current internal neural network
+ model.} \\
+ \tabitem{\textbf{saveHeatmap()}: Saves an image of a heatmap of move
+ likelihood.} \\
+ \tabitem{\textbf{saveModelPlot()}: Saves an image of a plot of the model
+ configuration.} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\paragraph{Game System}
+
+\indent \\
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{GameState} \\
+ \midrule
+ \textbf{Description} \\
+ Stores the state of a match. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Store state information.} \\
+ \tabitem{Offer methods to manipulate the game state.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \tabitem{\textbf{getCurrentPlayer()}: Returns the player who should play
+ next.} \\
+ \tabitem{\textbf{playMove()}: Play a move in the specified coordinates
+ for the specified player.} \\
+ \tabitem{\textbf{playMoveForPlayer()}: Play a move in the specified coordinates
+ for the player who should play next.} \\
+ \tabitem{\textbf{undo()}: Reset the state to how it was just before the
+ last move was played.} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{GameBoard} \\
+ \midrule
+ \textbf{Description} \\
+ Stores the state of a board position and handles its logic. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Store the vertices of a board position.} \\
+ \tabitem{Logic related to a board position.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \tabitem{\textbf{board}: An array of the stones on the board.} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \tabitem{\textbf{getGroupLiberties()}: Returns a set with the empty vertices
+ adjacent to the group occupying a vertex.} \\
+ \tabitem{\textbf{getGroupLibertiesCount()}: Returns the number of liberties
+ of the group occupying a vertex.} \\
+ \tabitem{\textbf{getGroupVertices()}: Returns a set with the vertices of the
+ group occupying a vertex.} \\
+ \tabitem{\textbf{getGroupVerticesCount()}: Returns the number of stones of
+ the group occupying a vertex.} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{GameMove} \\
+ \midrule
+ \textbf{Description} \\
+ Stores information about a specific move and its relationships to the
+ previous and next moves. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Store information about a move (board, player, coordinates\ldots).} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \tabitem{\textbf{board}: The board as of this move.} \\
+ \tabitem{\textbf{nextMoves}: The list of moves played after this
+ one. Different moves represent different game variations.} \\
+ \tabitem{\textbf{previousMove}: The move before this one.} \\
+ \tabitem{\textbf{isPass}: True if the move is a pass and not a stone
+ placement.} \\
+ \tabitem{\textbf{coords}: The coordinates of the board the move was
+ played at. Has no meaning if \textbf{isPass} is true.} \\
+ \tabitem{\textbf{playerWhoPassed}: The player who made this move. Has no
+ meaning if \textbf{isPass} is false, since the player can be obtained from
+ the coordinates of the move when it is not a pass.} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \tabitem{\textbf{getRow()}: Returns the row the move was played at.} \\
+ \tabitem{\textbf{getCol()}: Returns the col the move was played at.} \\
+ \tabitem{\textbf{getPlayer()}: Returns the player who played the move.} \\
+ \tabitem{\textbf{getNextPlayer()}: Returns the player who should play after
+ this move.} \\
+ \tabitem{\textbf{getGameLength()}: Returns the number of moves the game has
+ had.} \\
+ \tabitem{\textbf{getPlayableVertices()}: Returns the legal vertices for the
+ next move.} \\
+ \tabitem{\textbf{addMove()}: Inserts a new children move for the given
+ coordinates and for the player who should make the next move.} \\
+ \tabitem{\textbf{addMoveForPlayer()}: Inserts a new children move for the given
+ coordinates and player.} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{GameBoard} \\
+ \midrule
+ \textbf{Description} \\
+ Represents a board. Contains played stones and the amount of captures made
+ by each player. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Store a specific layout of stones in the board.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \tabitem{\textbf{board}: An array containing the stone layout.} \\
+ \tabitem{\textbf{capturesBlack}: The stones captured by black before the
+ position.} \\
+ \tabitem{\textbf{capturesWhite}: The stones captured by white before the
+ position.} \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \tabitem{\textbf{getBoardHeight()}: Returns the number of rows of the board.} \\
+ \tabitem{\textbf{getBoardWidth()}: Returns the number of columns of the board.} \\
+ \tabitem{\textbf{getGroupLiberties()}: Returns a list with the empty
+ vertices adjacent to the group occupying a vertex.} \\
+ \tabitem{\textbf{getGroupVertices()}: Returns a list with the vertices
+ occupied by the group occupying a vertex.} \\
+ \tabitem{\textbf{moveAndCapture()}: Makes a move and captures the
+ corresponding stones if the move results in the capture of a group.} \\
+ \tabitem{\textbf{score()}: Gets the current score based on the already
+ surrounded territory. This follows Japanese rules.} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\paragraph{Training System}
+
+\indent \\
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{Trainer} \\
+ \midrule
+ \textbf{Description} \\
+ Provides the neural networks with moves to train on. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Obtain moves from stored records of matches.} \\
+ \tabitem{Provide neural networks with moves to train on.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ %TODO: Explain why this is empty
+ \midrule
+ \textbf{Proposed methods} \\
+ \tabitem{\textbf{loadGameTree()}: Reads a file and generates a GameMove tree
+ from its contents.} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{Parser} \\
+ \midrule
+ \textbf{Description} \\
+ Reads SGF files and converts them to a tree of GameMove from the Game
+ System. \\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Read SGF files.} \\
+ \tabitem{Convert the content of the SGF files to a tree of GameMove.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ %TODO: Explain why this is empty
+ \midrule
+ \textbf{Proposed methods} \\
+ %TODO: Explain why this is empty
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{tabular}{p{0.9\linewidth}}
+ \toprule
+ \textbf{ASTNode} \\
+ \midrule
+ \textbf{Description} \\
+ Makes up the tree resulting from the parsing of an SGF file.\\
+ \midrule
+ \textbf{Responsibilities} \\
+ \tabitem{Obtain a GameMove tree from itself and its children.} \\
+ \midrule
+ \textbf{Proposed attributes} \\
+ \tabitem{\textbf{children}: The nodes following from itself.} \\
+ \tabitem{\textbf{props}: The properties of the tree read from an SGF file.}
+ \\
+ \midrule
+ \textbf{Proposed methods} \\
+ \tabitem{\textbf{toGameTree()}: Returns a GameMove tree corresponding to the
+ tree following from this node.} \\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\subsection{System Actors}
+
+There are various actors who will interact with the system, both human and
+non-human.
+
+\begin{itemize}
+
+ \item The human player who interacts with the playing interface.
+ \item The human user who interacts with the engine.
+ \item A GUI software which uses the engine to generate moves.
+
+\end{itemize}
+
+\subsection{Use Cases}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=\textwidth]{diagrams/useCases.png}
+ \caption{Use cases.}
+ \label{fig:useCases}
+ \end{center}
+\end{figure}
+
+The different actors and use cases are represented on \fref{fig:useCases}. Each
+use case is explained next.
+
+\paragraph{Play a match}
+
+The game interface reads the moves presented by the player and shows their
+result on the board.
+
+\paragraph{Use as backend for machine player}
+
+The engine is used as the backend for generating moves for a machine player,
+this is, for automated play, either against a human who is using the GUI or
+against another machine player.
+
+\paragraph{Generate a move}
+
+The engine interface reads the input for generating a move as stated by the
+GTP protocol and outputs the coordinates of the board to play.
+
+\subsection{Use Case Analysis and Scenarios}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=0.8\textwidth]{diagrams/useCase_playAMatch.png}
+ \caption{Use case: Play a match.}
+ \label{fig:useCase_playAMatch}
+ \end{center}
+\end{figure}
+
+\begin{tabular}{lp{0.6\linewidth}}
+ \toprule
+ \multicolumn{2}{c}{\textbf{Play a match}} \\
+ \midrule
+ \textbf{Preconditions} & The game interface has been started. \\
+ \midrule
+ \textbf{Postconditions} & The program terminates after a match has been
+ played. \\
+ \midrule
+ \textbf{Actors} & Human player \\
+ \midrule
+ \textbf{Description} &
+ 1. The user enters the move to make.\newline
+ 2. The result of playing that move is outputted by the program.\newline
+ 3. Stop the program if the game has ended or go back to 1 if not. \\
+ \midrule
+ \textbf{Secondary scenarios} &
+ \textbf{The move is illegal}: An error message is shown. Go back to step 1 of
+ main scenario. \\
+ \midrule
+ \textbf{Exceptions} &
+ \textbf{The input is wrong}: An error message is shown. Go back to step 1 of
+ main scenario. \\
+ \midrule
+ \textbf{Notes} &
+ This scenario does not pretend to be a complete recreation of a go match. It
+ will be playable, but its main purpose is to see the Game implementation in
+ action.\newline
+ A robustness diagram for this scenario is shown in
+ \fref{fig:useCase_playAMatch}.\\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=\textwidth]{diagrams/useCase_generateAMove.png}
+ \caption{Use case: Generate a move.}
+ \label{fig:useCase_generateAMove}
+ \end{center}
+\end{figure}
+
+\begin{tabular}{lp{0.6\linewidth}}
+ \toprule
+ \multicolumn{2}{c}{\textbf{Generate a move}} \\
+ \midrule
+ \textbf{Preconditions} & The game engine has been started. \newline
+ Optionally, some moves have already been played. \\
+ \midrule
+ \textbf{Postconditions} & A move is suggested via the engine output. \\
+ \midrule
+ \textbf{Actors} & Human user and GUI program. \\
+ \midrule
+ \textbf{Description} &
+ 1. The user or program enters the player to generate the move
+ for.\newline
+ 2. The suggested move is outputted by the engine, either as
+ coordinates or as an indication to pass.
+ \\
+ \midrule
+ \textbf{Secondary scenarios} &
+ \textbf{The move is illegal}: An error message is shown. Go back to step 1 of
+ main scenario. \\
+ \midrule
+ \textbf{Exceptions} &
+ \textbf{The input is wrong}: An error message is shown. Go back to step 1 of
+ main scenario. \\
+ \midrule
+ \textbf{Notes} &
+ A robustness diagram for this scenario is shown in
+ \fref{fig:useCase_generateAMove}.\\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=\textwidth]{diagrams/useCase_useAsBackend.png}
+ \caption{Use case: Use as backend for machine player.}
+ \label{fig:useCase_useAsBackend}
+ \end{center}
+\end{figure}
+
+\begin{tabular}{lp{0.6\linewidth}}
+ \toprule
+ \multicolumn{2}{c}{\textbf{Use as backend for machine player}} \\
+ \midrule
+ \textbf{Preconditions} & The game engine has been configured as engine for
+ the software. \\
+ \midrule
+ \textbf{Postconditions} & A match has been played against the engine. \\
+ \midrule
+ \textbf{Actors} & GUI program. \\
+ \midrule
+ \textbf{Description} &
+ 1. The program gives commands to the engine to set up the game. The
+ specific commands will vary from program to program.\newline
+ 2. The program asks the engine for a move.\newline
+ 3. The engine suggest a move to the program.\newline
+ 4. The moves are shown by the program as if made by a player.\newline
+ 5. The opponent gives a move to the program.\newline
+ 6. Repeat from step 2 until the game ends. \\
+ \midrule
+ \textbf{Secondary scenarios} &
+ ---\\
+ \midrule
+ \textbf{Exceptions} &
+ ---\\
+ \midrule
+ \textbf{Notes} &
+ A robustness diagram for this scenario is shown in
+ \fref{fig:useCase_useAsBackend}.\\
+ \bottomrule
+\end{tabular}
+
+\vspace{\interclassSpace}
+
+\subsection{Testing Plan Specification}
+
+\subsubsection{Unitary Testing}
+
+Tests for the python code are developed using the unittest\cite{python_unittest}
+testing framework. It has been chosen by virtue of being thoroughly documented
+and widely used.
+
+The coverage of unit testing is checked with Coverage.py\cite{python_coverage},
+which can by itself run the unittest tests and generate coverage reports based
+on the results.
+
+% Maybe put an example report here?
diff --git a/doc/tex/systemDesign.tex b/doc/tex/systemDesign.tex
new file mode 100644
index 0000000..80a2ccb
--- /dev/null
+++ b/doc/tex/systemDesign.tex
@@ -0,0 +1,324 @@
+\section{System Design}
+
+\subsection{Class Diagram}
+
+The full class diagram is shown in \fref{fig:fullClasses}.
+
+\begin{figure}[h]
+ \begin{center}
+ \makebox[0pt]{\begin{minipage}{1.2\textwidth}
+ \includegraphics[width=\textwidth]{diagrams/fullClasses.png}
+ \caption{Full class diagram.}
+ \label{fig:fullClasses}
+ \end{minipage}}
+ \end{center}
+\end{figure}
+
+The design of each system of the diagram is explained after this section
+together with diagrams for each subsystem, since the full class diagram can be
+too big to be comfortably analyzed.
+
+\subsection{Game}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=0.55\textwidth]{diagrams/gameModule.png}
+ \caption{Design of the implementation of the game of Go.}
+ \label{fig:game}
+ A game is represented as a tree of moves.
+ \end{center}
+\end{figure}
+
+A regular Go match is composed of a list of moves. But since game review and
+variants exploration is an important part of Go learning, \program{} and most
+playing and analysis existing programs allow for navigation back and forth
+through the board states of a match and for new variants to be created from each
+of these board states. Therefore, a match is represented as a tree of moves. The
+GameMove class has the information about a specific move and also a reference to
+the previous move and to a list of following moves, implementing this tree
+structure and allowing for navigating both forward and backwards in the move
+history.
+
+The state of the board at any given move must be stored so liberties, captures
+count and legality of moves can be addressed, so it is represented with the
+GameState class, which holds a reference to the current move.
+
+Moves depend on a representation of the game board to have access to its current
+layout and count of captured stones. There are also many logic operations needed
+to be performed on the board, such as getting the stones in a group, counting
+their liberties or checking if a move is playable. The layout of the board and
+these operations are implemented as the GameBoard class.
+
+A game can be started by the executable \texttt{go.py}.
+
+These classes and their relationships can be seen in \fref{fig:game}.
+
+\subsection{Engine}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=0.8\textwidth]{diagrams/engineModule.png}
+ \caption{Design of the GTP engine.}\label{fig:engine}
+ \end{center}
+\end{figure}
+
+An implementation of GTP, that is, the piece of software which offers the GTP
+interface to other applications. It is designed to be used by a software
+controller but can also be directly run, mostly for debugging purposes. Its
+design is shown in \fref{fig:engine}. The core of the engine is related with
+three components, each with a separate responsibility:
+
+\begin{itemize}
+
+ \item The ImagoIO component is the one imported from executables or other
+ applications and offers the text interface. It reads and processes input
+ and calls corresponding commands from the core of the engine.
+
+ \item The GameEngine contains the logic of the commands available from the
+ IO component. It uses a GameState to keep a record of the game and uses
+ a DecisionAlgorithm to generate moves.
+
+ \item The DecisionAlgorithm component is responsible of analyzing the match
+ and generate moves. The engine core uses it when a decision has to be
+ made by the AI, such as when a move needs to be generated by the engine.
+
+\end{itemize}
+
+Two implementations of DecisionAlgorithm have been made: one for the Monte
+Carlo Tree Search algorithm (on the MCTS class) and the other for neural
+networks (on the Keras class).
+
+The Keras class also makes use of the NeuralNetwork class, which offers
+functions for creating, training, saving and using neural network models. The
+designs of the network are implemented in the subclasses DenseNeuralNetwork and
+ConvNeuralNetwork as examples of dense and convolutional networks, respectively.
+
+The engine can be started with the executable \texttt{imagocli.py}.
+
+\subsubsection{Monte Carlo Tree Search Explained}
+
+Monte Carlo Tree Search is an algorithm that can be useful for exploring
+decision trees. It was used by AlphaGo in conjunction with neural networks as
+explained in the AlphaGo 2016 paper\cite{natureAlphaGo2016}.
+
+The algorithm assigns a score to each explored node based on how likely the
+player who makes the corresponding move is to win and updates this score on each
+exploration cycle.
+
+The exploration of the tree has 4 steps:
+
+\begin{enumerate}
+
+ \item \textbf{Selection}: The most promising move with unexplored children
+ is selected for exploration. Unexplored children are viable moves which
+ are not yet part of the tree.
+
+ \item \textbf{Expansion}: An unexplored children of the selected move is
+ added to the tree. This children is selected at random.
+
+ \item \textbf{Simulation}: The score of the new move is evaluated by playing
+ random matches from it.
+
+ \item \textbf{Backpropagation}: The score of the new move, as well as its
+ previous moves up to the root of the tree, is updated based on the
+ results of the simulation.
+
+\end{enumerate}
+
+The suggested move is the children of the current move with the best score from
+the perspective of the player which has to make the move.
+
+The implementation of the algorithm will use the existing GameMove class from
+the Game System to access the game logic it needs, such as to get the possible
+children from a node or to simulate random games.
+
+\subsubsection{Neural Networks Explained}
+
+A neural network is composed of nodes or ``neurons''. Each node contains a value
+named weight. During execution the node receives a numeric input, multiplies it
+for its weight and applies a function called activation function to the result.
+
+Nodes are organized in layers so that a network contains several layers and each
+layer one or more neurons. The input to the network forms the input layer, which
+contents are forwarded to the second layer. The second layer applies the weight
+and activation function as discussed before in each of its nodes and the result
+is forwarded to the next layer, and so on. At the end the last layer, called the
+output layer, contains the result of the input evaluation. Each layer can have a
+unique activation function for all its nodes and a different strategy of
+connecting to the previous and next layers.
+
+Several kinds of layers have been used in this project:
+
+\begin{itemize}
+
+ \item \textbf{Dense layers}, which connects each of its nodes to each of the
+ nodes of the previous layers.
+
+ \item \textbf{Convolutional layers}, which process their input by applying
+ a filter function to adjacent values. In the case of this project, the
+ board is filtered by grouping its vertices in 3x3 squares. The aim of
+ these layers is to detect patterns in the input, such as curves, edges
+ or more complex shapes, so they are used a lot on neural networks
+ processing images. They are used in this project because a configuration
+ of the Go board is not that different from a two-dimensional image.
+
+ \item \textbf{Max pooling layers}, which process their input in a similar
+ way to convolutional layers, but reducing the size of the input by
+ keeping the highest value in each of the groups they process. This
+ reduction accentuates the patterns detected by convolutional layers and
+ helps on the detection of bigger, more complex patterns.
+
+ \item \textbf{Flatten layers}, which just change the shape of the input so
+ that all the values are on one dimension.
+
+\end{itemize}
+
+Combinations of these layers have been used to define two neural networks.
+
+First, a network using mainly dense layers as an example of a more general
+purpose design of a network.
+
+Then, a network with convolutional and max pooling layers to compare the
+approach used on image processing to the more general one and studying its
+utility on the analysis of the Go board.
+
+These networks have been implemented on the DenseNeuralNetwork and
+ConvNeuralNetwork classes, respectively.
+
+The networks have been designed to process boards of size 9x9, which is the
+introductory size to the game. It is the easiest both for the hardware to handle
+and for the analysis of results while keeping able to support meaningful
+matches.
+
+Both networks have the same design for their input and output.
+
+Their input is a three-dimensional matrix of size 9x9x2 with values either 0 or
+1. It represents two views of the board, one with ones as the stones of a player
+and the other with ones as the stones of the other player.
+
+Their output is a vector with 82 elements of type float. Classification networks
+typically use a vector of probabilities with one element for each class they are
+trying to classify. Here the classes are the 81 positions of the 9x9 board and
+the pass move, hence 82 total elements. Each element signifies the chance of
+playing that move for the input board position, so the element with the highest
+value represents the suggested move.
+
+\subsubsection{Dense Neural Network Design}
+
+\begin{listing}[h]
+ \inputminted{text}{listings/denseModel.txt}
+ \caption{Dense neural network model.}
+ \label{code:denseModel}
+\end{listing}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=0.7\textwidth]{img/models/denseModel.png}
+ \caption{Dense neural network model.}
+ \label{fig:denseNN}
+ \end{center}
+\end{figure}
+
+This network first uses two dense layers with 81 nodes each. This number has
+been selected so each node can have as input each of the vertices of the board.
+A flatten layer acts then to make the output one-dimensional, and a final dense
+layer provides the vector containing the likelihood of each possible move.
+
+The design of this network is shown in \flist{code:denseModel} and
+\fref{fig:denseNN} as provided by Keras' summary and plot\_model functions
+respectively.
+
+\subsubsection{Convolutional Neural Network Design}
+
+\begin{listing}[h]
+ \inputminted{text}{listings/convModel.txt}
+ \caption{Convolutional neural network model.}
+ \label{code:convModel}
+\end{listing}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=0.7\textwidth]{img/models/convModel.png}
+ \caption{Convolutional neural network model.}
+ \label{fig:convNN}
+ \end{center}
+\end{figure}
+
+This network uses two pairs of convolutional and max pooling layers with the aim
+of being trained to recognize patterns on the board. A flatten layer acts then
+to make the output one-dimensional, and a final dense layer provides the vector
+containing the likelihood of each possible move.
+
+The design of this network is shown in \flist{code:convModel} and
+\fref{fig:convNN} as provided by Keras' summary and plot\_model functions
+respectively.
+
+\subsection{Training}
+
+\begin{figure}[h]
+ \begin{center}
+ \includegraphics[width=\textwidth]{diagrams/trainingModule.png}
+ \caption{Components of the SGF file parsing module.}
+ \label{fig:trainingModule}
+ Components not showing a capital C are not classes, as in they not
+ follow the object-oriented paradigm and do not implement any classes,
+ only functions.
+ \end{center}
+\end{figure}
+
+Neural networks can be powerful machine learning algorithms, but they have to be
+trained first so they can provide meaningful results. For a Go AI it makes sense
+to have its algorithms trained on Go games. There exists a common text format to
+store Go games: SGF. If the system is able to process SGF files, it can provide
+the games stored on them to the neural networks for training. And so the need
+for an SGF parser arises.
+
+To parse SGF files a lexer and parser have been implemented using PLY.\@ The
+result of the parsing is an AST (Annotated Syntax Tree) reflecting the contents
+of the text input, each node with zero or more properties, and with the ability
+to convert themselves and their corresponding subtree into a GameMove tree. This
+is done for the root node, since from the SGF specification there are some
+properties only usable in the root node, like those which specify general game
+information and properties such as rank of players or komi.
+
+Here follows an explanation of the role and motivation before each component of
+the Training module to show how these previous concerns have been addressed and
+solved. These components are shown in \fref{fig:trainingModule}.
+
+\begin{itemize}
+
+ \item \textbf{SGF}: Provides a high-level method to convert a path to a SGF
+ file to a GameMove tree.
+
+ \item \textbf{sgfyacc}: The implementation of a SGF parser using PLY. Takes
+ the tokens generated by \textbf{sgflex} and creates an ASTNode tree from
+ them.
+
+ \item \textbf{sgflex}: The implementation of a SGF lexer using PLY.\@ Takes
+ text input and generates the tokens of the SGF language from them.
+
+ \item \textbf{ASTNode}: The AST resulting from the parsing of a SGF file.
+ Has a method to convert it to a tree of GameMove and so obtain the
+ contents of the SGF in the internal representation used by the project's
+ systems.
+
+ \item \textbf{Property}: The representation of a property of an ASTNode
+ tree. Each property is made of a name and one or more values and this
+ class helps handling this specific situation.
+
+The training can be started with the executable \texttt{train.py}.
+
+\end{itemize}
+
+%\subsection{Modules}
+%
+%One module to store the state of the game and the game tree. One module to parse
+%moves. One module to read and write SGF files. Modules are shown in
+%\fref{fig:modules}.
+%
+%\begin{figure}[h]
+% \begin{center}
+% \includegraphics[width=\textwidth]{diagrams/modules.png}
+% \caption{Modules.}\label{fig:modules}
+% \end{center}
+%\end{figure}
diff --git a/doc/tex/tfg.tex b/doc/tex/tfg.tex
deleted file mode 100644
index 9248748..0000000
--- a/doc/tex/tfg.tex
+++ /dev/null
@@ -1,60 +0,0 @@
-\documentclass{article}
-
-\usepackage{geometry}
-\usepackage{graphicx}
-\usepackage{booktabs}
-\usepackage{hyperref}
-\usepackage{csquotes}
-
-\usepackage[backend=biber, style=numeric-comp]{biblatex}
-\addbibresource{/home/taamas/docs/biber.bib}
-
-\geometry{left=4.5cm,top=2cm,bottom=2cm,right=4.5cm}
-
-\hypersetup{colorlinks=true,
- linkcolor=black,
- filecolor=magenta,
- urlcolor=black,
- bookmarks=true
-}
-
-\urlstyle{mono}
-
-%\renewcommand{\contentsname}{Contenidos}
-%\renewcommand{\figurename}{Figura}
-
-\newcommand{\program}{Go-AI}
-
-\newcommand{\inputtex}[1]{\input{tex/#1}}
-\newcommand{\fref}[1]{Fig.~\ref{#1}}
-%\newcommand{\uurl}[1]{\underline{\url{#1}}}
-
-\begin{document}
-
-\frenchspacing
-
-\title{\program}
-
-\author{Íñigo Gutiérrez Fernández}
-
-\date{}
-
-\maketitle
-
-\begin{abstract}
- This is the abstract.
-\end{abstract}
-
-\tableofcontents
-
-\inputtex{introduction.tex}
-
-\inputtex{previousWorks.tex}
-
-\inputtex{interface.tex}
-
-\inputtex{implementation.tex}
-
-\printbibliography{}
-
-\end{document}
diff --git a/go.py b/go.py
index 548df38..cf0a673 100755
--- a/go.py
+++ b/go.py
@@ -2,29 +2,27 @@
"""Play Go!"""
-from imago.engine.parseHelpers import ParseCodes, parseVertex
+from imago.engine.parseHelpers import parseVertex
from imago.gameLogic.gameState import GameState
if __name__ == "__main__":
- #GAMESTATE = GameState(5)
- GAMESTATE = GameState(19)
+ GAMESTATE = GameState(9)
- while 1:
+ while True:
GAMESTATE.getBoard().printBoard()
move = input("Move (" + GAMESTATE.getPlayerCode() + "): ")
- move = parseVertex(move, GAMESTATE.size)
- if move == ParseCodes.ERROR:
+ try:
+ move = parseVertex(move, GAMESTATE.size)
+ except Exception as err:
print("Invalid move syntax. Example of move: A1")
continue
print()
- player = str(GAMESTATE.getPlayerCode())
-
moveRow = move[0]
moveCol = move[1]
diff --git a/imago/data/enums.py b/imago/data/enums.py
index 9d963ec..c790384 100644
--- a/imago/data/enums.py
+++ b/imago/data/enums.py
@@ -16,3 +16,9 @@ class Player(Enum):
if player == cls.WHITE:
return cls.BLACK
return cls.EMPTY
+
+class DecisionAlgorithms(Enum):
+ MONTECARLO = enumAuto()
+ KERAS = enumAuto()
+ DENSE = enumAuto()
+ CONV = enumAuto()
diff --git a/imago/engine/core.py b/imago/engine/core.py
index 28166b8..2bf7d5a 100644
--- a/imago/engine/core.py
+++ b/imago/engine/core.py
@@ -1,21 +1,21 @@
-#!/usr/bin/python
-
"""Imago GTP engine"""
-from random import randrange
-
-from imago.data.enums import Player
+from imago.data.enums import DecisionAlgorithms
+from imago.engine.createDecisionAlgorithm import create as createDA
from imago.gameLogic.gameState import GameState
-DEF_SIZE = 19
+DEF_SIZE = 9
DEF_KOMI = 5.5
+DEF_ALGORITHM = DecisionAlgorithms.KERAS
class GameEngine:
"""Plays the game of Go."""
- def __init__(self):
+ def __init__(self, decisionAlgorithmId = DEF_ALGORITHM):
self.komi = DEF_KOMI
self.gameState = GameState(DEF_SIZE)
+ self.daId = decisionAlgorithmId
+ self.da = createDA(self.daId, self.gameState.lastMove)
def setBoardsize(self, newSize):
"""Changes the size of the board.
@@ -23,19 +23,21 @@ class GameEngine:
It is wise to call clear_board after this command.
"""
self.gameState = GameState(newSize)
+ self.da = createDA(self.daId, self.gameState.lastMove)
def clearBoard(self):
"""The board is cleared, the number of captured stones reset to zero and the move
history reset to empty.
"""
self.gameState.clearBoard()
+ self.da.clearBoard()
def setKomi(self, komi):
"""Sets a new value of komi."""
self.komi = komi
def setFixedHandicap(self, stones):
- """Sets handicap stones in fixed vertexes."""
+ """Sets handicap stones in fixed vertices."""
if stones < 1 or stones > 9:
raise Exception("Wrong number of handicap stones")
# TODO: Set handicap stones
@@ -43,23 +45,20 @@ class GameEngine:
def play(self, color, vertex):
"""Plays in the vertex passed as argument"""
+ if vertex == "pass":
+ self.gameState.passForPlayer(color)
+ self.da.forceNextMove(vertex)
+ return
row = vertex[0]
col = vertex[1]
self.gameState.playMoveForPlayer(row, col, color)
+ self.da.forceNextMove(vertex)
def genmove(self, color):
- """The key of this TFG."""
- validCells = []
- board = self.gameState.getBoard().board
- size = self.gameState.size
- for row in range(size):
- for col in range(size):
- if board[row][col] == Player.EMPTY:
- validCells.append([row, col])
- randIndex = randrange(0, len(validCells))
- move = validCells[randIndex]
- self.gameState.playMoveForPlayer(move[0], move[1], color)
- return move
+ """Returns a list representing coordinates of the board in the form (row, col)."""
+ coords = self.da.pickMove()
+ self.play(color, coords)
+ return coords
def undo(self):
"""The board configuration and number of captured stones are reset to the state
diff --git a/imago/engine/createDecisionAlgorithm.py b/imago/engine/createDecisionAlgorithm.py
new file mode 100644
index 0000000..d7fafbf
--- /dev/null
+++ b/imago/engine/createDecisionAlgorithm.py
@@ -0,0 +1,21 @@
+"""Create decision algorithms"""
+
+from imago.data.enums import DecisionAlgorithms
+from imago.engine.monteCarlo import MCTS
+from imago.engine.keras.keras import Keras
+
+def create(algorithm, move):
+ """Creates an instance of the requested algorithm."""
+
+ if algorithm == DecisionAlgorithms.MONTECARLO:
+ return MCTS(move)
+
+ if algorithm == DecisionAlgorithms.KERAS:
+ return Keras(move)
+
+ if algorithm == DecisionAlgorithms.DENSE\
+ or algorithm == DecisionAlgorithms.CONV:
+ return Keras(move, algorithm)
+
+ else:
+ return MCTS(move)
diff --git a/imago/engine/decisionAlgorithm.py b/imago/engine/decisionAlgorithm.py
new file mode 100644
index 0000000..5727d25
--- /dev/null
+++ b/imago/engine/decisionAlgorithm.py
@@ -0,0 +1,18 @@
+"""Decision algorithm interface."""
+
+class DecisionAlgorithm:
+
+ def __init__(self, move):
+ pass
+
+ def forceNextMove(self, coords):
+ """Selects given move as next move."""
+ raise NotImplementedError("Method forceNextMove not implemented on type %s" % type(self))
+
+ def pickMove(self):
+ """Returns a move to play."""
+ raise NotImplementedError("Method pickMove not implemented on type %s" % type(self))
+
+ def clearBoard(self):
+ """Empties move history."""
+ raise NotImplementedError("Method clearBoard not implemented on type %s" % type(self))
diff --git a/imago/engine/imagoIO.py b/imago/engine/imagoIO.py
index b929788..9b3e367 100644
--- a/imago/engine/imagoIO.py
+++ b/imago/engine/imagoIO.py
@@ -1,5 +1,3 @@
-#!/usr/bin/python
-
"""Imago GTP engine input output"""
import sys
@@ -7,17 +5,25 @@ import sys
from imago.engine import parseHelpers
from imago.engine.core import GameEngine
+def _response(text=""):
+ print("= %s" % text)
+ print()
+
+def _responseError(text=""):
+ print("? %s" % text)
+ print()
+
def protocol_version(_):
"""Version of the GTP Protocol"""
- print("2")
+ _response("2")
def name(_):
"""Name of the engine"""
- print("Imago")
+ _response("Imago")
def version(_):
"""Version of the engine"""
- print("0.0.0")
+ _response("0.0.0")
def getCoordsText(row, col):
"""Returns a string representation of row and col.
@@ -28,7 +34,7 @@ def getCoordsText(row, col):
class ImagoIO:
"""Recieves and handles commands."""
- def __init__(self):
+ def __init__(self, decisionAlgorithmId = None):
self.commands_set = {
protocol_version,
name,
@@ -45,44 +51,52 @@ class ImagoIO:
self.genmove,
self.undo
}
- self.gameEngine = GameEngine()
+ self.gameEngine = GameEngine(decisionAlgorithmId)
def start(self):
"""Starts reading commands interactively."""
- while True:
- input_tokens = input().split()
-
- if input_tokens[0] == "quit":
- sys.exit(0)
-
- command = None
- for comm in self.commands_set:
- if comm.__name__ == input_tokens[0]:
- command = comm
-
- if command is not None:
- arguments = input_tokens[1:]
- #print("[DEBUG]:Selected command: %s; args: %s" % (command, arguments))
- command(arguments)
- else:
- print("unknown command")
+ try:
+ while True:
+ input_tokens = input().split()
+
+ if len(input_tokens) == 0:
+ continue
+
+ if input_tokens[0] == "quit":
+ sys.exit(0)
+
+ command = None
+ for comm in self.commands_set:
+ if comm.__name__ == input_tokens[0]:
+ command = comm
+
+ if command is not None:
+ arguments = input_tokens[1:]
+ #print("[DEBUG]:Selected command: %s; args: %s" % (command, arguments))
+ command(arguments)
+ else:
+ _responseError("unknown command")
+ except Exception as err:
+ _responseError("An uncontrolled error ocurred. The error was: %s" % err)
def known_command(self, args):
"""True if command is known, false otherwise"""
if len(args) != 1:
- print ("Wrong number of args.")
- print ("Usage: known_command COMMAND_NAME")
- sys.exit(0)
+ _responseError("Wrong number of arguments.")
+ _responseError("Usage: known_command COMMAND_NAME")
+ return
out = "false"
for c in self.commands_set:
if c.__name__ == args[0]:
out = "true"
- print(out)
+ _response(out)
def list_commands(self, _):
"""List of commands, one per row"""
+ output = ""
for c in self.commands_set:
- print("%s - %s" % (c.__name__, c.__doc__))
+ output += ("%s - %s\n" % (c.__name__, c.__doc__))
+ _response(output)
def boardsize(self, args):
"""Changes the size of the board.
@@ -90,38 +104,44 @@ class ImagoIO:
It is wise to call clear_board after this command.
"""
if len(args) != 1:
- print("Error - Wrong n of args")
- sys.exit(1)
+ _responseError("Wrong number of arguments")
+ _responseError("Usag. boardsize <newSize>")
+ return
size = int(args[0])
self.gameEngine.setBoardsize(size)
+ _response()
def clear_board(self, _):
"""The board is cleared, the number of captured stones reset to zero and the move
history reset to empty.
"""
self.gameEngine.clearBoard()
+ _response()
def komi(self, args):
"""Sets a new value of komi."""
if len(args) != 1:
- print("Error - Wrong n of args")
- sys.exit(1)
+ _responseError("Wrong number of arguments")
+ _responseError("Usage: komi <newKomi>")
+ return
komi = float(args[0])
self.gameEngine.setKomi(komi)
+ _response()
def fixed_handicap(self, args):
"""Handicap stones are placed on the board on standard vertices.
These vertices follow the GTP specification.
"""
if len(args) != 1:
- print("Error - Wrong n of args")
- sys.exit(1)
+ _responseError("Wrong number of arguments")
+ _responseError("Usage: fixed_handicap <count>")
+ return
stones = float(args[0])
vertices = self.gameEngine.setFixedHandicap(stones)
out = getCoordsText(vertices[0][0], vertices[0][1])
for vertex in vertices[1:]:
out += " " + getCoordsText(vertex[0], vertex[1])
- print(out)
+ _response(out)
def place_free_handicap(self, args):
"""Handicap stones are placed on the board by the AI criteria."""
@@ -134,20 +154,23 @@ class ImagoIO:
def play(self, args):
"""A stone of the requested color is played at the requested vertex."""
if len(args) != 2:
- print("Error - Wrong n of args")
- sys.exit(1)
+ _responseError("Wrong number of arguments.")
+ _responseError("Usage: play <color> <vertex>")
+ return
move = parseHelpers.parseMove(args, self.gameEngine.gameState.size)
self.gameEngine.play(move.color, move.vertex)
+ _response()
def genmove(self, args):
"""A stone of the requested color is played where the engine chooses."""
if len(args) != 1:
- print("Error - Wrong n of args")
- sys.exit(1)
+ _responseError("Wrong number of arguments.")
+ _responseError("Usage: genmove <color>")
+ return
color = parseHelpers.parseColor(args[0])
output = parseHelpers.vertexToString(self.gameEngine.genmove(color),
self.gameEngine.gameState.size)
- print(output)
+ _response(output)
self.gameEngine.gameState.getBoard().printBoard()
def undo(self, _):
diff --git a/imago/engine/keras/__init__.py b/imago/engine/keras/__init__.py
new file mode 100644
index 0000000..e69de29
--- /dev/null
+++ b/imago/engine/keras/__init__.py
diff --git a/imago/engine/keras/convNeuralNetwork.py b/imago/engine/keras/convNeuralNetwork.py
new file mode 100644
index 0000000..638e2fe
--- /dev/null
+++ b/imago/engine/keras/convNeuralNetwork.py
@@ -0,0 +1,54 @@
+"""Convolutional neural network."""
+
+from tensorflow.keras.models import Sequential
+from tensorflow.keras.layers import Conv2D, MaxPool2D, Flatten, Dense
+from tensorflow.keras.optimizers import Adam
+
+from imago.engine.keras.neuralNetwork import NeuralNetwork
+
+class ConvNeuralNetwork(NeuralNetwork):
+
+ NETWORK_ID = "convNeuralNetwork"
+ DEFAULT_MODEL_FILE = 'models/imagoConvKerasModel.h5'
+
+ def _initModel(self, boardSize=NeuralNetwork.DEF_BOARD_SIZE):
+ model = Sequential([
+ Conv2D(
+ filters=32,
+ kernel_size=(3,3),
+ activation='relu',
+ padding='same',
+ input_shape=(boardSize,boardSize,2)
+ ),
+ MaxPool2D(
+ pool_size=(2,2),
+ strides=2,
+ padding='valid'
+ ),
+ Conv2D(
+ filters=64,
+ kernel_size=(3,3),
+ activation='relu',
+ padding='same'
+ ),
+ MaxPool2D(
+ pool_size=(2,2),
+ strides=2,
+ padding='valid'
+ ),
+ Flatten(),
+ Dense(
+ units=82,
+ activation='softmax'
+ ),
+ ])
+
+ model.summary()
+
+ model.compile(
+ optimizer=Adam(learning_rate=0.0001),
+ loss='categorical_crossentropy',
+ metrics=['accuracy']
+ )
+
+ return model
diff --git a/imago/engine/keras/denseNeuralNetwork.py b/imago/engine/keras/denseNeuralNetwork.py
new file mode 100644
index 0000000..6a350f7
--- /dev/null
+++ b/imago/engine/keras/denseNeuralNetwork.py
@@ -0,0 +1,40 @@
+"""Dense neural network."""
+
+from tensorflow.keras.models import Sequential
+from tensorflow.keras.layers import Dense, Flatten
+from tensorflow.keras.optimizers import Adam
+
+from imago.engine.keras.neuralNetwork import NeuralNetwork
+
+class DenseNeuralNetwork(NeuralNetwork):
+
+ NETWORK_ID = "denseNeuralNetwork"
+ DEFAULT_MODEL_FILE = "models/imagoDenseKerasModel.h5"
+
+ def _initModel(self, boardSize=NeuralNetwork.DEF_BOARD_SIZE):
+ model = Sequential([
+ Dense(
+ units=81,
+ activation="relu",
+ input_shape=(boardSize,boardSize,2)
+ ),
+ Dense(
+ units=81,
+ activation="relu"
+ ),
+ Flatten(),
+ Dense(
+ units=82,
+ activation="softmax"
+ ),
+ ])
+
+ model.summary()
+
+ model.compile(
+ optimizer=Adam(learning_rate=0.0001),
+ loss="categorical_crossentropy",
+ metrics=["accuracy"]
+ )
+
+ return model
diff --git a/imago/engine/keras/initialDenseNeuralNetwork.py b/imago/engine/keras/initialDenseNeuralNetwork.py
new file mode 100644
index 0000000..dfe8379
--- /dev/null
+++ b/imago/engine/keras/initialDenseNeuralNetwork.py
@@ -0,0 +1,28 @@
+"""Dense neural network."""
+
+from tensorflow.keras.models import Sequential
+from tensorflow.keras.layers import Dense
+from tensorflow.keras.optimizers import Adam
+
+from imago.engine.keras.neuralNetwork import NeuralNetwork
+
+defaultModelFile = 'models/imagoDenseKerasModel.h5'
+
+class DenseNeuralNetwork(NeuralNetwork):
+
+ def _initModel(self, boardSize=NeuralNetwork.DEF_BOARD_SIZE):
+ model = Sequential([
+ Dense(units=16, activation='relu', input_shape=(boardSize,boardSize)),
+ Dense(units=32, activation='relu'),
+ Dense(units=boardSize, activation='softmax')
+ ])
+
+ model.summary()
+
+ model.compile(
+ optimizer=Adam(learning_rate=0.0001),
+ loss='categorical_crossentropy',
+ metrics=['accuracy']
+ )
+
+ return model
diff --git a/imago/engine/keras/keras.py b/imago/engine/keras/keras.py
new file mode 100644
index 0000000..871f4a0
--- /dev/null
+++ b/imago/engine/keras/keras.py
@@ -0,0 +1,49 @@
+"""Keras neural network module."""
+
+from imago.data.enums import DecisionAlgorithms
+from imago.gameLogic.gameMove import GameMove
+from imago.gameLogic.gameBoard import GameBoard
+from imago.engine.decisionAlgorithm import DecisionAlgorithm
+from imago.engine.keras.neuralNetwork import NeuralNetwork
+
+DENSE_MODEL_FILE = "/home/taamas/IIS/TFG/imago/models/imagoDenseKerasModel.h5"
+CONV_MODEL_FILE = "/home/taamas/IIS/TFG/imago/models/imagoConvKerasModel.h5"
+DEF_MODEL_FILE = CONV_MODEL_FILE
+
+class Keras(DecisionAlgorithm):
+
+ def __init__(self, move, network=None):
+ self.currentMove = move
+ modelFile = DEF_MODEL_FILE
+ if network == DecisionAlgorithms.DENSE:
+ modelFile = DENSE_MODEL_FILE
+ elif network == DecisionAlgorithms.CONV:
+ modelFile = CONV_MODEL_FILE
+ elif network != None:
+ raise RuntimeError(
+ "Unknown decision algorithm code for neural network: %s" % network
+ )
+
+ self.neuralNetwork = NeuralNetwork(
+ modelFile,
+ move.board.getBoardHeight()
+ )
+
+ def forceNextMove(self, coords):
+ """Selects given move as next move."""
+ if coords == "pass":
+ self.currentMove = self.currentMove.addPass()
+ else:
+ self.currentMove = self.currentMove.addMoveByCoords(coords)
+
+ def pickMove(self):
+ """Returns a move to play."""
+ return self.neuralNetwork.pickMove(
+ self.currentMove,
+ self.currentMove.getNextPlayer()
+ )
+
+ def clearBoard(self):
+ """Empties move history."""
+ boardSize = self.currentMove.board.getBoardHeight()
+ self.currentMove = GameMove(GameBoard(boardSize, boardSize))
diff --git a/imago/engine/keras/neuralNetwork.py b/imago/engine/keras/neuralNetwork.py
new file mode 100644
index 0000000..c414a78
--- /dev/null
+++ b/imago/engine/keras/neuralNetwork.py
@@ -0,0 +1,217 @@
+"""Keras neural network."""
+
+import sys
+import os
+import os.path
+
+import numpy
+from matplotlib import pyplot
+
+from tensorflow.keras.models import load_model
+from tensorflow.keras.utils import plot_model
+
+from imago.data.enums import Player
+
+class NeuralNetwork:
+
+ DEF_BOARD_SIZE = 9
+
+ NETWORK_ID = "neuralNetwork"
+ DEFAULT_MODEL_FILE = "models/imagoKerasModel.h5"
+
+ def __init__(self, modelPath="", boardSize=DEF_BOARD_SIZE):
+ self.boardSize = boardSize
+ self.path = self.DEFAULT_MODEL_FILE
+ if modelPath != "":
+ self.path = modelPath
+ try:
+ self.model = self._loadModel(self.path)
+ except FileNotFoundError:
+ self.model = self._initModel(boardSize)
+ self.saveModelPlot("model.png")
+
+ def _initModel(self, boardSize=DEF_BOARD_SIZE):
+ raise NotImplementedError("Tried to directly use NeuralNetwork class. Use one of the subclasses instead.")
+
+ def trainModel(self, games):
+ trainMoves = []
+ targets = []
+ for game in games:
+ for move in self._movesToTrainMoves(game):
+ trainMoves.append(move)
+ for target in self._movesToTargets(game):
+ targets.append(target)
+ trainMoves = numpy.array(trainMoves)
+ targets = numpy.array(targets)
+ self.model.fit(
+ x=trainMoves,
+ y=targets,
+ validation_split=0.1,
+ batch_size=1,
+ epochs=20,
+ shuffle=False,
+ verbose=2
+ )
+
+ def _loadModel(self, modelPath):
+ # Load model
+ if os.path.isfile(modelPath):
+ return load_model(modelPath)
+ else:
+ raise FileNotFoundError("Keras neural network model file not found at %s"
+ % modelPath)
+
+ def saveModel(self, modelPath=""):
+ """Saves the neural network model at the given path."""
+ if modelPath != "":
+ self.model.save(modelPath)
+ else:
+ self.model.save(self.path)
+
+ def _movesToTrainMoves(self, moves):
+ trainMoves = []
+ for move in moves:
+ if len(move.nextMoves) == 0:
+ continue
+ player = move.nextMoves[0].getPlayer()
+ board = move.board.board
+ trainMove = self._boardToPlayerContext(board, player)
+ trainMoves.append(trainMove)
+ return trainMoves
+
+ def _boardToPlayerContext(self, board, player):
+ """Converts the board to a 3D matrix with two representations of the board, one
+ marking the player's stones and the other marking the opponent's stones."""
+ boardRows = len(board)
+ boardCols = len(board[0])
+ contextBoard = numpy.zeros((boardRows, boardCols, 2), dtype = float)
+ for row in range(boardRows):
+ for col in range(boardCols):
+ if board[row][col] != Player.EMPTY:
+ if board[row][col] == player:
+ contextBoard[row][col][0] = 1
+ else:
+ contextBoard[row][col][1] = 1
+ return contextBoard
+
+ def _movesToTargets(self, moves):
+ """Converts the moves to 2D matrices with values zero except for a one indicating
+ the played move."""
+ targets = []
+ targetsSize = self.boardSize * self.boardSize + 1 # Each vertex + 1 for pass
+ for move in moves:
+ if len(move.nextMoves) == 0:
+ continue
+ target = numpy.zeros(targetsSize, dtype = float)
+ nextMove = move.nextMoves[0]
+ if nextMove.isPass:
+ target[-1] = 1
+ else:
+ target[nextMove.getRow() * self.boardSize + nextMove.getCol()] = 1
+ targets.append(target.tolist())
+ return targets
+
+ def pickMove(self, gameMove, player):
+ """Uses the model's predict function to pick the highest valued vertex to play."""
+
+ predictionVector = self._predict(gameMove, player)[0]
+ predictionBoard = numpy.zeros((self.boardSize, self.boardSize))
+ for row in range(self.boardSize):
+ for col in range(self.boardSize):
+ predictionBoard[row][col] = predictionVector[row * self.boardSize + col]
+ predictionPass = predictionVector[-1]
+ self._saveHeatmap(predictionBoard, predictionPass)
+
+ # Search the highest valued vertex which is also playable
+ playableVertices = gameMove.getPlayableVertices()
+ highest = -sys.float_info.max
+ hRow = -1
+ hCol = -1
+ for row in range(self.boardSize):
+ for col in range(self.boardSize):
+ if predictionBoard[row][col] > highest and (row, col) in playableVertices:
+ hRow = row
+ hCol = col
+ highest = predictionBoard[row][col]
+
+ if highest < predictionPass:
+ return "pass"
+ return [hRow, hCol]
+
+ def _predict(self, gameMove, player):
+ board = gameMove.board.board
+ sampleBoards = self._boardToPlayerContext(board, player)
+ sampleBoards = numpy.array([sampleBoards])
+ return self.model.predict(
+ x = sampleBoards,
+ batch_size = 1,
+ verbose = 2)
+
+ def _saveHeatmap(self, data, passChance):
+ rows = len(data)
+ cols = len(data[0])
+
+ fig, (axBoard, axPass) = pyplot.subplots(1, 2, gridspec_kw={'width_ratios': [9, 1]})
+ imBoard = axBoard.imshow(data, cmap="YlGn")
+ axPass.imshow([[passChance]], cmap="YlGn", norm=imBoard.norm)
+
+ # Tick and label the board
+ axBoard.set_xticks(numpy.arange(cols))
+ axBoard.set_xticklabels(self._getLetterLabels(cols))
+ axBoard.set_yticks(numpy.arange(rows))
+ axBoard.set_yticklabels(numpy.arange(rows, 0, -1))
+
+ # Label the pass chance
+ axPass.set_xticks([0])
+ axPass.set_yticks([])
+ axPass.set_xticklabels(["Pass"])
+
+ # Loop over data dimensions and create text annotations.
+ textColorThreshold = data.max() / 2
+ for row in range(rows):
+ for col in range(cols):
+ textColor = ("k" if data[row, col] < textColorThreshold else "w")
+ axBoard.text(col, row, "%.2f"%(data[row, col]),
+ ha="center", va="center", color=textColor)
+
+ textColor = ("k" if passChance < textColorThreshold else "w")
+ axPass.text(0, 0, "%.2f"%(passChance),
+ ha="center", va="center", color=textColor)
+
+ pyplot.suptitle("Heat map of move likelihood")
+ #axBoard.set_title("Heat map of move likelihood")
+ fig.tight_layout()
+
+ #pyplot.show()
+ pyplot.savefig("heatmaps/heatmap_%s_%s_%d.png" %
+ (
+ self.NETWORK_ID,
+ self.path.replace('/','-'),
+ len([file for file in os.listdir("heatmaps")])
+ )
+ )
+
+ def _getLetterLabels(self, count):
+ labels = []
+ letter = 'A'
+ for _ in range(count):
+ labels.append(letter)
+ letter = chr(ord(letter) + 1)
+ # Skip I
+ if letter == 'I':
+ letter = 'J'
+ return labels
+
+ def saveModelPlot(self, path):
+ plot_model(
+ self.model,
+ to_file=path,
+ show_shapes=True,
+ show_dtype=True,
+ show_layer_names=True,
+ rankdir="TB",
+ expand_nested=True,
+ dpi=96,
+ layer_range=None,
+ show_layer_activations=True,
+ )
diff --git a/imago/engine/monteCarlo.py b/imago/engine/monteCarlo.py
new file mode 100644
index 0000000..baaaba8
--- /dev/null
+++ b/imago/engine/monteCarlo.py
@@ -0,0 +1,187 @@
+"""Monte Carlo Tree Search module."""
+
+import sys
+import random
+
+from imago.data.enums import Player
+from imago.engine.decisionAlgorithm import DecisionAlgorithm
+
+class MCTS(DecisionAlgorithm):
+ """Monte Carlo tree."""
+
+ def __init__(self, move):
+ self.root = MCTSNode(move, None)
+
+ def forceNextMove(self, coords):
+ """Selects given move as next move."""
+ if coords == "pass":
+ raise NotImplementedError("Pass not implemented for MCTS algorithm.")
+ for node in self.root.children:
+ if (node.move.getRow() == coords[0]
+ and node.move.getCol() == coords[1]):
+ self.root = node
+ return
+ self.root = self.root.expansionForCoords(coords)
+
+ def pickMove(self):
+ """
+ Performs an exploratory cycle, updates the root to the best node and returns its
+ corresponding move."""
+ #NOTE: with only one selection-expansion the match is
+ # completely random
+ for _ in range(5):
+ self.root.selection().expansion().simulation(10, 20)
+ selectedNode = self._selectBestNextNode()
+ return selectedNode.move.coords
+
+ def _selectBestNextNode(self):
+ """Returns best ucb node available for the current player."""
+
+ # Assumes at least one expansion has occurred
+ bestUCB = -sys.maxsize - 1
+ bestNode = None
+ for node in self.root.children:
+ ucb = node.ucbForPlayer()
+ if ucb > bestUCB:
+ bestUCB = ucb
+ bestNode = node
+
+ return bestNode
+
+ def clearBoard(self):
+ """Empties move history."""
+ while self.root.parent is not None:
+ self.root = self.root.parent
+
+class MCTSNode:
+ """Monte Carlo tree node."""
+
+ def __init__(self, move, parent):
+ self.visits = 0
+ self.score = 0
+ self.move = move
+ self.parent = parent
+ self.children = set()
+ self.unexploredVertices = move.getPlayableVertices()
+
+ def ucbForPlayer(self):
+ """
+ Returns Upper Confidence Bound of node changing the symbol if the move is for the
+ wite player."""
+ return self._ucbForSpecificPlayer(self.move.getPlayer())
+
+ def _ucbForSpecificPlayer(self, player):
+ """
+ Returns Upper Confidence Bound of node from the perspective of the given
+ player."""
+ if player == Player.WHITE:
+ return self._ucb() * -1
+ return self._ucb()
+
+ def _ucb(self):
+ """Returns Upper Confidence Bound of node"""
+ # UCB = meanVictories + 1/visits
+ if self.visits == 0:
+ return 0
+ mean = self.score / self.visits
+ adjust = 1/self.visits
+ return mean + adjust
+
+ def selection(self):
+ """Select the most promising node with unexplored children."""
+ bestNode = self._selectionRec(self)
+ return bestNode
+
+ def _selectionRec(self, bestNode):
+ """Searches this node and its children for the node with the best UCB value for
+ the current player."""
+
+ #TODO: En cada nivel debe escoger como mejor el que sea mejor para quien le toque
+ # jugar, ya que esa es la partida esperada. Esto es lo que hacía con
+ # ucbForPlayer()
+
+ # ¿Cada nuevo nodo expandido tiene una puntuación inicial? ¿Se le hacen
+ # exploraciones?
+
+ # Backpropagation: ¿Es correcto acumular la puntuación de cada nodo hacia
+ # arriba? ¿Sería mejor acumular hacia arriba el valor del mejor nodo? ¿O del
+ # juego perfecto? Estos dos últimos valores no son el mismo.
+
+ player = self.move.getPlayer()
+
+ # Check if node has unexplored children and better UCB than previously explored
+ if len(self.unexploredVertices) > 0:
+ if self._ucbForSpecificPlayer(
+ player) > bestNode._ucbForSpecificPlayer(player):
+ bestNode = self
+
+ # Recursively search children for better UCB
+ for child in self.children:
+ bestChildNode = child._selectionRec(bestNode)
+ if bestChildNode._ucbForSpecificPlayer(
+ player) > bestNode._ucbForSpecificPlayer(player):
+ bestNode = bestChildNode
+
+ return bestNode
+
+ def expansion(self):
+ """Pick an unexplored vertex from this node and add it as a new MCTSNode."""
+ newVertex = random.choice(list(self.unexploredVertices))
+ return self.expansionForCoords(newVertex)
+
+ def expansionForCoords(self, coords):
+ """
+ Adds a move for the given coordinates as a new node to the children of this
+ node."""
+ newMove = self.move.addMove(coords[0], coords[1])
+ newNode = MCTSNode(newMove, self)
+ self.children.add(newNode)
+ self.unexploredVertices.remove((coords[0], coords[1]))
+ return newNode
+
+ def simulation(self, nMatches, scoreDiffHeur):
+ """Play random matches to accumulate reward information on the node."""
+ scoreAcc = 0
+ for _ in range(nMatches):
+ result = self._randomMatch(scoreDiffHeur)
+ self.visits += 1
+ scoreDiff = result[0]-result[1]
+ if scoreDiff != 0:
+ scoreAcc += scoreDiff / abs(scoreDiff)
+ # Backpropagation
+ node = self
+ while node is not None:
+ node.score += scoreAcc
+ node.visits += nMatches
+ node = node.parent
+
+ def _randomMatch(self, scoreDiffHeur):
+ """Play a random match and return the resulting score."""
+ #IMPORTANT: the score heuristic doesn't work for the first move of the game, since
+ #the black player holds all except for one vertex!
+ currentMove = self.move
+ score = currentMove.board.score()
+ while currentMove.getGameLength() < 5 or abs(score[0] - score[1]) < scoreDiffHeur:
+ if currentMove.isPass and currentMove.previousMove.isPass:
+ return score
+ sensibleMoves = currentMove.getSensibleVertices()
+ if len(sensibleMoves) == 0:
+ currentMove = currentMove.addPass()
+ else:
+ selectedMove = random.choice(list(sensibleMoves))
+ currentMove = currentMove.addMoveByCoords(selectedMove)
+ score = currentMove.board.score()
+ print("Current move: %s" % (str(currentMove)))
+ print("Current move game length: ", currentMove.getGameLength())
+ print("Score of the board: %d, %d (%d)"
+ % (score[0],
+ score[1],
+ score[0]-score[1])
+ )
+ currentMove.printBoard()
+ return score
+
+ def _printBoardInfo(self):
+ """Prints the visits and score for debugging purposes."""
+ print("Visits: %d" % self.visits)
+ print("Score: %d" % self.score)
diff --git a/imago/engine/parseHelpers.py b/imago/engine/parseHelpers.py
index 32f0753..fc42845 100644
--- a/imago/engine/parseHelpers.py
+++ b/imago/engine/parseHelpers.py
@@ -15,32 +15,28 @@ VALID_BLACK_STRINGS = {
"BLACK"
}
-class ParseCodes(Enum):
- """Return values of the move parser."""
- ERROR = enumAuto()
- QUIT = enumAuto()
-
def parseMove(args, boardsize):
- """Converts the textual input of a move to a move instance."""
+ """Converts the textual representation of a move to a move instance."""
if len(args) != 2:
- print("[ERROR] - Wrong n of args for move")
- return ParseCodes.ERROR
+ raise RuntimeError(
+ "Unable to transform string %s to move: Wrong format."
+ % args)
color = parseColor(args[0])
vertex = parseVertex(args[1], boardsize)
return GtpMove(color, vertex)
def parseColor(text):
"""Returns color of a move given its input string."""
- text = text.upper()
- if text in VALID_WHITE_STRINGS:
+ textUpper = text.upper()
+ if textUpper in VALID_WHITE_STRINGS:
return Player.WHITE
- if text in VALID_BLACK_STRINGS:
+ if textUpper in VALID_BLACK_STRINGS:
return Player.BLACK
- print("[ERROR] - Unknown color.")
- return ParseCodes.ERROR
+ raise RuntimeError("Unknown color %s." % text)
def parseVertex(text, boardSize):
- """Returns row and column of a vertex given its input string.
+ """Returns row and column of a vertex given its input string. A vertex can also be the
+ string "pass".
GTP uses A1 style notation: columns are letters left to right, rows are number bottom
to top.
@@ -48,7 +44,11 @@ def parseVertex(text, boardSize):
text = text.upper()
if not re.match("^[A-HJ-Z][1-9][0-9]*$", text):
- return ParseCodes.ERROR
+ if text == "PASS":
+ return "pass"
+ raise RuntimeError(
+ "Unable to transform string %s to vertex. Wrong format."
+ % text)
vertexCol = ord(text[0])
# Column 'I' does not exist
@@ -60,7 +60,9 @@ def parseVertex(text, boardSize):
if (vertexCol < 0 or vertexRow < 0
or vertexCol >= boardSize or vertexRow >= boardSize):
- return ParseCodes.ERROR
+ raise RuntimeError(
+ "Unable to transform string %s to vertex. Maps to [%d, %d], which is out of board bounds (size %d)"
+ % (text, vertexCol, vertexRow, boardSize))
return [vertexRow, vertexCol]
@@ -70,10 +72,16 @@ def vertexToString(vertex, boardSize):
GTP uses A1 style notation: columns are letters left to right, rows are number bottom
to top.
"""
+ if vertex == "pass":
+ return "pass"
if len(vertex) != 2:
- return ParseCodes.ERROR
+ raise RuntimeError(
+ "Unable to transform vertex %s to string. Too many elements."
+ % str(vertex))
if vertex[0] >= boardSize or vertex[1] >= boardSize or vertex[0] < 0 or vertex[1] < 0:
- return ParseCodes.ERROR
+ raise RuntimeError(
+ "Unable to transform vertex %s to string. Vertex out of board bounds (size %d)"
+ % (str(vertex), boardSize))
vertexRow = boardSize - vertex[0]
vertexCol = ord('A') + vertex[1]
diff --git a/imago/gameLogic/gameBoard.py b/imago/gameLogic/gameBoard.py
index 265b646..611c4cb 100644
--- a/imago/gameLogic/gameBoard.py
+++ b/imago/gameLogic/gameBoard.py
@@ -4,45 +4,61 @@ from copy import deepcopy
from imago.data.enums import Player
-def getNewBoard(size):
+def _getNewBoard(height, width):
"""Return a new board."""
board = []
- for row in range(size):
+ for row in range(height):
board.append([])
- for _ in range(size):
+ for _ in range(width):
board[row].append(Player.EMPTY)
return board
class GameBoard:
+ """Logic and state related to the board."""
- def __init__(self, size):
- self.board = getNewBoard(size)
+ def __init__(self, height, width):
+ self.board = _getNewBoard(height, width)
self.capturesBlack = 0
self.capturesWhite = 0
- self.lastStone = None
+
+ def getBoard(self):
+ """Gets the matrix representing the board."""
+ return self.board
+
+ def getBoardHeight(self):
+ """Returns the number of rows in the board."""
+ return len(self.board)
+
+ def getBoardWidth(self):
+ """Returns the number of columns of the first row of the board. This number should
+ be the same for all the rows."""
+ return len(self.board[0])
def getDeepCopy(self):
"""Returns a copy GameBoard."""
- newBoard = GameBoard(len(self.board))
+ newBoard = GameBoard(self.getBoardHeight(), self.getBoardWidth())
newBoard.capturesBlack = self.capturesBlack
newBoard.capturesWhite = self.capturesWhite
- newBoard.lastStone = self.lastStone
newBoard.board = deepcopy(self.board)
return newBoard
def getGroupLiberties(self, row, col):
- """Returns the empty vertexes adjacent to the group occupying a cell (its
- liberties) or -1 if the cell is empty.
+ """Returns the empty vertices adjacent to the group occupying a vertex (its
+ liberties) as a set. An empty set is returned if the vertex is empty.
"""
groupColor = self.board[row][col]
if groupColor == Player.EMPTY:
- return -1
+ return set()
emptyCells = set()
exploredCells = set()
- self.__exploreLiberties(row, col, groupColor, emptyCells, exploredCells)
+ self._exploreLiberties(row, col, groupColor, emptyCells, exploredCells)
return emptyCells
- def __exploreLiberties(self, row, col, groupColor, emptyCells, exploredCells):
+ def getGroupLibertiesCount(self, row, col):
+ """Returns the number of liberties of a group."""
+ return len(self.getGroupLiberties(row, col))
+
+ def _exploreLiberties(self, row, col, groupColor, emptyCells, exploredCells):
"""Adds surrounding empty cells to array if they have not been added yet
and explores adjacent occupied cells of the same group.
"""
@@ -58,99 +74,217 @@ class GameBoard:
emptyCells.add((row, col))
return
- # Up
- if row > 0:
- self.__exploreLiberties(row-1, col, groupColor, emptyCells, exploredCells)
+ for side in ((-1,0), (1,0), (0,-1), (0,1)):
+ rowToExplore = row + side[0]
+ colToExplore = col + side[1]
+ if self.isMoveInBoardBounds(rowToExplore, colToExplore):
+ self._exploreLiberties(rowToExplore, colToExplore, groupColor,
+ emptyCells, exploredCells)
- # Right
- if col < len(self.board[0])-1:
- self.__exploreLiberties(row, col+1, groupColor, emptyCells, exploredCells)
-
- # Down
- if row < len(self.board)-1:
- self.__exploreLiberties(row+1, col, groupColor, emptyCells, exploredCells)
-
- # Left
- if col > 0:
- self.__exploreLiberties(row, col-1, groupColor, emptyCells, exploredCells)
-
- def getGroupCells(self, row, col):
- """Returns a set containing the cells occupied by the group in the given cell."""
+ def getGroupVertices(self, row, col):
+ """
+ Returns a set containing the cells occupied by the group in the given cell.
+ This is also valid if the cell is empty."""
groupColor = self.board[row][col]
- if groupColor == Player.EMPTY:
- return 0
cells = set()
self.__exploreGroup(row, col, groupColor, cells)
return cells
+ def getGroupVerticesCount(self, row, col):
+ """Returns the number of cells of a group."""
+ return len(self.getGroupVertices(row, col))
+
def __exploreGroup(self, row, col, groupColor, cells):
if self.board[row][col] != groupColor or (row, col) in cells:
return
cells.add((row, col))
- # Up
- if row > 0:
- self.__exploreGroup(row-1, col, groupColor, cells)
+ for side in ((-1,0), (1,0), (0,-1), (0,1)):
+ rowToExplore = row + side[0]
+ colToExplore = col + side[1]
+ if self.isMoveInBoardBounds(rowToExplore, colToExplore):
+ self.__exploreGroup(rowToExplore, colToExplore, groupColor, cells)
- # Right
- if col < len(self.board[0])-1:
- self.__exploreGroup(row, col+1, groupColor, cells)
+ def moveAndCapture(self, row, col, player):
+ """Checks surrounding captures of a move, removes them and returns a set
+ containing the vertices where stones were captured.
+ """
- # Down
- if row < len(self.board)-1:
- self.__exploreGroup(row+1, col, groupColor, cells)
+ if (row < 0 or row >= self.getBoardHeight()
+ or col < 0 or col >= self.getBoardWidth()):
+ raise RuntimeError("[ERROR] Move and capture: out of bounds (%d, %d)" % (row, col))
- # Left
- if col > 0:
- self.__exploreGroup(row, col-1, groupColor, cells)
+ self.board[row][col] = player
+ captured = set()
+
+ for side in ((-1,0), (1,0), (0,-1), (0,1)):
+ rowToExplore = row + side[0]
+ colToExplore = col + side[1]
+ if self.isMoveInBoardBounds(rowToExplore, colToExplore):
+ if (self.board[rowToExplore][colToExplore] != player
+ and self.board[rowToExplore][colToExplore] != Player.EMPTY
+ and self.getGroupLibertiesCount(rowToExplore, colToExplore) == 0):
+ captured.update(self.__captureGroup(rowToExplore, colToExplore))
- def moveCapture(self, row, col, player):
- """Checks surrounding captures of a move, removes them and returns the number of
- stones captured.
- """
- captured = 0
- if row > 0:
- if (self.board[row-1][col] != player
- and self.board[row-1][col] != Player.EMPTY
- and len(self.getGroupLiberties(row-1, col)) == 0):
- captured += self.captureGroup(row-1, col)
- if row < len(self.board)-1:
- if (self.board[row+1][col] != player
- and self.board[row+1][col] != Player.EMPTY
- and len(self.getGroupLiberties(row+1, col)) == 0):
- captured += self.captureGroup(row+1, col)
- if col > 0:
- if (self.board[row][col-1] != player
- and self.board[row][col-1] != Player.EMPTY
- and len(self.getGroupLiberties(row, col-1)) == 0):
- captured += self.captureGroup(row, col-1)
- if col < len(self.board[0])-1:
- if (self.board[row][col+1] != player
- and self.board[row][col+1] != Player.EMPTY
- and len(self.getGroupLiberties(row, col+1)) == 0):
- captured += self.captureGroup(row, col+1)
return captured
- def captureGroup(self, row, col):
- """Removes all the stones from the group occupying the given cell and returns the
- number of removed stones.
+ def __captureGroup(self, row, col):
+ """Removes all the stones from the group occupying the given cell and returns a
+ set containing them.
"""
- cellsToCapture = self.getGroupCells(row, col)
- count = 0
+ cellsToCapture = self.getGroupVertices(row, col)
for cell in cellsToCapture:
self.board[cell[0]][cell[1]] = Player.EMPTY
- count += 1
- return count
+ return cellsToCapture
+
+ def isMoveInBoardBounds(self, row, col):
+ """Returns True if move is inside board bounds, false otherwise."""
+ return 0 <= row < self.getBoardHeight() and 0 <= col < self.getBoardWidth()
+
+ def isCellEmpty(self, row, col):
+ """Returns True if cell is empty, false otherwise."""
+ return self.board[row][col] == Player.EMPTY
+
+ def isCellEye(self, row, col):
+ """Returns the surrounding color if the cell is part of an eye and Player.EMTPY
+ otherwise.
+ """
+ # if isCellEmpty && all adjacent to group are same color
+ if not self.isCellEmpty(row, col):
+ return Player.EMPTY
+ groupCells = self.getGroupVertices(row, col)
+ surroundingColor = Player.EMPTY
+ # Check surrounding cells of each cell in the group
+ for cell in groupCells:
+ for side in ((-1,0), (1,0), (0,-1), (0,1)):
+ rowChecked = cell[0]+side[0]
+ colChecked = cell[1]+side[1]
+ if self.isMoveInBoardBounds(rowChecked, colChecked):
+ otherColor = self.board[rowChecked][colChecked]
+ if otherColor != Player.EMPTY:
+ if surroundingColor == Player.EMPTY:
+ surroundingColor = otherColor
+ elif surroundingColor != otherColor:
+ return Player.EMPTY
+ return surroundingColor
+
+ def isMoveSuicidal(self, row, col, player):
+ """Returns True if move is suicidal."""
+
+ # Check vertex is empty
+ if not self.isCellEmpty(row, col):
+ raise RuntimeError("Cell to play should be empty when checking for suicide.")
+
+ # Temporarily play and capture
+ self.board[row][col] = player
+ groupLiberties = self.getGroupLibertiesCount(row, col)
+ captured = self.moveAndCapture(row, col, player)
+
+ illegal = False
+ # If move didn't capture anything and its group is left without liberties, it's
+ # suicidal
+ if len(captured) == 0 and groupLiberties == 0:
+ illegal = True
+
+ # Restore captured stones
+ for vertex in captured:
+ self.board[vertex[0]][vertex[1]] = Player.otherPlayer(player)
+ # Remove temporarily played stone
+ self.board[row][col] = Player.EMPTY
+ return illegal
+
+ def isMoveKoIllegal(self, row, col, player, prevBoards):
+ """Returns True if move is illegal because of ko."""
+
+ # Check vertex is empty
+ if not self.isCellEmpty(row, col):
+ raise RuntimeError("Cell to play should be empty when checking for ko.")
+
+ illegal = False
+ # Temporarily play and capture for comparisons
+ captured = self.moveAndCapture(row, col, player)
+ # Check previous boards
+ for prevBoard in prevBoards:
+ # A ko is possible in boards where the stone to play exists
+ if prevBoard.board[row][col] == player:
+ if self.equals(prevBoard):
+ illegal = True
+
+ # Restore captured stones
+ for vertex in captured:
+ self.board[vertex[0]][vertex[1]] = Player.otherPlayer(player)
+ # Remove temporarily played stone
+ self.board[row][col] = Player.EMPTY
+ return illegal
+
+ def isPlayable(self, row, col, player, prevBoards):
+ """Determines if a move is playable."""
+ if not self.isMoveInBoardBounds(row, col):
+ return False, "Move outside board bounds."
+ if not self.isCellEmpty(row, col):
+ return False, "Vertex is not empty."
+ if self.isMoveSuicidal(row, col, player):
+ return False, "Move is suicidal."
+ if self.isMoveKoIllegal(row, col, player, prevBoards):
+ return False, "Illegal by ko rule."
+ return True, ""
+
+ def isSensible(self, row, col, player, prevBoards):
+ """Determines if a move is playable and sensible."""
+ playable, playableText = self.isPlayable(row, col, player, prevBoards)
+ if not playable:
+ return playable, playableText
+ if ( self.getGroupVerticesCount(row, col) == 1
+ and self.isCellEye(row, col) == player ):
+ return False, "Move fills own eye."""
+ return True, ""
+
+ def score(self):
+ """Gets the current score given by the already surrounded territory for Japanese
+ rules. The format of the returned score is (black, white).
+ """
+ scores = []
+ for player in Player:
+ while len(scores) <= player.value:
+ scores.append(0)
+ checkedVertices = set()
+ for row in range(0, self.getBoardHeight()):
+ for col in range(0, self.getBoardWidth()):
+ if not (row, col) in checkedVertices:
+ group = self.getGroupVertices(row, col)
+ for cell in group:
+ checkedVertices.add(cell)
+ surroundingColor = self.isCellEye(row, col)
+ if surroundingColor != Player.EMPTY:
+ scores[surroundingColor.value] += len(group)
+ return (scores[Player.BLACK.value], scores[Player.WHITE.value])
+
+ def equals(self, otherBoard):
+ """Returns true if this board is equal to another board. Only takes into account
+ dimensions and placed stones.
+ """
+ if ( self.getBoardHeight() != otherBoard.getBoardHeight()
+ or self.getBoardWidth() != otherBoard.getBoardWidth() ):
+ return False
+ for row in range(self.getBoardHeight()):
+ for col in range(self.getBoardWidth()):
+ if self.board[row][col] != otherBoard.board[row][col]:
+ return False
+ return True
def printBoard(self):
"""Print the board."""
colTitle = 'A'
rowTitlePadding = 2
+ if self.getBoardHeight() >= 10:
+ firstRowPadding = 2
+ else:
+ firstRowPadding = 1
# Print column names
- rowText = " " * (rowTitlePadding + 2)
- for col in range(len(self.board[0])):
+ rowText = " " * (rowTitlePadding + firstRowPadding)
+ for col in range(self.getBoardWidth()):
rowText += colTitle + " "
colTitle = chr(ord(colTitle)+1)
if colTitle == "I": # Skip I
@@ -158,7 +292,7 @@ class GameBoard:
print(rowText)
# Print rows
- rowTitle = len(self.board)
+ rowTitle = self.getBoardHeight()
for row in self.board:
rowText = ""
for col in row:
diff --git a/imago/gameLogic/gameMove.py b/imago/gameLogic/gameMove.py
index bd210b4..c1c7a05 100644
--- a/imago/gameLogic/gameMove.py
+++ b/imago/gameLogic/gameMove.py
@@ -1,19 +1,145 @@
"""Information about one move."""
+from imago.data.enums import Player
+
class GameMove:
+ """Stores information about a move. A move in this context is one position of the Game
+ Tree: the board can be empty, or the move can consist of more than one added or
+ removed stones."""
- def __init__(self, player, row, col, makesKo, board):
- self.player = player
- self.row = row
- self.col = col
- self.makesKo = makesKo
+ def __init__(self, board, coords=None, isPass=False, playerWhoPassed=None):
self.board = board
self.nextMoves = []
self.previousMove = None
+ self.isPass = isPass
+ self.coords = coords
+ self.playerWhoPassed = playerWhoPassed
+
+ def getRow(self):
+ """Returns the row of the vertex the move was played on."""
+ if self.coords is None:
+ return None
+ return self.coords[0]
+
+ def getCol(self):
+ """Returns the column of the vertex the move was played on."""
+ if self.coords is None:
+ return None
+ return self.coords[1]
+
+ def getPlayer(self):
+ """Returns the player who placed the last stone or passed."""
+ if self.isPass:
+ if self.previousMove is None:
+ return Player.BLACK
+ return self.playerWhoPassed
+
+ if self.coords is None: # Not pass and no coordinates: root move of the tree
+ return Player.EMPTY
+
+ return self.board.getBoard()[self.getRow()][self.getCol()]
+
+ def getNextPlayer(self):
+ """Returns the player who should place the next stone."""
+ selfPlayer = self.getPlayer()
+ if selfPlayer == Player.EMPTY:
+ return Player.BLACK
+ return Player.otherPlayer(selfPlayer)
+
+ def getGameLength(self):
+ """Returns the number of (actual player-made) moves since the game started."""
+ acc = 0
+ prevMove = self.previousMove
+ while prevMove is not None:
+ acc += 1
+ prevMove = prevMove.previousMove
+ return acc
+
+ def getThisAndPrevBoards(self):
+ """Returns an array with all the boards of this and previous moves."""
+ prevBoards = []
+ checkedMove = self.previousMove
+ while checkedMove is not None:
+ prevBoards.append(checkedMove.board)
+ checkedMove = checkedMove.previousMove
+ return prevBoards
+
+ def getPlayableVertices(self):
+ """Returns a set with the playable vertices."""
+ return self._getVerticesByFilter(self.board.isPlayable)
+
+ def getSensibleVertices(self):
+ """Returns a set with the sensible vertices."""
+ return self._getVerticesByFilter(self.board.isSensible)
+
+ def _getVerticesByFilter(self, filterFunction):
+ """Returns a set with the vertices which fill a requirement."""
+ vertices = set()
+ player = self.getNextPlayer()
+ prevBoards = self.getThisAndPrevBoards()
+ for row in range(self.board.getBoardHeight()):
+ for col in range(self.board.getBoardWidth()):
+ valid, _ = filterFunction(row, col, player, prevBoards)
+ if valid:
+ vertices.add((row, col))
+ return vertices
- def addMove(self, player, row, col, makesKo, board):
- """Adds a move to the next moves list."""
- newMove = GameMove(player, row, col, makesKo, board)
+ def addMoveByCoords(self, coords):
+ """Adds a move to the next moves list creating its board from this move's board
+ plus a new stone at the specified coordinates.
+ """
+ return self.addMove(coords[0], coords[1])
+
+
+ def addMove(self, row, col):
+ """Adds a move to the next moves list creating its board from this move's board
+ plus a new stone at the specified row and column.
+ """
+ if self.getPlayer() == Player.EMPTY:
+ player = Player.BLACK
+ else:
+ player = Player.otherPlayer(self.getPlayer())
+ return self.addMoveForPlayer(row, col, player)
+
+ def addMoveForPlayer(self, row, col, player):
+ """Adds a move to the next moves list creating its board from this move's board
+ plus a new stone at the specified row and column.
+ """
+ newBoard = self.board.getDeepCopy()
+ newBoard.moveAndCapture(row, col, player)
+ newMove = GameMove( newBoard, (row, col) )
newMove.previousMove = self
self.nextMoves.append(newMove)
return newMove
+
+ def addPass(self):
+ """Adds a pass move to the next moves list."""
+ return self.addPassForPlayer(self.getNextPlayer())
+
+ def addPassForPlayer(self, player):
+ """Adds a pass move for the given player to the next moves list."""
+ newBoard = self.board.getDeepCopy()
+ newMove = GameMove(newBoard, isPass=True, playerWhoPassed=player)
+ newMove.previousMove = self
+ self.nextMoves.append(newMove)
+ return newMove
+
+ def getMainLineOfPlay(self, previousMoves=[]):
+ """Returns, recursively, this move and its first children, so a list of moves is
+ obtained. This typically represents the played sequence of a match."""
+ previousMoves.append(self)
+ if len(self.nextMoves) == 0:
+ return previousMoves
+ return self.nextMoves[0].getMainLineOfPlay(previousMoves)
+
+ def __str__(self):
+ """Returns the coordinates of the move as a string."""
+ if self.isPass:
+ return "Pass"
+ if self.coords is None:
+ return "Root move"
+ return "(%d, %d)" % (self.getRow(), self.getCol())
+
+ def printBoard(self):
+ """Prints the board as of this move."""
+ self.board.printBoard()
diff --git a/imago/gameLogic/gameState.py b/imago/gameLogic/gameState.py
index 7a96962..72b91b4 100644
--- a/imago/gameLogic/gameState.py
+++ b/imago/gameLogic/gameState.py
@@ -1,7 +1,6 @@
"""Storing state of the game."""
from imago.data.enums import Player
-from imago.gameLogic.gameTree import GameTree
from imago.gameLogic.gameMove import GameMove
from imago.gameLogic.gameBoard import GameBoard, cellToString
@@ -10,15 +9,16 @@ class GameState:
def __init__(self, size):
self.size = size
- self.gameTree = None
self.lastMove = None
- self.initState()
+ self.clearBoard()
def getCurrentPlayer(self):
"""Gets the player who should make the next move."""
if self.lastMove is None:
return Player.BLACK
- return Player.otherPlayer(self.lastMove.player)
+ if self.lastMove.getPlayer() is Player.EMPTY:
+ return Player.BLACK
+ return Player.otherPlayer(self.lastMove.getPlayer())
def getPlayerCode(self):
"""Gets a string representation of the current player."""
@@ -26,10 +26,13 @@ class GameState:
def getBoard(self):
"""Returns the board as of the last move."""
- if self.lastMove is None:
- return GameBoard(self.size)
return self.lastMove.board
+ def clearBoard(self):
+ """Empties the board and moves tree."""
+ newBoard = GameBoard(self.size, self.size)
+ self.lastMove = GameMove(newBoard)
+
def playMove(self, row, col):
"""Execute a move on the board for the current player and switches players."""
return self.playMoveForPlayer(row, col, self.getCurrentPlayer())
@@ -37,69 +40,32 @@ class GameState:
def playMoveForPlayer(self, row, col, player):
"""Execute a move on the board for the given player."""
- # Check valid move
- if not self.prevalidateMove(row, col):
- print("Invalid move!")
- return False
-
- newBoard = self.getBoard().getDeepCopy()
-
- newBoard.board[row][col] = player
-
- groupLiberties = newBoard.getGroupLiberties(row, col)
+ prevBoards = self.lastMove.getThisAndPrevBoards()
+ playable, message = self.lastMove.board.isPlayable(row, col, player, prevBoards)
+ if playable:
+ self._addMove(player, row, col)
+ return True
+ print("Invalid Move! %s" % message)
+ return False
- # Check suicide
- killed = newBoard.moveCapture(row, col, player)
- if killed == 0 and len(groupLiberties) == 0:
- print("Invalid move! (Suicide)")
- return False
+ def playPass(self):
+ """Passes the turn for the player who should make a move."""
+ self.lastMove.addPass()
- # Check ko
- if self.lastMove is not None:
- illegalKoVertex = self.lastMove.makesKo
- if illegalKoVertex is not None:
- if row == illegalKoVertex[0] and col == illegalKoVertex[1]:
- print("Invalid move! (Ko)")
- return False
-
- # Move is legal
-
- # Check if move makes ko
- makesKo = None
- if killed == 1 and len(groupLiberties) == 1:
- makesKo = groupLiberties[0]
-
- self.__addMove(player, row, col, makesKo, newBoard)
- return True
+ def passForPlayer(self, player):
+ """Passes the turn for the given player."""
+ self.lastMove.addPassForPlayer(player)
def undo(self):
"""Sets the move before the last move as the new last move."""
self.lastMove = self.lastMove.previousMove
- def initState(self):
- """Starts current player, captured stones, board and game tree."""
- self.capturesBlack = 0
- self.capturesWhite = 0
- self.gameTree = GameTree()
- self.lastMove = None
+ def _addMove(self, player, row, col):
- def clearBoard(self):
- """Clears the board, captured stones and game tree."""
- self.initState()
-
- def prevalidateMove(self, row, col):
- """Returns True if move is valid, False if not."""
- if (row < 0 or row >= self.size
- or col < 0 or col >= self.size):
- return False
- if self.getBoard().board[row][col] != Player.EMPTY:
- return False
- return True
-
- def __addMove(self, player, row, col, makesKo, newBoard):
+ # Check a last move already exists
if self.lastMove is None:
- self.lastMove = GameMove(player, row, col, makesKo, newBoard)
- self.gameTree.firstMoves.append(self.lastMove)
- else:
- self.lastMove = self.lastMove.addMove(player, row, col, makesKo, newBoard)
+ raise RuntimeError("Last move of the GameState is None.")
+
+ # Add and return the new move
+ self.lastMove = self.lastMove.addMoveForPlayer(row, col, player)
return self.lastMove
diff --git a/imago/gameLogic/gameTree.py b/imago/gameLogic/gameTree.py
index 4b88c4d..5955252 100644
--- a/imago/gameLogic/gameTree.py
+++ b/imago/gameLogic/gameTree.py
@@ -2,7 +2,7 @@
# This class will not be necessary if it just keeps being a list of moves
-class GameTree:
-
- def __init__(self):
- self.firstMoves = []
+#class GameTree:
+#
+# def __init__(self):
+# self.firstMoves = []
diff --git a/imago/scripts/__init__.py b/imago/scripts/__init__.py
new file mode 100644
index 0000000..e69de29
--- /dev/null
+++ b/imago/scripts/__init__.py
diff --git a/imago/scripts/monteCarloSimulation.py b/imago/scripts/monteCarloSimulation.py
new file mode 100644
index 0000000..395a87e
--- /dev/null
+++ b/imago/scripts/monteCarloSimulation.py
@@ -0,0 +1,25 @@
+#!/usr/bin/python
+
+"""Runs MonteCarlo simulations."""
+
+import sys
+
+from imago.gameLogic.gameBoard import GameBoard
+from imago.gameLogic.gameMove import GameMove
+from imago.engine.monteCarlo import MCTSNode
+
+if __name__ == "__main__":
+
+ if len(sys.argv) != 4:
+ print("[ERROR] Usage: monteCarloSimulation.py <size> <scoreDiffHeur> <nMatches>")
+ sys.exit(1)
+
+ size = int(sys.argv[1])
+ scoreDiffHeur = int(sys.argv[2])
+ nMatches = int(sys.argv[3])
+
+ board = GameBoard(size, size)
+ move = GameMove(board)
+ node = MCTSNode(move, None)
+ node.simulation(nMatches, scoreDiffHeur)
+ print("Score: %d" % node.score)
diff --git a/imago/scripts/monteCarloSimulation.sh b/imago/scripts/monteCarloSimulation.sh
new file mode 100755
index 0000000..8aa9e68
--- /dev/null
+++ b/imago/scripts/monteCarloSimulation.sh
@@ -0,0 +1,24 @@
+#!/bin/sh
+
+# Stores statistical data about MonteCarlo simulations
+
+outputDir="out"
+
+sampleSize=50
+nMatches=10
+
+mkdir -p "$outputDir"
+
+for size in 9 13 19; do
+ for scoreDiffHeur in 10 30 60; do
+ filename="size${size}_scoreDiffHeur${scoreDiffHeur}.dat"
+ logFile="size${size}_scoreDiffHeur${scoreDiffHeur}_fullOutput.log"
+ rm "$logFile"
+ for i in $(seq "$sampleSize"); do
+ python ./monteCarloSimulation.py "$size" "$scoreDiffHeur" "$nMatches" |
+ tee -a "${outputDir}/${logFile}" |
+ grep -E '^Score:' |
+ cut -d' ' -f2
+ done >"${outputDir}/${filename}"
+ done
+done
diff --git a/imago/sgfParser/astNode.py b/imago/sgfParser/astNode.py
index ec28c2a..41629ce 100644
--- a/imago/sgfParser/astNode.py
+++ b/imago/sgfParser/astNode.py
@@ -1,11 +1,11 @@
-from imago.gameLogic.gameTree import GameTree
from imago.gameLogic.gameData import GameData
from imago.gameLogic.gameMove import GameMove
-from imago.gameLogic.gameState import Player
+from imago.gameLogic.gameBoard import GameBoard
+from imago.data.enums import Player
class ASTNode:
"""Abstract Syntax Tree Node of SGF parser"""
- def __init__(self, children=None, leaf=None, props=None):
+ def __init__(self, children=None, props=None):
if children:
self.children = children
else:
@@ -13,8 +13,7 @@ class ASTNode:
if props:
self.props = props
else:
- self.props = {}
- self.leaf = leaf
+ self.props = []
def addToSequence(self, move):
"""Appends a move to the last of the sequence started by this move"""
@@ -68,7 +67,7 @@ class ASTNode:
gameData.roundInfo = prop.value
if prop.name == "RU": # Rules used for the game
gameData.rules = prop.value
- if prop.name == "SO": # Source of the gamw
+ if prop.name == "SO": # Source of the game
gameData.source = prop.source
if prop.name == "TM": # Time limit in seconds
gameData.timeInfo = prop.source
@@ -77,42 +76,69 @@ class ASTNode:
firstMoves = []
for child in self.children:
- firstMoves.append(child.toGameMoveTree)
+ firstMoves.append(child.toGameMoveTree(size))
return GameTree(firstMoves, gameData)
- def toGameMoveTree(self):
- player = 0
- coords = []
- for prop in self.props:
- if prop.name == "B": # White move
- player = Player.BLACK
- coords = textToCoords(prop.value)
- if prop.name == "W": # White move
- player = Player.WHITE
- coords = textToCoords(prop.value)
- gameMove = GameMove(player, coords[0], coords[1])
+ def toGameMoveTree(self, previousMove=None):
+ if previousMove is None:
+ # Game root node
+ size = int(self.getPropertyValue("SZ"))
+ board = GameBoard(size, size)
+ gameMove = GameMove(board)
+ else:
+ coords = []
+ player = None
+ for prop in self.props:
+ if prop.name == "B" or prop.name == "W":
+ if prop.value != "tt" and prop.value != "":
+ coords = textToCoords(prop.value)
+ if prop.name == "B":
+ player = Player.BLACK
+ else:
+ player = Player.WHITE
+ if len(coords) == 2:
+ gameMove = previousMove.addMoveForPlayer(coords[0], coords[1], player)
+ else:
+ gameMove = previousMove.addPassForPlayer(player)
for child in self.children:
- newMove = child.toGameMoveTree()
- gameMove.nextMoves.append(newMove)
- newMove.previousMove = gameMove
+ child.toGameMoveTree(previousMove=gameMove)
+ # Add a couple passes at the end of the match since they are not usually recorded
+ if len(self.children) == 0 and not gameMove.isPass:
+ nextMove = gameMove.addPass()
+ nextMove.addPass()
+
return gameMove
-def textToCoords(text): # Poner en PropertyMove, subclase de Property
- col = ord(text[1]) - ord('a')
- row = ord(text[0]) - ord('a')
- return [row, col]
+ def hasProperty(self, propertyName):
+ """Returns True if the node contains a property with the given name."""
+ for prop in self.props:
+ if prop.name == propertyName:
+ return True
+ return False
+ def getPropertyValue(self, propertyName):
+ """Returns the value of the given property for this node."""
+ for prop in self.props:
+ if prop.name == propertyName:
+ return prop.value
+ raise RuntimeError("ASTNode has no property %s" % propertyName)
- def toString(self):
+ def toString(self, debug=False):
"""Returns a depth-first representation of the tree."""
out = '(' + str(self.props) + ')'
- out += "in"
+ if debug: out += "in"
for node in self.children:
out = out + node.toString()
- out += "out"
+ if debug: out += "out"
return out
+def textToCoords(text): # Poner en PropertyMove, subclase de Property
+ col = ord(text[0]) - ord('a')
+ row = ord(text[1]) - ord('a')
+ return [row, col]
+
+
class Property:
"""Property of a Node"""
def __init__(self, name, value):
@@ -125,3 +151,6 @@ class Property:
self.value.append(value)
else:
self.value = [self.value, value]
+
+ def toString(self):
+ return("Property(%s, %s)" % (self.name, self.value))
diff --git a/imago/sgfParser/sgf.py b/imago/sgfParser/sgf.py
index b5c0be2..154cbbe 100644
--- a/imago/sgfParser/sgf.py
+++ b/imago/sgfParser/sgf.py
@@ -1,11 +1,13 @@
"""Module for reading and writing of SGF files."""
-from imago.gameLogic.gameTree import GameTree
-from imago.gameLogic.gameMove import GameMove
-
-# def loadGameTree(filename):
-# PLY?
-# """Parses a GameTree instance from a source SGF file."""
-# sgf = open(filename, "r")
-#
-# a = GameTree()
+from imago.sgfParser.sgfyacc import parser
+
+def loadGameTree(filename):
+ """Parses a GameTree instance from a source SGF file."""
+ file = open(filename, "r")
+
+ text = file.read()
+
+ file.close()
+
+ return parser.parse(text).toGameMoveTree()
diff --git a/imago/sgfParser/sgflex.py b/imago/sgfParser/sgflex.py
index 07fb404..c7dbf38 100755
--- a/imago/sgfParser/sgflex.py
+++ b/imago/sgfParser/sgflex.py
@@ -1,4 +1,4 @@
-#!/bin/python
+#!/usr/bin/python
# --------------------------------------
# sgflex.py
@@ -12,8 +12,6 @@ tokens = (
'LPAREN',
'RPAREN',
'SCOLON',
- 'LSQBRACKET',
- 'RSQBRACKET',
'PROPID',
'UCLETTER',
'DIGIT',
@@ -29,8 +27,6 @@ tokens = (
t_LPAREN = r'\('
t_RPAREN = r'\)'
t_SCOLON = r';'
-t_LSQBRACKET = r'\['
-t_RSQBRACKET = r'\]'
t_PROPID = r'[A-Z][A-Z]?'
t_UCLETTER = r'[A-Z]'
t_DIGIT = r'[0-9]'
@@ -58,7 +54,7 @@ def t_PROPVALUE(t):
# Rule to track line numbers
def t_newline(t):
- r'\n+'
+ r'\n'
t.lexer.lineno += len(t.value)
t_ignore = ' \t'
@@ -68,14 +64,8 @@ def t_error(t):
print("Illegal character '%s'" % t.value[0])
t.lexer.skip(1)
-#data='''
-#B[aa ]
-#W[AB]W[ab]
-#B[bb]
-#'''
+lexer = lex.lex() # Used by the parser
+#lexer = lex.lex(debug=True)
-lexer = lex.lex()
-#lexer.input(data)
-
-#for token in lexer:
-# print(token)
+if __name__ == '__main__':
+ lex.runmain()
diff --git a/imago/sgfParser/sgfyacc.py b/imago/sgfParser/sgfyacc.py
index bd00df6..d18f2a8 100755
--- a/imago/sgfParser/sgfyacc.py
+++ b/imago/sgfParser/sgfyacc.py
@@ -1,4 +1,4 @@
-#!/bin/python
+#!/usr/bin/python
# --------------------------------------
# sgyacc.py
@@ -7,8 +7,8 @@
import ply.yacc as yacc
-from sgflex import tokens
-from astNode import ASTNode, Property
+from imago.sgfParser.sgflex import tokens
+from imago.sgfParser.astNode import ASTNode, Property
def p_tree(p):
'''tree : LPAREN node RPAREN
@@ -31,7 +31,10 @@ def p_node(p):
def p_node_prop(p):
'node : node property'
- p[1].props[p[2].name] = p[2].value
+ if p[1].hasProperty(p[2].name):
+ print("Syntax error: node already contains a property named - %s" % p[2].name)
+ raise SyntaxError
+ p[1].props.append(p[2])
p[0] = p[1]
def p_property(p):
@@ -43,19 +46,26 @@ def p_property_value(p):
p[1].addValue(p[2])
p[0] = p[1]
-def p_error(_):
+def p_error(p):
"""Error rule for syntax errors"""
- print("Syntax error in input!")
+ print("Syntax error in input - %s" % p)
# Build the parser
parser = yacc.yacc()
+#parser = yacc.yacc(start='property')
-while True:
- try:
- s = input('calc > ')
- except EOFError:
- break
- if not s:
- continue
- result = parser.parse(s)
- print(result.toString())
+def main():
+
+ s = ""
+ while True:
+ try:
+ s = input('calc > ')
+ except EOFError:
+ break
+ if not s:
+ continue
+ result = parser.parse(s, debug=True)
+ print(result.toString())
+
+if __name__ == '__main__':
+ main()
diff --git a/imagocli.py b/imagocli.py
index e8e4580..5f14380 100755
--- a/imagocli.py
+++ b/imagocli.py
@@ -2,8 +2,28 @@
"""Run the Imago engine."""
+import sys
+
+from imago.data.enums import DecisionAlgorithms
from imago.engine.imagoIO import ImagoIO
if __name__ == "__main__":
- io = ImagoIO()
+
+ decisionAlgorithm = None
+ if len(sys.argv) >= 3:
+ if sys.argv[1] == "-e":
+ if sys.argv[2] == "montecarlo":
+ decisionAlgorithm = DecisionAlgorithms.MONTECARLO
+ if sys.argv[2] == "keras":
+ decisionAlgorithm = DecisionAlgorithms.KERAS
+ if sys.argv[2] == "dense":
+ decisionAlgorithm = DecisionAlgorithms.DENSE
+ if sys.argv[2] == "conv":
+ decisionAlgorithm = DecisionAlgorithms.CONV
+
+ if decisionAlgorithm is None:
+ io = ImagoIO()
+ else:
+ io = ImagoIO(decisionAlgorithm)
+
io.start()
diff --git a/models/testModel.h5 b/models/testModel.h5
new file mode 100644
index 0000000..6bc5fe2
--- /dev/null
+++ b/models/testModel.h5
Binary files differ
diff --git a/results.txt b/results.txt
new file mode 100644
index 0000000..aa1a8a3
--- /dev/null
+++ b/results.txt
@@ -0,0 +1,41 @@
+Visits: 10
+Score: 2
+Visits: 10
+Score: -4
+Visits: 10
+Score: 2
+Visits: 10
+Score: -2
+Visits: 10
+Score: -4
+Visits: 10
+Score: 0
+Visits: 10
+Score: 4
+Visits: 10
+Score: -2
+Visits: 10
+Score: 0
+Visits: 10
+Score: -4
+----------
+Visits: 50
+Score: -4
+Visits: 50
+Score: 0
+Visits: 50
+Score: -6
+Visits: 50
+Score: 0
+Visits: 50
+Score: -12
+Visits: 50
+Score: -6
+Visits: 50
+Score: 10
+Visits: 50
+Score: 0
+Visits: 50
+Score: 8
+Visits: 50
+Score: -2
diff --git a/simulationMatchesPyplot.py b/simulationMatchesPyplot.py
new file mode 100755
index 0000000..809e1a1
--- /dev/null
+++ b/simulationMatchesPyplot.py
@@ -0,0 +1,27 @@
+#!/usr/bin/python
+
+"""Uses pyplot to create graphs of the results of MonteCarlo simulations"""
+
+import matplotlib.pyplot as plt
+import numpy as np
+
+data = np.loadtxt("out/size9_scoreDiffHeur10.dat")
+
+dic = {}
+for value in data:
+ if value in dic.keys():
+ dic[value] += 1
+ else:
+ dic[value] = 1
+
+names = list(dic.keys())
+values = list(dic.values())
+
+fig, axs = plt.subplots(1, 3, figsize=(9, 3), sharey=True)
+axs[0].bar(names, values)
+axs[1].scatter(names, values)
+axs[2].plot(names, values)
+axs[2].axis([-10, 10, 0, max(values)+2])
+fig.suptitle('Categorical Plotting')
+
+plt.show()
diff --git a/testSGF.py b/testSGF.py
new file mode 100755
index 0000000..08a1bee
--- /dev/null
+++ b/testSGF.py
@@ -0,0 +1,20 @@
+#!/usr/bin/python
+
+"""Gets a game from an SGF file."""
+
+import sys
+
+from imago.sgfParser.sgf import loadGameTree
+
+def main():
+ filename = sys.argv[1]
+ move = loadGameTree(filename)
+ while move is not None:
+ move.printBoard()
+ if len(move.nextMoves) > 0:
+ move = move.nextMoves[0]
+ else:
+ move = None
+
+if __name__ == '__main__':
+ main()
diff --git a/tests/test_enums.py b/tests/test_enums.py
new file mode 100644
index 0000000..73f4009
--- /dev/null
+++ b/tests/test_enums.py
@@ -0,0 +1,15 @@
+"""Tests for enums module."""
+
+import unittest
+
+from imago.data.enums import Player
+
+class TestEnums(unittest.TestCase):
+ """Test parseHelpers module."""
+
+ def testOtherPlayer(self):
+ """Test method to get the other player"""
+
+ self.assertEqual(Player.otherPlayer(Player.BLACK), Player.WHITE)
+ self.assertEqual(Player.otherPlayer(Player.WHITE), Player.BLACK)
+ self.assertEqual(Player.otherPlayer(''), Player.EMPTY)
diff --git a/tests/test_gameBoard.py b/tests/test_gameBoard.py
new file mode 100644
index 0000000..8a7b127
--- /dev/null
+++ b/tests/test_gameBoard.py
@@ -0,0 +1,118 @@
+"""Tests for gameBoard module."""
+
+import unittest
+
+from imago.data.enums import Player
+from imago.gameLogic.gameBoard import GameBoard
+
+TEST_BOARD_SIZE = 19
+
+class TestGameBoard(unittest.TestCase):
+ """Test gameBoard module."""
+
+ def testGetGroupCounts(self):
+ """Test calculation of group stones and liberties."""
+ board = GameBoard(TEST_BOARD_SIZE, TEST_BOARD_SIZE)
+
+ #Empty cell liberties
+ self.assertEqual(board.getGroupLiberties(0,0), set())
+ self.assertEqual(board.getGroupLibertiesCount(0,0), 0)
+
+ # Lone stone
+ board.board[3][3] = Player.WHITE
+ self.assertEqual(board.getGroupVertices(3,3),
+ {(3,3)})
+ self.assertEqual(board.getGroupVerticesCount(3,3), 1)
+ self.assertEqual(board.getGroupLiberties(3,3),
+ {(2,3), (3,2), (4,3), (3,4)})
+ self.assertEqual(board.getGroupLibertiesCount(3,3), 4)
+
+ # L group (don't compute twice liberty inside L)
+ board.board[3][4] = Player.WHITE
+ board.board[2][4] = Player.WHITE
+ self.assertEqual(board.getGroupVertices(3,3),
+ {(3,3), (3,4), (2,4)})
+ self.assertEqual(board.getGroupVerticesCount(3,3), 3)
+ self.assertEqual(board.getGroupLiberties(3,3),
+ {(2,3), (3,2), (4,3), (4, 4), (3,5), (2,5), (1,4)})
+ self.assertEqual(board.getGroupLibertiesCount(3,3), 7)
+
+ def testIsCellEye(self):
+ """Tests the isCellEye method."""
+ board = GameBoard(TEST_BOARD_SIZE, TEST_BOARD_SIZE)
+
+ # Empty board is eye
+ self.assertEqual(Player.EMPTY, board.isCellEye(0, 0))
+ self.assertEqual(Player.EMPTY, board.isCellEye(3, 3))
+ self.assertEqual(Player.EMPTY, board.isCellEye(TEST_BOARD_SIZE-1, TEST_BOARD_SIZE-1))
+
+ # Board with 1 stone is eye
+ board.board[5][6] = Player.WHITE
+ self.assertEqual(Player.WHITE, board.isCellEye(3, 3))
+
+ # Board with 2 stones of different color is not eye
+ board.board[9][9] = Player.BLACK
+ self.assertEqual(Player.EMPTY, board.isCellEye(3, 3))
+
+ # Surrounded cell is eye
+ board.board[6][5] = Player.WHITE
+ board.board[6][7] = Player.WHITE
+ board.board[7][6] = Player.WHITE
+
+ self.assertEqual(Player.WHITE, board.isCellEye(6, 6))
+
+ # Surrounded cell with 2 different colors is not eye
+ board.board[6][5] = Player.BLACK
+ self.assertEqual(Player.EMPTY, board.isCellEye(6, 6))
+
+ def testScore(self):
+ """Tests the score method."""
+ board = GameBoard(TEST_BOARD_SIZE, TEST_BOARD_SIZE)
+
+ # Empty board has no score.
+ self.assertEqual((0, 0), board.score())
+
+ # Board with 1 black stone has totalVertices-1 points for black.
+ board.board[3][3] = Player.BLACK
+ self.assertEqual((TEST_BOARD_SIZE*TEST_BOARD_SIZE-1, 0), board.score())
+
+ # Board with 2 black stones has totalVertices-2 points for black.
+ board.board[5][5] = Player.BLACK
+ self.assertEqual((TEST_BOARD_SIZE*TEST_BOARD_SIZE-2, 0), board.score())
+
+ # Board with lone stones of different colors has no score.
+ board.board[7][7] = Player.WHITE
+ self.assertEqual((0, 0), board.score())
+
+ # Black group with surrounded territory.
+ board.board[2][3] = Player.BLACK
+ board.board[1][3] = Player.BLACK
+ board.board[0][3] = Player.BLACK
+ board.board[3][2] = Player.BLACK
+ board.board[3][1] = Player.BLACK
+ board.board[3][0] = Player.BLACK
+ self.assertEqual((9, 0), board.score())
+
+ # White group besides black group.
+ board.board[6][7] = Player.WHITE
+ board.board[5][7] = Player.WHITE
+ board.board[5][6] = Player.WHITE
+ board.board[5][5] = Player.WHITE
+ board.board[5][4] = Player.WHITE
+ board.board[5][3] = Player.WHITE
+ board.board[5][2] = Player.WHITE
+ board.board[5][1] = Player.WHITE
+ board.board[5][0] = Player.WHITE
+ board.board[8][7] = Player.WHITE
+ board.board[9][7] = Player.WHITE
+ board.board[9][6] = Player.WHITE
+ board.board[9][5] = Player.WHITE
+ board.board[9][4] = Player.WHITE
+ board.board[9][3] = Player.WHITE
+ board.board[9][2] = Player.WHITE
+ board.board[9][1] = Player.WHITE
+ board.board[9][0] = Player.WHITE
+ self.assertEqual((9, 21), board.score())
+
+if __name__ == '__main__':
+ unittest.main()
diff --git a/tests/test_gameMove.py b/tests/test_gameMove.py
new file mode 100644
index 0000000..6569c5b
--- /dev/null
+++ b/tests/test_gameMove.py
@@ -0,0 +1,78 @@
+"""Tests for gameMove module."""
+
+import unittest
+
+from imago.data.enums import Player
+from imago.gameLogic.gameBoard import GameBoard
+from imago.gameLogic.gameMove import GameMove
+
+TEST_BOARD_SIZE = 19
+
+class TestGameMove(unittest.TestCase):
+ """Test gameMove module."""
+
+ def testAddMove(self):
+ """Test adding new moves to existing moves."""
+ board = GameBoard(TEST_BOARD_SIZE, TEST_BOARD_SIZE)
+ firstMove = GameMove(board)
+
+ self.assertIsNone(firstMove.coords)
+
+ secondMove = firstMove.addMove(1, 2)
+
+ self.assertIsNone(firstMove.coords)
+ self.assertEqual(secondMove.coords[0], 1)
+ self.assertEqual(secondMove.coords[1], 2)
+
+ thirdMove = secondMove.addMove(5, 7)
+
+ self.assertIsNone(firstMove.coords)
+ self.assertIsNone(thirdMove.previousMove.previousMove.coords)
+
+ self.assertEqual(secondMove.coords[0], 1)
+ self.assertEqual(secondMove.coords[1], 2)
+ self.assertEqual(thirdMove.previousMove.coords[0], 1)
+ self.assertEqual(thirdMove.previousMove.coords[1], 2)
+
+ self.assertEqual(thirdMove.coords[0], 5)
+ self.assertEqual(thirdMove.coords[1], 7)
+ self.assertEqual(firstMove
+ .nextMoves[0]
+ .nextMoves[0]
+ .coords[0], 5)
+ self.assertEqual(firstMove
+ .nextMoves[0]
+ .nextMoves[0]
+ .coords[1], 7)
+
+ self.assertEqual(firstMove.board.getBoard()[1][2], Player.EMPTY)
+ self.assertEqual(secondMove.board.getBoard()[1][2], Player.BLACK)
+ self.assertEqual(thirdMove.board.getBoard()[1][2], Player.BLACK)
+
+ self.assertEqual(firstMove.board.getBoard()[5][7], Player.EMPTY)
+ self.assertEqual(secondMove.board.getBoard()[5][7], Player.EMPTY)
+ self.assertEqual(thirdMove.board.getBoard()[5][7], Player.WHITE)
+
+ def testGetPlayableVertices(self):
+ """Test getting the set of valid moves."""
+ boardSize = 3
+ board = GameBoard(boardSize, boardSize)
+
+ firstMove = GameMove(board)
+ self.assertSetEqual(
+ firstMove.getPlayableVertices(),
+ set(((0,0), (0,1), (0,2),
+ (1,0), (1,1), (1,2),
+ (2,0), (2,1), (2,2)))
+ )
+
+ secondMove = firstMove.addMove(1, 2)
+ self.assertSetEqual(
+ secondMove.getPlayableVertices(),
+ set(((0,0), (0,1), (0,2),
+ (1,0), (1,1),
+ (2,0), (2,1), (2,2)))
+ )
+
+if __name__ == '__main__':
+ unittest.main()
diff --git a/tests/test_monteCarlo.py b/tests/test_monteCarlo.py
new file mode 100644
index 0000000..b217cf9
--- /dev/null
+++ b/tests/test_monteCarlo.py
@@ -0,0 +1,30 @@
+"""Tests for the MonteCarlo algorithm."""
+
+import unittest
+
+from imago.gameLogic.gameState import GameState
+from imago.engine.monteCarlo import MCTS
+from imago.engine.monteCarlo import MCTSNode
+
+TEST_BOARD_SIZE = 9
+
+class TestMonteCarlo(unittest.TestCase):
+ """Test MonteCarlo algorithm."""
+
+ def testPickMove(self):
+ """Test picking a move."""
+ state = GameState(TEST_BOARD_SIZE)
+ tree = MCTS(state.lastMove)
+ #print(tree.pickMove().toString())
+
+ #def testSimulation(self):
+ # """Test calculation of group liberties."""
+ # board = GameBoard(TEST_BOARD_SIZE, TEST_BOARD_SIZE)
+ # move = GameMove(board)
+ # node = MCTSNode(move, None)
+ # nMatches = 100
+ # scoreDiffHeur = 15
+ # node.simulation(nMatches, scoreDiffHeur)
+
+if __name__ == '__main__':
+ unittest.main()
diff --git a/tests/test_parseHelpers.py b/tests/test_parseHelpers.py
index cf1fa9f..7bbf152 100644
--- a/tests/test_parseHelpers.py
+++ b/tests/test_parseHelpers.py
@@ -13,15 +13,19 @@ class TestParseHelpers(unittest.TestCase):
def testParseMove(self):
"""Test parsing of GtpMove"""
- self.assertEqual(parseHelpers.parseMove(["B"], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.parseMove(["A1"], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.parseMove(["B", "A1", "W"], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
+ wrongMoves = [
+ ["B"],
+ ["A1"],
+ ["B", "A1", "W"]
+ ]
+ for move in wrongMoves:
+ self.assertRaises(
+ RuntimeError,
+ parseHelpers.parseMove,
+ move, TEST_BOARD_SIZE
+ )
parsedMove = parseHelpers.parseMove(["B", "t1"], TEST_BOARD_SIZE)
-
targetMove = parseHelpers.GtpMove(Player.BLACK, [18, 18])
self.assertEqual(parsedMove.color, targetMove.color)
self.assertEqual(parsedMove.vertex, targetMove.vertex)
@@ -32,15 +36,19 @@ class TestParseHelpers(unittest.TestCase):
self.assertEqual(parseHelpers.parseColor("B"), Player.BLACK)
self.assertEqual(parseHelpers.parseColor("w"), Player.WHITE)
self.assertEqual(parseHelpers.parseColor("W"), Player.WHITE)
- self.assertEqual(parseHelpers.parseColor("bw"), parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.parseColor("wb"), parseHelpers.ParseCodes.ERROR)
+
+ self.assertRaises(RuntimeError, parseHelpers.parseColor, "bw")
+ self.assertRaises(RuntimeError, parseHelpers.parseColor, "wb")
def testParseVertexWrongInputs(self):
"""Test wrong inputs for parseVertex."""
inputs = ( "a", "1", "1a", "aa1", "a0", "u1", "a"+str(TEST_BOARD_SIZE+1) )
for text in inputs:
- self.assertEqual(parseHelpers.parseVertex(text, TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
+ self.assertRaises(
+ RuntimeError,
+ parseHelpers.parseVertex,
+ text, TEST_BOARD_SIZE
+ )
def testParseVertexCorrectInputs(self):
"""Test correct inputs and their resulting coordinates for parseVertex."""
@@ -67,6 +75,10 @@ class TestParseHelpers(unittest.TestCase):
"A19", TEST_BOARD_SIZE),
[0,0])
+ self.assertEqual(parseHelpers.parseVertex(
+ "pass", TEST_BOARD_SIZE),
+ "pass")
+
def testVertexToString(self):
"""Test converting vertices to strings."""
self.assertEqual(parseHelpers.vertexToString([0,0], TEST_BOARD_SIZE), "A19")
@@ -78,22 +90,24 @@ class TestParseHelpers(unittest.TestCase):
self.assertEqual(parseHelpers.vertexToString([18,0], TEST_BOARD_SIZE), "A1")
self.assertEqual(parseHelpers.vertexToString([18,18], TEST_BOARD_SIZE), "T1")
- self.assertEqual(parseHelpers.vertexToString([-1,0], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.vertexToString([0,-1], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.vertexToString([-1,-1], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.vertexToString([19,0], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.vertexToString([0,19], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.vertexToString([19,19], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.vertexToString([0], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
- self.assertEqual(parseHelpers.vertexToString([0,0,0], TEST_BOARD_SIZE),
- parseHelpers.ParseCodes.ERROR)
+ self.assertEqual(parseHelpers.vertexToString("pass", TEST_BOARD_SIZE), "pass")
+
+ wrongVertices = [
+ [-1,0],
+ [0,-1],
+ [-1,-1],
+ [19,0],
+ [0,19],
+ [19,19],
+ [0],
+ [0,0,0]
+ ]
+ for vertex in wrongVertices:
+ self.assertRaises(
+ RuntimeError,
+ parseHelpers.vertexToString,
+ vertex, TEST_BOARD_SIZE
+ )
if __name__ == '__main__':
unittest.main()
diff --git a/train.py b/train.py
new file mode 100755
index 0000000..0f518d0
--- /dev/null
+++ b/train.py
@@ -0,0 +1,27 @@
+#!/usr/bin/python
+
+"""Starts training a keras neural network."""
+
+import sys
+
+from imago.sgfParser.sgf import loadGameTree
+from imago.engine.keras.denseNeuralNetwork import DenseNeuralNetwork
+from imago.engine.keras.convNeuralNetwork import ConvNeuralNetwork
+
+def main():
+ games = []
+ for file in sys.argv[1:]:
+ print(file)
+ games.append(loadGameTree(file))
+
+ matches = [game.getMainLineOfPlay() for game in games]
+
+ modelFile = ""
+ boardsize = 9
+ nn = DenseNeuralNetwork(modelFile, boardsize)
+ #nn = ConvNeuralNetwork(modelFile, boardsize)
+ nn.trainModel(matches)
+ nn.saveModel()
+
+if __name__ == '__main__':
+ main()