% Conference paper (IEEE CoG 2019) by Soemers, Piette, Stephenson and Browne.
% Cleaned from a publisher export: names are in "Last, First" form, acronyms
% are brace-protected against style recasing, the page range uses an en-dash
% (--), the month is the predefined macro, and empty fields were dropped.
@inproceedings{COG8848037,
  author    = {Soemers, D. J. N. J. and Piette, {\'E}. and Stephenson, M. and Browne, C.},
  title     = {Learning Policies from Self-Play with Policy Gradients and {MCTS} Value Estimates},
  booktitle = {2019 {IEEE} Conference on Games ({CoG})},
  year      = {2019},
  month     = aug,
  pages     = {1--8},
  doi       = {10.1109/CIG.2019.8848037},
  issn      = {2325-4270},
  keywords  = {entropy;game theory;learning (artificial intelligence);Monte Carlo methods;tree searching;policy gradient expression;MCTS value estimates;policy gradients;game-playing agents;Monte Carlo tree search algorithms;cross-entropy loss;Games;Linear programming;Standards;Training;Monte Carlo methods;Reinforcement learning;Feature extraction;reinforcement learning;search;self-play},
}