% arXiv preprint record (DBLP "CoRR" entry, exported through BibSonomy).
% The title is stored without a trailing period: the bibliography style
% supplies its own punctuation. The eprint/archiveprefix pair carries the
% arXiv identifier for styles that understand it; journal/volume are kept
% in DBLP's CoRR form so styles that ignore eprint fields still render it.
@article{journals/corr/abs-1807-01672,
  added-at      = {2021-10-14T00:00:00.000+0200},
  archiveprefix = {arXiv},
  author        = {Laterre, Alexandre and Fu, Yunguan and Jabri, Mohamed Khalil and Cohen, Alain-Sam and Kas, David and Hajjar, Karl and Dahl, Torbjorn S. and Kerkeni, Amine and Beguir, Karim},
  biburl        = {https://www.bibsonomy.org/bibtex/235e0ccd9254196bfc09de092a1199e6f/dblp},
  ee            = {http://arxiv.org/abs/1807.01672},
  eprint        = {1807.01672},
  interhash     = {3bb8b6cafc78a3c141152a9c8205b68a},
  intrahash     = {35e0ccd9254196bfc09de092a1199e6f},
  journal       = {CoRR},
  keywords      = {dblp},
  timestamp     = {2024-04-08T22:46:11.000+0200},
  title         = {Ranked Reward: Enabling Self-Play Reinforcement Learning for Combinatorial Optimization},
  url           = {http://dblp.uni-trier.de/db/journals/corr/corr1807.html#abs-1807-01672},
  volume        = {abs/1807.01672},
  year          = 2018
}