|
| 1 | +@misc{docker, |
| 2 | + title = {What is {Docker}}, |
| 3 | + howpublished = {\url{https://www.docker.com/what-docker}}, |
| 4 | + author = {{Docker Inc}}, |
| 5 | + note = {Accessed: 2018-04-20} |
| 6 | +} |
| 7 | + |
| 8 | +@misc{criu, |
| 9 | + title = {{CRIU}}, |
| 10 | + howpublished = {\url{http://criu.org}}, |
| 11 | + author = {{criu.org}}, |
| 12 | + note = {Accessed: 2018-04-20} |
| 13 | +} |
| 14 | + |
| 15 | +@misc{clickcli, |
| 16 | + title = {Click}, |
| 17 | + howpublished = {\url{http://click.pocoo.org/5/}}, |
| 18 | + author = {Ronacher, Armin}, |
| 19 | + note = {Accessed: 2018-04-22} |
| 20 | +} |
| 21 | + |
1 | 22 |
|
2 | 23 | @misc{GoogleColabOnline2018, |
3 | 24 | title = {Google Colab Introduction}, |
@@ -405,6 +426,14 @@ @article{ketter2018powertac |
405 | 426 | journal = {ERIM Report Series Reference No. 2017-016-LIS} |
406 | 427 | } |
407 | 428 |
|
| 429 | +@article{schmitt2018kickstarting, |
| 430 | + author = {Schmitt, Simon and Hudson, Jonathan J and Zidek, Augustin and Osindero, Simon and Doersch, Carl and Czarnecki, Wojciech M and Leibo, Joel Z and Kuttler, Heinrich and Zisserman, Andrew and Simonyan, Karen and others}, |
| 431 | + title = {Kickstarting Deep Reinforcement Learning}, |
| 432 | + year = {2018}, |
| 433 | + journal = {arXiv preprint arXiv:1803.03835}, |
| 434 | +} |
| 435 | + |
| 436 | + |
408 | 437 | @article{abbeel2010autonomous, |
409 | 438 | title = {Autonomous helicopter aerobatics through apprenticeship learning}, |
410 | 439 | author = {Abbeel, Pieter and Coates, Adam and Ng, Andrew Y}, |
@@ -452,3 +481,60 @@ @article{EvalGRU2014 |
452 | 481 | bibsource = {dblp computer science bibliography, https://dblp.org} |
453 | 482 | } |
454 | 483 |
|
| 484 | +@inproceedings{mnih2016asynchronous, |
| 485 | + author = {Mnih, Volodymyr and Badia, Adria Puigdomenech and Mirza, Mehdi and Graves, Alex and Lillicrap, Timothy and Harley, Tim and Silver, David and Kavukcuoglu, Koray}, |
| 486 | + title = {Asynchronous methods for deep reinforcement learning}, |
| 487 | + year = {2016}, |
| 488 | + booktitle = {International Conference on Machine Learning}, |
| 489 | + pages = {1928--1937}, |
| 490 | +} |
| 491 | + |
| 492 | +@article{arulkumaran2017brief, |
| 493 | + author = {Arulkumaran, Kai and Deisenroth, Marc Peter and Brundage, Miles and Bharath, Anil Anthony}, |
| 494 | + title = {A brief survey of deep reinforcement learning}, |
| 495 | + year = {2017}, |
| 496 | + journal = {arXiv preprint arXiv:1708.05866}, |
| 497 | +} |
| 498 | + |
| 499 | +@article{brockman2016openai, |
| 500 | + title = {{OpenAI} {Gym}}, |
| 501 | + author = {Brockman, Greg and Cheung, Vicki and Pettersson, Ludwig and Schneider, Jonas and Schulman, John and Tang, Jie and Zaremba, Wojciech}, |
| 502 | + journal = {arXiv preprint arXiv:1606.01540}, |
| 503 | + year = {2016} |
| 504 | +} |
| 505 | + |
| 506 | +@article{matiisen2017teacher, |
| 507 | + author = {Matiisen, Tambet and Oliver, Avital and Cohen, Taco and Schulman, John}, |
| 508 | + title = {Teacher-Student Curriculum Learning}, |
| 509 | + year = {2017}, |
| 510 | + journal = {arXiv preprint arXiv:1707.00183}, |
| 511 | +} |
| 512 | + |
| 513 | +@article{silver2016mastering, |
| 514 | + title = {Mastering the game of {Go} with deep neural networks and tree search}, |
| 515 | + author = {Silver, David and Huang, Aja and Maddison, Chris J and Guez, Arthur and Sifre, Laurent and Van Den Driessche, George and Schrittwieser, Julian and Antonoglou, Ioannis and Panneershelvam, Veda and Lanctot, Marc and others}, |
| 516 | + journal = {Nature}, |
| 517 | + volume = {529}, |
| 518 | + number = {7587}, |
| 519 | + pages = {484--489}, |
| 520 | + year = {2016}, |
| 521 | + publisher = {Nature Research} |
| 522 | +} |
| 523 | + |
| 524 | +@misc{baselines, |
| 525 | + author = {Dhariwal, Prafulla and Hesse, Christopher and Klimov, Oleg and Nichol, Alex and Plappert, Matthias and Radford, Alec and Schulman, John and Sidor, Szymon and Wu, Yuhuai}, |
| 526 | + title = {{OpenAI} {Baselines}}, |
| 527 | + year = {2017}, |
| 528 | + publisher = {GitHub}, |
| 529 | + journal = {GitHub repository}, |
| 530 | + howpublished = {\url{https://github.com/openai/baselines}}, |
| 531 | +} |
| 532 | + |
| 533 | +@misc{plappert2016kerasrl, |
| 534 | + author = {Plappert, Matthias}, |
| 535 | + title = {{keras-rl}}, |
| 536 | + year = {2016}, |
| 537 | + publisher = {GitHub}, |
| 538 | + journal = {GitHub repository}, |
| 539 | + howpublished = {\url{https://github.com/keras-rl/keras-rl}}, |
| 540 | +} |
0 commit comments