@@ -73,15 +73,7 @@ @article{plappert:2017
73
73
year ={ 2017}
74
74
}
75
75
76
- @inproceedings {sutton:2000 ,
77
- title ={ Policy gradient methods for reinforcement learning with function approximation} ,
78
- author ={ Sutton, Richard S and McAllester, David A and Singh, Satinder P and Mansour, Yishay} ,
79
- booktitle ={ Advances in neural information processing systems} ,
80
- pages ={ 1057--1063} ,
81
- year ={ 2000}
82
- }
83
-
84
- @incollection {Sutton2000 ,
76
+ @incollection {sutton2000 ,
85
77
title = { Policy Gradient Methods for Reinforcement Learning with Function Approximation} ,
86
78
author = { Sutton, Richard S and David A. McAllester and Satinder P. Singh and Mansour, Yishay} ,
87
79
booktitle = { {Advances in Neural Information Processing Systems 12}} ,
@@ -92,10 +84,19 @@ @incollection{Sutton2000
92
84
}
93
85
94
86
@inproceedings {silver2014deterministic ,
95
- title ={ Deterministic policy gradient algorithms} ,
96
- author ={ Silver, David and Lever, Guy and Heess, Nicolas and Degris, Thomas and Wierstra, Daan and Riedmiller, Martin} ,
97
- booktitle ={ ICML} ,
98
- year ={ 2014}
87
+ title = { Deterministic Policy Gradient Algorithms} ,
88
+ author = { David Silver and Guy Lever and Nicolas Heess and Thomas Degris and Daan Wierstra and Martin Riedmiller} ,
89
+ booktitle = { {Proceedings of the 31st International Conference on Machine Learning}} ,
90
+ pages = { 387--395} ,
91
+ year = { 2014} ,
92
+ editor = { Eric P. Xing and Tony Jebara} ,
93
+ volume = { 32} ,
94
+ number = { 1} ,
95
+ series = { Proceedings of Machine Learning Research} ,
96
+ address = { Beijing, China} ,
97
+ month = { 22--24 Jun} ,
98
+ publisher = { {PMLR}} ,
99
+ url = { http://proceedings.mlr.press/v32/silver14.html} ,
99
100
}
100
101
101
102
@article {schulman:2017 ,
@@ -149,4 +150,4 @@ @inproceedings{paszke2017automatic
149
150
author ={ Paszke, Adam and Gross, Sam and Chintala, Soumith and Chanan, Gregory and Yang, Edward and DeVito, Zachary and Lin, Zeming and Desmaison, Alban and Antiga, Luca and Lerer, Adam} ,
150
151
booktitle ={ NIPS Autodiff Workshop} ,
151
152
year ={ 2017}
152
- }
153
+ }
0 commit comments