Detail ES credits. (#265)

mtrofin · web-flow · commit 94f030b5fb16 · 2023-06-22T12:39:54.000-07:00
diff --git a/compiler_opt/es/blackbox_optimizers.py b/compiler_opt/es/blackbox_optimizers.py
@@ -15,11 +15,35 @@
 
 ###############################################################################
 #
-# This is a port of the work by: Krzysztof Choromanski, Mark Rowland,
-# Vikas Sindhwani, Richard E. Turner, Adrian Weller:  "Structured Evolution
-# with Compact Architectures for Scalable Policy Optimization",
-# https://arxiv.org/abs/1804.02395
 #
+# This is a port of the code by Krzysztof Choromanski, Deepali Jain and Vikas
+# Sindhwani, based on the portfolio of Blackbox optimization algorithms listed
+# below:
+#
+# "On Blackbox Backpropagation and Jacobian Sensing"; K. Choromanski,
+#  V. Sindhwani, NeurIPS 2017
+# "Optimizing Simulations with Noise-Tolerant Structured Exploration"; K.
+#  Choromanski, A. Iscen, V. Sindhwani, J. Tan, E. Coumans, ICRA 2018
+# "Structured Evolution with Compact Architectures for Scalable Policy
+#  Optimization"; K. Choromanski, M. Rowland, V. Sindhwani, R. Turner, A.
+#  Weller, ICML 2018, https://arxiv.org/abs/1804.02395
+#  "From Complexity to Simplicity: Adaptive ES-Active Subspaces for Blackbox
+#   Optimization";  K. Choromanski, A. Pacchiano, J. Parker-Holder, Y. Tang, V.
+#   Sindhwani, NeurIPS 2019
+# "i-Sim2Real: Reinforcement Learning on Robotic Policies in Tight Human-Robot
+#  Interaction Loops"; L. Graesser, D. D'Ambrosio, A. Singh, A. Bewley, D. Jain,
+#  K. Choromanski, P. Sanketi , CoRL 2022, https://arxiv.org/abs/2207.06572
+# "Agile Catching with Whole-Body MPC and Blackbox Policy Learning"; S.
+#  Abeyruwan, A. Bewley, N. Boffi, K. Choromanski, D. D'Ambrosio, D. Jain, P.
+#  Sanketi, A. Shankar, V. Sindhwani, S. Singh, J. Slotine, S. Tu, L4DC,
+#  https://arxiv.org/abs/2306.08205
+# "Robotic Table Tennis: A Case Study into a High Speed Learning System"; A.
+#  Bewley, A. Shankar, A. Iscen, A. Singh, C. Lynch, D. D'Ambrosio, D. Jain,
+#  E. Coumans, G. Versom, G. Kouretas, J. Abelian, J. Boyd, K. Oslund,
+#  K. Reymann, K. Choromanski, L. Graesser, M. Ahn, N. Jaitly, N. Lazic,
+#  P. Sanketi, P. Xu, P. Sermanet, R. Mahjourian, S. Abeyruwan, S. Kataoka,
+#  S. Moore, T. Nguyen, T. Ding, V. Sindhwani, V. Vanhoucke, W. Gao, Y. Kuang,
+#  to be presented at RSS 2023
 ###############################################################################
 r"""Library of blackbox optimization algorithms.
 
diff --git a/compiler_opt/es/blackbox_optimizers_test.py b/compiler_opt/es/blackbox_optimizers_test.py
@@ -15,11 +15,35 @@
 
 ###############################################################################
 #
-# This is a port of the work by: Krzysztof Choromanski, Mark Rowland,
-# Vikas Sindhwani, Richard E. Turner, Adrian Weller:  "Structured Evolution
-# with Compact Architectures for Scalable Policy Optimization",
-# https://arxiv.org/abs/1804.02395
 #
+# This is a port of the code by Krzysztof Choromanski, Deepali Jain and Vikas
+# Sindhwani, based on the portfolio of Blackbox optimization algorithms listed
+# below:
+#
+# "On Blackbox Backpropagation and Jacobian Sensing"; K. Choromanski,
+#  V. Sindhwani, NeurIPS 2017
+# "Optimizing Simulations with Noise-Tolerant Structured Exploration"; K.
+#  Choromanski, A. Iscen, V. Sindhwani, J. Tan, E. Coumans, ICRA 2018
+# "Structured Evolution with Compact Architectures for Scalable Policy
+#  Optimization"; K. Choromanski, M. Rowland, V. Sindhwani, R. Turner, A.
+#  Weller, ICML 2018, https://arxiv.org/abs/1804.02395
+#  "From Complexity to Simplicity: Adaptive ES-Active Subspaces for Blackbox
+#   Optimization";  K. Choromanski, A. Pacchiano, J. Parker-Holder, Y. Tang, V.
+#   Sindhwani, NeurIPS 2019
+# "i-Sim2Real: Reinforcement Learning on Robotic Policies in Tight Human-Robot
+#  Interaction Loops"; L. Graesser, D. D'Ambrosio, A. Singh, A. Bewley, D. Jain,
+#  K. Choromanski, P. Sanketi , CoRL 2022, https://arxiv.org/abs/2207.06572
+# "Agile Catching with Whole-Body MPC and Blackbox Policy Learning"; S.
+#  Abeyruwan, A. Bewley, N. Boffi, K. Choromanski, D. D'Ambrosio, D. Jain, P.
+#  Sanketi, A. Shankar, V. Sindhwani, S. Singh, J. Slotine, S. Tu, L4DC,
+#  https://arxiv.org/abs/2306.08205
+# "Robotic Table Tennis: A Case Study into a High Speed Learning System"; A.
+#  Bewley, A. Shankar, A. Iscen, A. Singh, C. Lynch, D. D'Ambrosio, D. Jain,
+#  E. Coumans, G. Versom, G. Kouretas, J. Abelian, J. Boyd, K. Oslund,
+#  K. Reymann, K. Choromanski, L. Graesser, M. Ahn, N. Jaitly, N. Lazic,
+#  P. Sanketi, P. Xu, P. Sermanet, R. Mahjourian, S. Abeyruwan, S. Kataoka,
+#  S. Moore, T. Nguyen, T. Ding, V. Sindhwani, V. Vanhoucke, W. Gao, Y. Kuang,
+#  to be presented at RSS 2023
 ###############################################################################
 r"""Tests for blackbox_optimization_algorithms."""
 
diff --git a/compiler_opt/es/gradient_ascent_optimization_algorithms.py b/compiler_opt/es/gradient_ascent_optimization_algorithms.py
@@ -15,11 +15,35 @@
 
 ###############################################################################
 #
-# This is a port of the work by: Krzysztof Choromanski, Mark Rowland,
-# Vikas Sindhwani, Richard E. Turner, Adrian Weller:  "Structured Evolution
-# with Compact Architectures for Scalable Policy Optimization",
-# https://arxiv.org/abs/1804.02395
 #
+# This is a port of the code by Krzysztof Choromanski, Deepali Jain and Vikas
+# Sindhwani, based on the portfolio of Blackbox optimization algorithms listed
+# below:
+#
+# "On Blackbox Backpropagation and Jacobian Sensing"; K. Choromanski,
+#  V. Sindhwani, NeurIPS 2017
+# "Optimizing Simulations with Noise-Tolerant Structured Exploration"; K.
+#  Choromanski, A. Iscen, V. Sindhwani, J. Tan, E. Coumans, ICRA 2018
+# "Structured Evolution with Compact Architectures for Scalable Policy
+#  Optimization"; K. Choromanski, M. Rowland, V. Sindhwani, R. Turner, A.
+#  Weller, ICML 2018, https://arxiv.org/abs/1804.02395
+#  "From Complexity to Simplicity: Adaptive ES-Active Subspaces for Blackbox
+#   Optimization";  K. Choromanski, A. Pacchiano, J. Parker-Holder, Y. Tang, V.
+#   Sindhwani, NeurIPS 2019
+# "i-Sim2Real: Reinforcement Learning on Robotic Policies in Tight Human-Robot
+#  Interaction Loops"; L. Graesser, D. D'Ambrosio, A. Singh, A. Bewley, D. Jain,
+#  K. Choromanski, P. Sanketi , CoRL 2022, https://arxiv.org/abs/2207.06572
+# "Agile Catching with Whole-Body MPC and Blackbox Policy Learning"; S.
+#  Abeyruwan, A. Bewley, N. Boffi, K. Choromanski, D. D'Ambrosio, D. Jain, P.
+#  Sanketi, A. Shankar, V. Sindhwani, S. Singh, J. Slotine, S. Tu, L4DC,
+#  https://arxiv.org/abs/2306.08205
+# "Robotic Table Tennis: A Case Study into a High Speed Learning System"; A.
+#  Bewley, A. Shankar, A. Iscen, A. Singh, C. Lynch, D. D'Ambrosio, D. Jain,
+#  E. Coumans, G. Versom, G. Kouretas, J. Abelian, J. Boyd, K. Oslund,
+#  K. Reymann, K. Choromanski, L. Graesser, M. Ahn, N. Jaitly, N. Lazic,
+#  P. Sanketi, P. Xu, P. Sermanet, R. Mahjourian, S. Abeyruwan, S. Kataoka,
+#  S. Moore, T. Nguyen, T. Ding, V. Sindhwani, V. Vanhoucke, W. Gao, Y. Kuang,
+#  to be presented at RSS 2023
 ###############################################################################
 r"""Library of gradient ascent algorithms.
 
diff --git a/compiler_opt/es/gradient_ascent_optimization_algorithms_test.py b/compiler_opt/es/gradient_ascent_optimization_algorithms_test.py
@@ -15,11 +15,35 @@
 
 ###############################################################################
 #
-# This is a port of the work by: Krzysztof Choromanski, Mark Rowland,
-# Vikas Sindhwani, Richard E. Turner, Adrian Weller:  "Structured Evolution
-# with Compact Architectures for Scalable Policy Optimization",
-# https://arxiv.org/abs/1804.02395
 #
+# This is a port of the code by Krzysztof Choromanski, Deepali Jain and Vikas
+# Sindhwani, based on the portfolio of Blackbox optimization algorithms listed
+# below:
+#
+# "On Blackbox Backpropagation and Jacobian Sensing"; K. Choromanski,
+#  V. Sindhwani, NeurIPS 2017
+# "Optimizing Simulations with Noise-Tolerant Structured Exploration"; K.
+#  Choromanski, A. Iscen, V. Sindhwani, J. Tan, E. Coumans, ICRA 2018
+# "Structured Evolution with Compact Architectures for Scalable Policy
+#  Optimization"; K. Choromanski, M. Rowland, V. Sindhwani, R. Turner, A.
+#  Weller, ICML 2018, https://arxiv.org/abs/1804.02395
+#  "From Complexity to Simplicity: Adaptive ES-Active Subspaces for Blackbox
+#   Optimization";  K. Choromanski, A. Pacchiano, J. Parker-Holder, Y. Tang, V.
+#   Sindhwani, NeurIPS 2019
+# "i-Sim2Real: Reinforcement Learning on Robotic Policies in Tight Human-Robot
+#  Interaction Loops"; L. Graesser, D. D'Ambrosio, A. Singh, A. Bewley, D. Jain,
+#  K. Choromanski, P. Sanketi , CoRL 2022, https://arxiv.org/abs/2207.06572
+# "Agile Catching with Whole-Body MPC and Blackbox Policy Learning"; S.
+#  Abeyruwan, A. Bewley, N. Boffi, K. Choromanski, D. D'Ambrosio, D. Jain, P.
+#  Sanketi, A. Shankar, V. Sindhwani, S. Singh, J. Slotine, S. Tu, L4DC,
+#  https://arxiv.org/abs/2306.08205
+# "Robotic Table Tennis: A Case Study into a High Speed Learning System"; A.
+#  Bewley, A. Shankar, A. Iscen, A. Singh, C. Lynch, D. D'Ambrosio, D. Jain,
+#  E. Coumans, G. Versom, G. Kouretas, J. Abelian, J. Boyd, K. Oslund,
+#  K. Reymann, K. Choromanski, L. Graesser, M. Ahn, N. Jaitly, N. Lazic,
+#  P. Sanketi, P. Xu, P. Sermanet, R. Mahjourian, S. Abeyruwan, S. Kataoka,
+#  S. Moore, T. Nguyen, T. Ding, V. Sindhwani, V. Vanhoucke, W. Gao, Y. Kuang,
+#  to be presented at RSS 2023
 ###############################################################################
 r"""Tests for gradient_ascent_optimization_algorithms."""