Skip to content

Commit 94f030b

Browse files
authored
Detail ES credits. (#265)
1 parent f39ca9c commit 94f030b

File tree

4 files changed

+112
-16
lines changed

4 files changed

+112
-16
lines changed

compiler_opt/es/blackbox_optimizers.py

Lines changed: 28 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -15,11 +15,35 @@
1515

1616
###############################################################################
1717
#
18-
# This is a port of the work by: Krzysztof Choromanski, Mark Rowland,
19-
# Vikas Sindhwani, Richard E. Turner, Adrian Weller: "Structured Evolution
20-
# with Compact Architectures for Scalable Policy Optimization",
21-
# https://arxiv.org/abs/1804.02395
2218
#
19+
# This is a port of the code by Krzysztof Choromanski, Deepali Jain and Vikas
20+
# Sindhwani, based on the portfolio of Blackbox optimization algorithms listed
21+
# below:
22+
#
23+
# "On Blackbox Backpropagation and Jacobian Sensing"; K. Choromanski,
24+
# V. Sindhwani, NeurIPS 2017
25+
# "Optimizing Simulations with Noise-Tolerant Structured Exploration"; K.
26+
# Choromanski, A. Iscen, V. Sindhwani, J. Tan, E. Coumans, ICRA 2018
27+
# "Structured Evolution with Compact Architectures for Scalable Policy
28+
# Optimization"; K. Choromanski, M. Rowland, V. Sindhwani, R. Turner, A.
29+
# Weller, ICML 2018, https://arxiv.org/abs/1804.02395
30+
# "From Complexity to Simplicity: Adaptive ES-Active Subspaces for Blackbox
31+
# Optimization"; K. Choromanski, A. Pacchiano, J. Parker-Holder, Y. Tang, V.
32+
# Sindhwani, NeurIPS 2019
33+
# "i-Sim2Real: Reinforcement Learning on Robotic Policies in Tight Human-Robot
34+
# Interaction Loops"; L. Graesser, D. D'Ambrosio, A. Singh, A. Bewley, D. Jain,
35+
# K. Choromanski, P. Sanketi, CoRL 2022, https://arxiv.org/abs/2207.06572
36+
# "Agile Catching with Whole-Body MPC and Blackbox Policy Learning"; S.
37+
# Abeyruwan, A. Bewley, N. Boffi, K. Choromanski, D. D'Ambrosio, D. Jain, P.
38+
# Sanketi, A. Shankar, V. Sindhwani, S. Singh, J. Slotine, S. Tu, L4DC 2023,
39+
# https://arxiv.org/abs/2306.08205
40+
# "Robotic Table Tennis: A Case Study into a High Speed Learning System"; A.
41+
# Bewley, A. Shankar, A. Iscen, A. Singh, C. Lynch, D. D'Ambrosio, D. Jain,
42+
# E. Coumans, G. Vesom, G. Kouretas, J. Abelian, J. Boyd, K. Oslund,
43+
# K. Reymann, K. Choromanski, L. Graesser, M. Ahn, N. Jaitly, N. Lazic,
44+
# P. Sanketi, P. Xu, P. Sermanet, R. Mahjourian, S. Abeyruwan, S. Kataoka,
45+
# S. Moore, T. Nguyen, T. Ding, V. Sindhwani, V. Vanhoucke, W. Gao, Y. Kuang,
46+
# to be presented at RSS 2023
2347
###############################################################################
2448
r"""Library of blackbox optimization algorithms.
2549

compiler_opt/es/blackbox_optimizers_test.py

Lines changed: 28 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -15,11 +15,35 @@
1515

1616
###############################################################################
1717
#
18-
# This is a port of the work by: Krzysztof Choromanski, Mark Rowland,
19-
# Vikas Sindhwani, Richard E. Turner, Adrian Weller: "Structured Evolution
20-
# with Compact Architectures for Scalable Policy Optimization",
21-
# https://arxiv.org/abs/1804.02395
2218
#
19+
# This is a port of the code by Krzysztof Choromanski, Deepali Jain and Vikas
20+
# Sindhwani, based on the portfolio of Blackbox optimization algorithms listed
21+
# below:
22+
#
23+
# "On Blackbox Backpropagation and Jacobian Sensing"; K. Choromanski,
24+
# V. Sindhwani, NeurIPS 2017
25+
# "Optimizing Simulations with Noise-Tolerant Structured Exploration"; K.
26+
# Choromanski, A. Iscen, V. Sindhwani, J. Tan, E. Coumans, ICRA 2018
27+
# "Structured Evolution with Compact Architectures for Scalable Policy
28+
# Optimization"; K. Choromanski, M. Rowland, V. Sindhwani, R. Turner, A.
29+
# Weller, ICML 2018, https://arxiv.org/abs/1804.02395
30+
# "From Complexity to Simplicity: Adaptive ES-Active Subspaces for Blackbox
31+
# Optimization"; K. Choromanski, A. Pacchiano, J. Parker-Holder, Y. Tang, V.
32+
# Sindhwani, NeurIPS 2019
33+
# "i-Sim2Real: Reinforcement Learning on Robotic Policies in Tight Human-Robot
34+
# Interaction Loops"; L. Graesser, D. D'Ambrosio, A. Singh, A. Bewley, D. Jain,
35+
# K. Choromanski, P. Sanketi, CoRL 2022, https://arxiv.org/abs/2207.06572
36+
# "Agile Catching with Whole-Body MPC and Blackbox Policy Learning"; S.
37+
# Abeyruwan, A. Bewley, N. Boffi, K. Choromanski, D. D'Ambrosio, D. Jain, P.
38+
# Sanketi, A. Shankar, V. Sindhwani, S. Singh, J. Slotine, S. Tu, L4DC 2023,
39+
# https://arxiv.org/abs/2306.08205
40+
# "Robotic Table Tennis: A Case Study into a High Speed Learning System"; A.
41+
# Bewley, A. Shankar, A. Iscen, A. Singh, C. Lynch, D. D'Ambrosio, D. Jain,
42+
# E. Coumans, G. Vesom, G. Kouretas, J. Abelian, J. Boyd, K. Oslund,
43+
# K. Reymann, K. Choromanski, L. Graesser, M. Ahn, N. Jaitly, N. Lazic,
44+
# P. Sanketi, P. Xu, P. Sermanet, R. Mahjourian, S. Abeyruwan, S. Kataoka,
45+
# S. Moore, T. Nguyen, T. Ding, V. Sindhwani, V. Vanhoucke, W. Gao, Y. Kuang,
46+
# to be presented at RSS 2023
2347
###############################################################################
2448
r"""Tests for blackbox_optimizers."""
2549

compiler_opt/es/gradient_ascent_optimization_algorithms.py

Lines changed: 28 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -15,11 +15,35 @@
1515

1616
###############################################################################
1717
#
18-
# This is a port of the work by: Krzysztof Choromanski, Mark Rowland,
19-
# Vikas Sindhwani, Richard E. Turner, Adrian Weller: "Structured Evolution
20-
# with Compact Architectures for Scalable Policy Optimization",
21-
# https://arxiv.org/abs/1804.02395
2218
#
19+
# This is a port of the code by Krzysztof Choromanski, Deepali Jain and Vikas
20+
# Sindhwani, based on the portfolio of Blackbox optimization algorithms listed
21+
# below:
22+
#
23+
# "On Blackbox Backpropagation and Jacobian Sensing"; K. Choromanski,
24+
# V. Sindhwani, NeurIPS 2017
25+
# "Optimizing Simulations with Noise-Tolerant Structured Exploration"; K.
26+
# Choromanski, A. Iscen, V. Sindhwani, J. Tan, E. Coumans, ICRA 2018
27+
# "Structured Evolution with Compact Architectures for Scalable Policy
28+
# Optimization"; K. Choromanski, M. Rowland, V. Sindhwani, R. Turner, A.
29+
# Weller, ICML 2018, https://arxiv.org/abs/1804.02395
30+
# "From Complexity to Simplicity: Adaptive ES-Active Subspaces for Blackbox
31+
# Optimization"; K. Choromanski, A. Pacchiano, J. Parker-Holder, Y. Tang, V.
32+
# Sindhwani, NeurIPS 2019
33+
# "i-Sim2Real: Reinforcement Learning on Robotic Policies in Tight Human-Robot
34+
# Interaction Loops"; L. Graesser, D. D'Ambrosio, A. Singh, A. Bewley, D. Jain,
35+
# K. Choromanski, P. Sanketi, CoRL 2022, https://arxiv.org/abs/2207.06572
36+
# "Agile Catching with Whole-Body MPC and Blackbox Policy Learning"; S.
37+
# Abeyruwan, A. Bewley, N. Boffi, K. Choromanski, D. D'Ambrosio, D. Jain, P.
38+
# Sanketi, A. Shankar, V. Sindhwani, S. Singh, J. Slotine, S. Tu, L4DC 2023,
39+
# https://arxiv.org/abs/2306.08205
40+
# "Robotic Table Tennis: A Case Study into a High Speed Learning System"; A.
41+
# Bewley, A. Shankar, A. Iscen, A. Singh, C. Lynch, D. D'Ambrosio, D. Jain,
42+
# E. Coumans, G. Vesom, G. Kouretas, J. Abelian, J. Boyd, K. Oslund,
43+
# K. Reymann, K. Choromanski, L. Graesser, M. Ahn, N. Jaitly, N. Lazic,
44+
# P. Sanketi, P. Xu, P. Sermanet, R. Mahjourian, S. Abeyruwan, S. Kataoka,
45+
# S. Moore, T. Nguyen, T. Ding, V. Sindhwani, V. Vanhoucke, W. Gao, Y. Kuang,
46+
# to be presented at RSS 2023
2347
###############################################################################
2448
r"""Library of gradient ascent algorithms.
2549

compiler_opt/es/gradient_ascent_optimization_algorithms_test.py

Lines changed: 28 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -15,11 +15,35 @@
1515

1616
###############################################################################
1717
#
18-
# This is a port of the work by: Krzysztof Choromanski, Mark Rowland,
19-
# Vikas Sindhwani, Richard E. Turner, Adrian Weller: "Structured Evolution
20-
# with Compact Architectures for Scalable Policy Optimization",
21-
# https://arxiv.org/abs/1804.02395
2218
#
19+
# This is a port of the code by Krzysztof Choromanski, Deepali Jain and Vikas
20+
# Sindhwani, based on the portfolio of Blackbox optimization algorithms listed
21+
# below:
22+
#
23+
# "On Blackbox Backpropagation and Jacobian Sensing"; K. Choromanski,
24+
# V. Sindhwani, NeurIPS 2017
25+
# "Optimizing Simulations with Noise-Tolerant Structured Exploration"; K.
26+
# Choromanski, A. Iscen, V. Sindhwani, J. Tan, E. Coumans, ICRA 2018
27+
# "Structured Evolution with Compact Architectures for Scalable Policy
28+
# Optimization"; K. Choromanski, M. Rowland, V. Sindhwani, R. Turner, A.
29+
# Weller, ICML 2018, https://arxiv.org/abs/1804.02395
30+
# "From Complexity to Simplicity: Adaptive ES-Active Subspaces for Blackbox
31+
# Optimization"; K. Choromanski, A. Pacchiano, J. Parker-Holder, Y. Tang, V.
32+
# Sindhwani, NeurIPS 2019
33+
# "i-Sim2Real: Reinforcement Learning on Robotic Policies in Tight Human-Robot
34+
# Interaction Loops"; L. Graesser, D. D'Ambrosio, A. Singh, A. Bewley, D. Jain,
35+
# K. Choromanski, P. Sanketi, CoRL 2022, https://arxiv.org/abs/2207.06572
36+
# "Agile Catching with Whole-Body MPC and Blackbox Policy Learning"; S.
37+
# Abeyruwan, A. Bewley, N. Boffi, K. Choromanski, D. D'Ambrosio, D. Jain, P.
38+
# Sanketi, A. Shankar, V. Sindhwani, S. Singh, J. Slotine, S. Tu, L4DC 2023,
39+
# https://arxiv.org/abs/2306.08205
40+
# "Robotic Table Tennis: A Case Study into a High Speed Learning System"; A.
41+
# Bewley, A. Shankar, A. Iscen, A. Singh, C. Lynch, D. D'Ambrosio, D. Jain,
42+
# E. Coumans, G. Vesom, G. Kouretas, J. Abelian, J. Boyd, K. Oslund,
43+
# K. Reymann, K. Choromanski, L. Graesser, M. Ahn, N. Jaitly, N. Lazic,
44+
# P. Sanketi, P. Xu, P. Sermanet, R. Mahjourian, S. Abeyruwan, S. Kataoka,
45+
# S. Moore, T. Nguyen, T. Ding, V. Sindhwani, V. Vanhoucke, W. Gao, Y. Kuang,
46+
# to be presented at RSS 2023
2347
###############################################################################
2448
r"""Tests for gradient_ascent_optimization_algorithms."""
2549

0 commit comments

Comments
 (0)