|
97 | 97 | ] |
98 | 98 | } |
99 | 99 | }, |
100 | | - "lunar_double_dqn_per": { |
101 | | - "problem": "LunarLander-v2", |
102 | | - "Agent": "DoubleDQN", |
103 | | - "HyperOptimizer": "GridSearch", |
104 | | - "Memory": "PrioritizedExperienceReplay", |
105 | | - "Optimizer": "AdamOptimizer", |
106 | | - "Policy": "DoubleDQNBoltzmannPolicy", |
107 | | - "PreProcessor": "StackStates", |
108 | | - "param": { |
109 | | - "train_per_n_new_exp": 2, |
110 | | - "lr": 0.005, |
111 | | - "gamma": 0.99, |
112 | | - "hidden_layers": [800, 400], |
113 | | - "hidden_layers_activation": "sigmoid", |
114 | | - "output_layer_activation": "linear", |
115 | | - "exploration_anneal_episodes": 150, |
116 | | - "epi_change_lr": 200, |
117 | | - "max_mem_len": 30000 |
118 | | - }, |
119 | | - "param_range": { |
120 | | - "lr": [0.001, 0.005, 0.01], |
121 | | - "gamma": [0.97, 0.99, 0.999], |
122 | | - "hidden_layers": [ |
123 | | - [400, 200], |
124 | | - [800, 400], |
125 | | - [400, 200, 100] |
126 | | - ] |
127 | | - } |
128 | | - }, |
129 | 100 | "lunar_double_dqn_nopreprocess": { |
130 | 101 | "problem": "LunarLander-v2", |
131 | 102 | "Agent": "DoubleDQN", |
|
266 | 237 | ] |
267 | 238 | } |
268 | 239 | }, |
269 | | - "lunar_ddpg_linearnoise": { |
| 240 | + "lunar_cont_ddpg_per_linearnoise": { |
270 | 241 | "problem": "LunarLanderContinuous-v2", |
271 | 242 | "Agent": "DDPG", |
272 | 243 | "HyperOptimizer": "GridSearch", |
273 | | - "Memory": "LinearMemoryWithForgetting", |
| 244 | + "Memory": "PrioritizedExperienceReplay", |
274 | 245 | "Optimizer": "AdamOptimizer", |
275 | 246 | "Policy": "LinearNoisePolicy", |
276 | 247 | "PreProcessor": "NoPreProcessor", |
|
327 | 298 | [800, 400, 200] |
328 | 299 | ] |
329 | 300 | } |
| 301 | + }, |
| 302 | + "walker_ddpg_per_linearnoise": { |
| 303 | + "problem": "BipedalWalker-v2", |
| 304 | + "Agent": "DDPG", |
| 305 | + "HyperOptimizer": "GridSearch", |
| 306 | + "Memory": "PrioritizedExperienceReplay", |
| 307 | + "Optimizer": "AdamOptimizer", |
| 308 | + "Policy": "LinearNoisePolicy", |
| 309 | + "PreProcessor": "NoPreProcessor", |
| 310 | + "param": { |
| 311 | + "batch_size": 64, |
| 312 | + "n_epoch": 1, |
| 313 | + "tau": 0.005, |
| 314 | + "lr": 0.0005, |
| 315 | + "critic_lr": 0.001, |
| 316 | + "gamma": 0.97, |
| 317 | + "hidden_layers": [400, 200], |
| 318 | + "hidden_layers_activation": "relu", |
| 319 | + "output_layer_activation": "tanh" |
| 320 | + }, |
| 321 | + "param_range": { |
| 322 | + "lr": [0.0001, 0.0005], |
| 323 | + "critic_lr": [0.001, 0.005], |
| 324 | + "gamma": [0.95, 0.97, 0.99], |
| 325 | + "hidden_layers": [ |
| 326 | + [200, 100], |
| 327 | + [400, 300], |
| 328 | + [800, 400] |
| 329 | + ] |
| 330 | + } |
330 | 331 | } |
331 | 332 | } |
0 commit comments