Skip to content

Commit ca28b7e

Browse files
committed
Find that a state-specific std is better than a parameter-only std for PPO
1 parent b7e6353 commit ca28b7e

File tree

3 files changed

+3
-3
lines changed

3 files changed

+3
-3
lines changed

ppo_gae_continuous.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -12,8 +12,8 @@
1212
gamma = 0.99
1313
lmbda = 0.95
1414
eps_clip = 0.1
15-
batch_size = 4096
16-
K_epoch = 20
15+
batch_size = 1280
16+
K_epoch = 10
1717
T_horizon = 10000
1818

1919
class NormalizedActions(gym.ActionWrapper):
@@ -50,7 +50,7 @@ def __init__(self, num_inputs, num_actions, hidden_size, action_range = 1.):
5050

5151
self.mean_linear = nn.Linear(hidden_size, num_actions)
5252
self.log_std_linear = nn.Linear(hidden_size, num_actions)
53-
# self.log_std_param = nn.Parameter(torch.zeros(num_actions))
53+
# self.log_std_param = nn.Parameter(torch.zeros(num_actions, requires_grad=True))
5454

5555
self.v_linear = nn.Linear(hidden_size, 1)
5656

sac.png

-47.3 KB
Binary file not shown.

sac_v2.png

-66.3 KB
Binary file not shown.

0 commit comments

Comments
 (0)