Skip to content

Commit bc82c3f

Browse files
authored
Update tutorial_atari_pong.py
1 parent 302a435 commit bc82c3f

File tree

1 file changed

+6
-8
lines changed

1 file changed

+6
-8
lines changed

example/tutorial_atari_pong.py

Lines changed: 6 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -93,17 +93,17 @@ def prepro(I):
9393

9494
prob = sess.run(
9595
sampling_prob,
96-
feed_dict={t_states: x}
97-
)
96+
feed_dict={t_states: x})
97+
9898
# action. 1: STOP 2: UP 3: DOWN
9999
# action = np.random.choice([1,2,3], p=prob.flatten())
100100
action = tl.rein.choice_action_by_probs(prob.flatten(), [1,2,3])
101101

102102
observation, reward, done, _ = env.step(action)
103103
reward_sum += reward
104-
xs.append(x) # all observations in a episode
105-
ys.append(action - 1) # all fake labels in a episode (action begins from 1, so minus 1)
106-
rs.append(reward) # all rewards in a episode
104+
xs.append(x) # all observations in an episode
105+
ys.append(action - 1) # all fake labels in an episode (action begins from 1, so minus 1)
106+
rs.append(reward) # all rewards in an episode
107107

108108
if done:
109109
episode_number += 1
@@ -125,9 +125,7 @@ def prepro(I):
125125
feed_dict={
126126
t_states: epx,
127127
t_actions: epy,
128-
t_discount_rewards: disR
129-
}
130-
)
128+
t_discount_rewards: disR})
131129

132130
if episode_number % (batch_size * 100) == 0:
133131
tl.files.save_npz(network.all_params, name=model_file_name+'.npz')

0 commit comments

Comments
 (0)