Skip to content

Commit e244f77

Browse files
committed
bugfix and update tests
1 parent 8b5252b commit e244f77

File tree

2 files changed

+4
-4
lines changed

2 files changed

+4
-4
lines changed

src/Utils/policy.jl

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -88,12 +88,12 @@ function evaluate_policy!(
8888
policy, envs::Vector{<:AbstractEnvironment}, episodes::Int=1; kwargs...
8989
)
9090
E = length(envs)
91-
rewards = zeros(Float64, E)
91+
avg_rewards = zeros(Float64, E)
9292
datasets = map(1:E) do e
9393
rewards, datasets = evaluate_policy!(policy, envs[e], episodes; kwargs...)
94-
rewards[e] = sum(reward) / episodes
94+
avg_rewards[e] = sum(rewards) / episodes
9595
dataset = vcat(datasets...)
9696
return dataset
9797
end
98-
return rewards, vcat(datasets...)
98+
return avg_rewards, vcat(datasets...)
9999
end

test/dynamic_vsp.jl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -45,7 +45,7 @@
4545
θ2 = model2(x2)
4646
y2 = maximizer(θ2; instance=instance2)
4747
@test size(x, 1) == 2
48-
@test size(x2, 1) == 14
48+
@test size(x2, 1) == 27
4949

5050
anticipative_value, solution = generate_anticipative_solution(b, env; reset_env=true)
5151
reset!(env; reset_rng=true)

0 commit comments

Comments
 (0)