Skip to content

Commit e036f63

Browse files
committed
rename to action_log_prob
1 parent a6c092e commit e036f63

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

src/ReinforcementLearningZoo/src/algorithms/bootstrapping/retrace.jl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ export retrace
77
function retrace_operator(qnetwork, policy, batch, γ, λ)
88
s = batch[:state] |> send_to_device(qnetwork)
99
a = batch[:action] |> send_to_device(qnetwork)
10-
behavior_log_probs = batch[:log_prob] |> send_to_device(qnetwork)
10+
behavior_log_probs = batch[:action_log_prob] |> send_to_device(qnetwork)
1111
r = batch[:reward] |> send_to_device(qnetwork)
1212
t = last.(batch[:terminal]) |> send_to_device(qnetwork)
1313
ns = batch[:next_state] |> send_to_device(qnetwork)

src/ReinforcementLearningZoo/test/operators.jl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ import ReinforcementLearningCore
22
@testset "retrace" begin
33
batch = (state= [[1 2 3], [10 11 12]],
44
action = [[1 2 3],[10 11 12]],
5-
log_prob = [log.([0.2,0.2,0.2]), log.([0.1,0.1,0.1])],
5+
action_log_prob = [log.([0.2,0.2,0.2]), log.([0.1,0.1,0.1])],
66
reward = [[1f0,2f0,3f0],[10f0,11f0,12f0]],
77
terminal= [[0,0,1], [0,0,0]],
88
next_state = [[2 3 4],[11 12 13]])

0 commit comments

Comments
 (0)