Test without partialnt

HenriDeh · HenriDeh · commit ca511f7d3e30 · 2023-07-06T17:26:55.000+02:00
diff --git a/test/episodes.jl b/test/episodes.jl
@@ -4,16 +4,16 @@ using Test
 @testset "EpisodesBuffer" begin
     @testset "with circular traces" begin 
         eb = EpisodesBuffer(
-            CircularArraySARSATTraces(;
+            CircularArraySARTTraces(;
             capacity=10)
         )
         #push a first episode l=5 
-        push!(eb, (state = 1, action = 1))
+        push!(eb, (state = 1,))
         @test eb.sampleable_inds[end] == 0
         @test eb.episodes_lengths[end] == 0
         @test eb.step_numbers[end] == 1
         for i = 1:5
-            push!(eb, (state = i+1, action =i+1, reward = i, terminal = false))
+            push!(eb, (state = i+1, action =i, reward = i, terminal = false))
             @test eb.sampleable_inds[end] == 0
             @test eb.sampleable_inds[end-1] == 1
             @test eb.step_numbers[end] == i + 1
@@ -22,7 +22,7 @@ using Test
         @test eb.sampleable_inds == [1,1,1,1,1,0]
         @test length(eb.traces) == 5
         #start new episode of 6 periods.
-        push!(eb, (state = 7, action = 7))
+        push!(eb, (state = 7,))
         @test eb.sampleable_inds[end] == 0
         @test eb.sampleable_inds[end-1] == 0
         @test eb.episodes_lengths[end] == 0
@@ -32,7 +32,7 @@ using Test
         ep2_len = 0
         for (j,i) = enumerate(8:11)
             ep2_len += 1
-            push!(eb, (state = i, action =i, reward = i-1, terminal = false))
+            push!(eb, (state = i, action =i-1, reward = i-1, terminal = false))
             @test eb.sampleable_inds[end] == 0
             @test eb.sampleable_inds[end-1] == 1
             @test eb.step_numbers[end] == j + 1
@@ -43,7 +43,7 @@ using Test
         #three last steps replace oldest steps in the buffer.
         for (i, s) = enumerate(12:13)
             ep2_len += 1
-            push!(eb, (state = s, action =s, reward = s-1, terminal = false))
+            push!(eb, (state = s, action =s-1, reward = s-1, terminal = false))
             @test eb.sampleable_inds[end] == 0
             @test eb.sampleable_inds[end-1] == 1
             @test eb.step_numbers[end] == i + 1 + 4
@@ -59,18 +59,18 @@ using Test
             end
             b = eb[i]
             @test b[:state] == b[:action] == b[:reward] == s
-            @test b[:next_state] == b[:next_action] == s + 1
+            @test b[:next_state] == s + 1
         end
         #episode 2
         #start a third episode
-        push!(eb, (state = 14, action = 14))
+        push!(eb, (state = 14, ))
         @test eb.sampleable_inds[end] == 0
         @test eb.sampleable_inds[end-1] == 0
         @test eb.episodes_lengths[end] == 0
         @test eb.step_numbers[end] == 1
         #push until it reaches it own start
         for (i,s) in enumerate(15:26)
-            push!(eb, (state = s, action =s, reward = s-1, terminal = false))
+            push!(eb, (state = s, action =s-1, reward = s-1, terminal = false))
         end
         @test eb.sampleable_inds == [fill(true, 10); [false]]
         @test eb.episodes_lengths == fill(length(15:26), 11)