File tree 1 file changed +2
-2
lines changed
1 file changed +2
-2
lines changed Original file line number Diff line number Diff line change @@ -130,7 +130,7 @@ def get_nstep_return_data(
130
130
if cum_reward :
131
131
data [i ]['reward' ] = sum ([data [i + j ]['reward' ] * (gamma ** j ) for j in range (nstep )])
132
132
else :
133
- data [i ]['reward' ] = torch .stack ([data [i + j ]['reward' ] for j in range (nstep )], dim = - 1 )
133
+ data [i ]['reward' ] = torch .stack ([data [i + j ]['reward' ] for j in range (nstep )], dim = - 1 )
134
134
data [i ]['done' ] = data [i + nstep - 1 ]['done' ]
135
135
if correct_terminate_gamma :
136
136
data [i ]['value_gamma' ] = gamma ** nstep
@@ -143,7 +143,7 @@ def get_nstep_return_data(
143
143
data [i ]['reward' ] = torch .stack (
144
144
[data [i + j ]['reward' ]
145
145
for j in range (len (data ) - i )] + [fake_reward for _ in range (nstep - (len (data ) - i ))],
146
- dim = - 1
146
+ dim = - 1
147
147
)
148
148
# try:
149
149
# assert len(data[i]['reward']) == 300
You can’t perform that action at this time.
0 commit comments