From 56e2c2bda943616ea755b144cdace61126a53b35 Mon Sep 17 00:00:00 2001 From: vmoens Date: Mon, 27 Mar 2023 18:33:11 +0100 Subject: [PATCH] init --- intermediate_source/reinforcement_ppo.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/intermediate_source/reinforcement_ppo.py b/intermediate_source/reinforcement_ppo.py index 6b0e8522f8d..8dee73969db 100644 --- a/intermediate_source/reinforcement_ppo.py +++ b/intermediate_source/reinforcement_ppo.py @@ -604,7 +604,7 @@ data_view = tensordict_data.reshape(-1) replay_buffer.extend(data_view.cpu()) for _ in range(frames_per_batch // sub_batch_size): - subdata, *_ = replay_buffer.sample(sub_batch_size) + subdata = replay_buffer.sample(sub_batch_size) loss_vals = loss_module(subdata.to(device)) loss_value = ( loss_vals["loss_objective"]