diff --git a/intermediate_source/reinforcement_q_learning.py b/intermediate_source/reinforcement_q_learning.py index 4ac542f4644..e36db61c6eb 100644 --- a/intermediate_source/reinforcement_q_learning.py +++ b/intermediate_source/reinforcement_q_learning.py @@ -403,7 +403,7 @@ def optimize_model(): num_episodes = 50 for i_episode in range(num_episodes): - # Initialize the environment and get it's state + # Initialize the environment and get its state state, info = env.reset() state = torch.tensor(state, dtype=torch.float32, device=device).unsqueeze(0) for t in count():