diff --git a/intermediate_source/reinforcement_q_learning.py b/intermediate_source/reinforcement_q_learning.py
index 1522db24bc1..61e374a8b21 100644
--- a/intermediate_source/reinforcement_q_learning.py
+++ b/intermediate_source/reinforcement_q_learning.py
@@ -150,7 +150,7 @@ def __len__(self):
 # rewards from the uncertain far future less important for our agent
 # than the ones in the near future that it can be fairly confident
 # about. It also encourages agents to collect reward closer in time
-# than equivalent rewards temporally future away.
+# than equivalent rewards that are temporally far away in the future.
 #
 # The main idea behind Q-learning is that if we had a function
 # :math:`Q^*: State \times Action \rightarrow \mathbb{R}`, that could tell