1 parent 7f8b329 commit 1318058
reinforcement_learning/actor_critic.py
@@ -63,7 +63,7 @@ def forward(self, x):
         # critic: evaluates being in the state s_t
         state_values = self.value_head(x)
 
-        # return values for both actor and critic as a tupel of 2 values:
+        # return values for both actor and critic as a tuple of 2 values:
         # 1. a list with the probability of each action over the action space
         # 2. the value from state s_t
         return action_prob, state_values
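
The (action_prob, state_values) tuple returned by forward is typically consumed by sampling an action from the actor's distribution and keeping the critic's value estimate for the loss. The following is a minimal, self-contained sketch of that pattern; the ActorCritic class, its layer sizes, and the fake observation are illustrative assumptions, not the repository's actual code.

    import torch
    import torch.nn as nn
    import torch.nn.functional as F
    from torch.distributions import Categorical

    # Hypothetical two-headed actor-critic module mirroring the structure
    # the diff's comments describe; dimensions are illustrative only.
    class ActorCritic(nn.Module):
        def __init__(self, obs_dim=4, n_actions=2, hidden=128):
            super().__init__()
            self.affine = nn.Linear(obs_dim, hidden)
            self.action_head = nn.Linear(hidden, n_actions)  # actor
            self.value_head = nn.Linear(hidden, 1)            # critic

        def forward(self, x):
            x = F.relu(self.affine(x))
            # actor: probability of each action over the action space
            action_prob = F.softmax(self.action_head(x), dim=-1)
            # critic: value of being in state s_t
            state_values = self.value_head(x)
            # return both as a tuple of 2 values, as in the patched comment
            return action_prob, state_values

    model = ActorCritic()
    state = torch.randn(1, 4)       # fake observation for illustration
    probs, value = model(state)     # unpack the returned tuple
    dist = Categorical(probs)
    action = dist.sample()          # sample an action from the actor
    print(action.item(), value.item())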