diff --git a/notebooks/unit2/unit2.ipynb b/notebooks/unit2/unit2.ipynb index 2fd2530..2ff7a9d 100644 --- a/notebooks/unit2/unit2.ipynb +++ b/notebooks/unit2/unit2.ipynb @@ -695,9 +695,9 @@ "source": [ "def epsilon_greedy_policy(Qtable, state, epsilon):\n", " # Randomly generate a number between 0 and 1\n", - " random_int = random.uniform(0,1)\n", - " # if random_int > greater than epsilon --> exploitation\n", - " if random_int > epsilon:\n", + " random_num = random.uniform(0,1)\n", + " # if random_num > greater than epsilon --> exploitation\n", + " if random_num > epsilon:\n", " # Take the action with the highest value given a state\n", " # np.argmax can be useful here\n", " action = greedy_policy(Qtable, state)\n", diff --git a/units/en/unit2/hands-on.mdx b/units/en/unit2/hands-on.mdx index f8dd666..e3f3212 100644 --- a/units/en/unit2/hands-on.mdx +++ b/units/en/unit2/hands-on.mdx @@ -388,9 +388,9 @@ def epsilon_greedy_policy(Qtable, state, epsilon): ```python def epsilon_greedy_policy(Qtable, state, epsilon): # Randomly generate a number between 0 and 1 - random_int = random.uniform(0, 1) - # if random_int > greater than epsilon --> exploitation - if random_int > epsilon: + random_num = random.uniform(0, 1) + # if random_num > greater than epsilon --> exploitation + if random_num > epsilon: # Take the action with the highest value given a state # np.argmax can be useful here action = greedy_policy(Qtable, state)