Shuffle legal actions

......@@ -81,7 +81,7 @@ class QLearningAgent(ReinforcementAgent):
if len(legalActions) == 0:
return None
# Shuffle so that ties among the highest-valued actions are broken randomly
# random.shuffle(legalActions)
qValues = [self.getQValue(state, action) for action in legalActions]
maxQ = qValues[0]
maxAction = 0
