We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 70a08d4, commit 28d2536 (Copy full SHA for 28d2536)
contents/2_Q_Learning_maze/RL_brain.py
@@ -24,7 +24,7 @@ def choose_action(self, observation):
24
# choose best action
25
state_action = self.q_table.ix[observation, :]
26
state_action = state_action.reindex(np.random.permutation(state_action.index)) # some actions have the same value
27
- action = state_action.argmax()
+ action = state_action.idxmax()
28
else:
29
# choose random action
30
action = np.random.choice(self.actions)
0 commit comments