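Changed argmax to idxmax in choose_action so the best action is taken as the index label of the maximum Q-value (Series.argmax was deprecated in pandas 0.21 in favor of idxmax).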

hiroyachiba · hiroyachiba · commit 28d25366eb5e · 2017-12-02T15:31:38.000+09:00
diff --git a/contents/2_Q_Learning_maze/RL_brain.py b/contents/2_Q_Learning_maze/RL_brain.py
@@ -24,7 +24,7 @@ def choose_action(self, observation):
             # choose best action
             state_action = self.q_table.ix[observation, :]
             state_action = state_action.reindex(np.random.permutation(state_action.index))     # some actions have same value
-            action = state_action.argmax()
+            action = state_action.idxmax()
         else:
             # choose random action
             action = np.random.choice(self.actions)