# Pick the value used for the successor state: 0. when `absorbing` is truthy,
# otherwise the largest entry of self.Q along the `next_state` row.
# NOTE(review): presumably the bootstrap term of a Q-learning style update,
# where an absorbing (terminal) state has no future value -- confirm against
# the surrounding method.
if absorbing:
    max_q_cur = 0.
else:
    max_q_cur = np.max(self.Q[next_state, :])