# Value taken from the next state: 0.0 when `absorbing` is truthy, otherwise
# the maximum of self.Q[next_state, :].
# NOTE(review): presumably the greedy bootstrap term of a Q-learning style
# update, with absorbing (terminal) states contributing nothing - confirm.
q_next = 0.0 if absorbing else np.max(self.Q[next_state, :])