def max(self):
    """Return the Q-values selected by the greedy actions.

    Picks entries out of ``self.q_values`` using ``self.greedy_actions``
    as the indices, via ``F.select_item``.

    The selection is performed inside ``chainer.force_backprop_mode()``,
    which re-enables back-propagation for the enclosed call even when the
    caller is running under ``chainer.no_backprop_mode()``.

    NOTE(review): ``F`` is presumably ``chainer.functions``, in which case
    ``q_values`` would be (batch, n_actions) and the result one value per
    batch row -- confirm against the module imports and the class.

    Returns:
        Whatever ``F.select_item(self.q_values, self.greedy_actions)``
        returns.
    """
    # Bind the result first and return after the context exits; this is
    # equivalent to returning from inside the ``with`` block.
    with chainer.force_backprop_mode():
        best_q = F.select_item(self.q_values, self.greedy_actions)
    return best_q