def get_greedy_action(Q, obs):
    """Return the index of the largest value ``Q`` produces for ``obs``.

    Args:
        Q: Callable that exposes an ``xp`` array-module attribute and, when
            called on an array, returns an object whose ``.data`` can be
            indexed (presumably a Chainer link returning a ``Variable`` --
            confirm against the caller).
        obs: A single observation; anything ``xp.asarray`` accepts.

    Returns:
        The argmax over the first row of ``Q``'s output, as a plain ``int``.
    """
    backend = Q.xp

    # Cast to float32, then prepend a length-1 axis so Q receives the
    # observation with one extra leading dimension.
    as_float = backend.asarray(obs, dtype=np.float32)
    batched = backend.expand_dims(as_float, 0)

    # Evaluate Q with backprop mode disabled; only the values are needed.
    with chainer.no_backprop_mode():
        output = Q(batched)
        action_values = output.data[0]

    best = backend.argmax(action_values)
    return int(best)