def pi_and_v(self, state):
    """Evaluate both ``self.pi`` and ``self.v`` on the same input.

    When ``self.normalize_obs`` is truthy, ``state`` is first passed
    through ``self.obs_filter`` with ``update=False`` and the result is
    clipped to the closed range [-5.0, 5.0] with ``F.clip``. Otherwise
    ``state`` is forwarded untouched.

    Args:
        state: Input handed to the filter (if enabled) and then to
            ``self.pi`` and ``self.v``.

    Returns:
        A 2-tuple ``(self.pi(state), self.v(state))`` computed on the
        (possibly filtered and clipped) state.
    """
    # NOTE(review): ``F`` is defined outside this block -- presumably
    # ``chainer.functions``; confirm against the file's imports.
    if self.normalize_obs:
        # update=False is passed through to the filter as-is; presumably
        # it leaves the filter's statistics unchanged -- verify.
        filtered = self.obs_filter(state, update=False)
        state = F.clip(filtered, -5.0, 5.0)

    # Keep the original evaluation order: pi first, then v.
    pi_out = self.pi(state)
    v_out = self.v(state)
    return pi_out, v_out