def sampleEnvironment(self, s, environments, T = 1):
    """Sample one entry of ``environments`` according to its model score.

    The problem ``s`` is encoded with ``self.encodeProblem`` and reshaped
    to a single row, then every candidate is scored with
    ``self.environmentLogLikelihoods``. The scores are divided by ``T``
    and turned into sampling weights with a softmax, from which a single
    index is drawn.

    Args:
        s: Problem description, passed unchanged to ``self.encodeProblem``.
        environments: Indexable collection of candidates; the drawn index
            selects the element that is returned.
        T: Divisor applied to the scores before exponentiation (acts as a
            sampling temperature: larger values flatten the distribution,
            smaller values sharpen it). Must be non-zero.

    Returns:
        The element of ``environments`` at the sampled index.
    """
    problem = self.encodeProblem(s).view(1, -1)
    # NOTE(review): presumably one log-likelihood per environment, in the
    # same order as `environments` -- confirm against
    # environmentLogLikelihoods.
    environmentScores = self.environmentLogLikelihoods(environments, problem)

    # softmax subtracts the per-row maximum before exponentiating, so very
    # negative (or very large) scaled scores no longer underflow to an
    # all-zero weight vector or overflow to inf, either of which makes
    # torch.multinomial raise. The resulting distribution is the same one
    # the plain exp() described, because multinomial normalizes each row.
    distribution = torch.softmax(environmentScores / T, dim=-1)

    # Sampling needs no gradient; detach() replaces the legacy `.data`.
    i = int(torch.multinomial(distribution.detach(), 1)[0])
    return environments[i]
评论列表
文章目录