def __init__(self, model, optimizer,
gpu=None,
gamma=0.99,
lambd=0.95,
phi=lambda x: x,
value_func_coef=1.0,
entropy_coef=0.01,
update_interval=2048,
minibatch_size=64,
epochs=10,
clip_eps=0.2,
clip_eps_vf=None,
standardize_advantages=True,
average_v_decay=0.999, average_loss_decay=0.99,
):
self.model = model
if gpu is not None and gpu >= 0:
cuda.get_device_from_id(gpu).use()
self.model.to_gpu(device=gpu)
self.optimizer = optimizer
self.gamma = gamma
self.lambd = lambd
self.phi = phi
self.value_func_coef = value_func_coef
self.entropy_coef = entropy_coef
self.update_interval = update_interval
self.minibatch_size = minibatch_size
self.epochs = epochs
self.clip_eps = clip_eps
self.clip_eps_vf = clip_eps_vf
self.standardize_advantages = standardize_advantages
self.average_v = 0
self.average_v_decay = average_v_decay
self.average_loss_policy = 0
self.average_loss_value_func = 0
self.average_loss_entropy = 0
self.average_loss_decay = average_loss_decay
self.xp = self.model.xp
self.last_state = None
self.memory = []
self.last_episode = []
评论列表
文章目录