def update_one_gpu(self, param, state):
    """Update one parameter and its velocity in place with a GPU kernel.

    Builds an elementwise kernel named ``nesterov_ag`` through
    ``cuda.elementwise`` and invokes it on the parameter's gradient, the
    optimizer's ``lr`` and ``momentum``, the parameter's data and the
    velocity stored under ``state['v']``.

    Per element, the kernel source performs::

        v     = v * momentum - lr * grad
        param = param + momentum * momentum * v - (1 + momentum) * lr * grad

    Args:
        param: Object exposing ``grad`` and ``data`` attributes, both of
            which are handed to the kernel.
        state: Mapping whose ``'v'`` entry is handed to the kernel as the
            velocity buffer.

    Returns:
        None.
    """
    # NOTE(review): the first signature string presumably declares the
    # read-only inputs and the second the arrays written by the kernel --
    # confirm against the ``cuda.elementwise`` helper in use.
    in_signature = 'T grad, T lr, T momentum'
    out_signature = 'T param, T v'

    # The velocity is refreshed first, so the parameter step on the second
    # statement already sees the new ``v``.
    kernel_source = '''v = v * momentum - lr * grad;
param += momentum * momentum * v - (1 + momentum) * lr * grad;
'''

    kernel = cuda.elementwise(
        in_signature, out_signature, kernel_source, 'nesterov_ag')
    kernel(param.grad, self.lr, self.momentum, param.data, state['v'])
评论列表
文章目录