def __init__(self, num_actions, discount, exploration_prob, step_size, logging=True):
    """Set up the agent's hyperparameters, weight table, logger, and history.

    Args:
        num_actions: Size of the action set; actions are the integers
            produced by ``range(num_actions)``.
        discount: Stored as ``self.discount`` (presumably the reward
            discount factor -- confirm against the update rule).
        exploration_prob: Stored as ``self.exploration_prob`` (presumably
            the probability of taking a random action -- confirm against
            the action-selection code).
        step_size: Stored as ``self.step_size`` (presumably the learning
            rate -- confirm against the update rule).
        logging: Forwarded unchanged to ``logger.Logger``. Note that this
            parameter shadows the stdlib ``logging`` module inside this
            method.
    """
    # Hyperparameters are kept exactly as supplied by the caller.
    self.step_size = step_size
    self.exploration_prob = exploration_prob
    self.discount = discount

    # Action set and iteration counter (the counter starts at 1, not 0).
    self.actions = range(num_actions)
    self.num_iters = 1

    # A Counter yields 0 for any key that has not been written yet.
    self.weights = collections.Counter()

    # No previous transition has been observed yet.
    self.prev_state = self.prev_action = None

    self.logger = logger.Logger(agent_name='QLearningAgent', logging=logging)
评论列表
文章目录