def init_common(self):
    """Initialize the variables common to training and testing.

    Resets the step counters, the bookkeeping lists, the fields describing
    the current transition and the mode flags, then stores one merged
    summary op on this object and on both ``q_train`` and ``q_target``.

    NOTE(review): assuming ``tf`` is TensorFlow, ``merge_all_summaries`` is
    the legacy (pre-1.0) spelling of ``tf.summary.merge_all`` -- confirm the
    TensorFlow version this file targets before upgrading.
    """
    # Counters start from zero.
    self.t = self.learning_step = 0

    # Three independent, initially empty lists (not one shared object).
    self.replay, self.losses, self.games = [], [], []

    # Fields for the current step; nothing has been observed yet.
    self.q_t = self.s_t = self.a_t = None
    self.r_t = 0
    self.s_t1 = self.q_t1 = None

    # All flags are off by default.
    self.terminal = self.test_mode = self.baseline = False

    # Enable logging: build the merged summary op once and share the same
    # object between both networks and this instance.
    merged = tf.merge_all_summaries()
    self.q_train.summaries = merged
    self.q_target.summaries = merged
    self.summaries = merged
# (Web-page residue, not part of the code: "Comment list" / "Article table of contents".)