def __initialize_DDQN(self):
    """Build the main and target Q-networks and start a fresh session.

    Steps, in order:

    1. Close any session left on ``self.sess`` by an earlier call.
    2. Reset the default TensorFlow graph.
    3. Construct ``self.mainDQN`` and ``self.targetDQN`` as two
       ``Qnetwork`` instances with identical arguments.
    4. Create the global variable initializer, record the trainable
       variables in ``self.trainables`` and the result of
       ``self.__update_target_graph()`` in ``self.targetOps``.
    5. Open a new ``tf.Session``, run the initializer, and call
       ``self.__update_target()``.

    The stale-session cleanup matters when this method runs more than
    once on the same object: TensorFlow documents resetting the default
    graph while a session is active as undefined behavior, and the old
    session would otherwise be leaked when ``self.sess`` is rebound.
    """
    # Release a session from a previous initialization, if there is one.
    stale_session = getattr(self, "sess", None)
    if stale_session is not None:
        stale_session.close()
        self.sess = None

    tf.reset_default_graph()

    # Both networks share exactly the same configuration.
    network_kwargs = {
        "clip": self.grad_clip,
        "activation_fn": tf.nn.relu,
        "hidden_layer_sizes": self.ddqn_hidden_layer_sizes,
    }
    self.mainDQN = Qnetwork(self.num_dims, self.num_actions, **network_kwargs)
    self.targetDQN = Qnetwork(self.num_dims, self.num_actions, **network_kwargs)

    # The initializer op is created right after the networks are built,
    # before the target-update ops are added to the graph.
    init = tf.global_variables_initializer()

    # NOTE(review): presumably __update_target_graph reads self.trainables,
    # so it must be assigned first -- confirm against that method.
    self.trainables = tf.trainable_variables()
    self.targetOps = self.__update_target_graph()

    self.sess = tf.Session()
    self.sess.run(init)

    # NOTE(review): presumably runs self.targetOps to sync the target
    # network with the main network -- confirm against __update_target.
    self.__update_target()
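# Comment list  (web-page navigation residue, not part of the code)
# Table of contents  (web-page navigation residue, not part of the code)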