def __init__(self, input_num, hidden_num, num_of_actions):
    """Create the network's layers and register them with the parent class.

    Five ``Linear`` + ``BatchNormalization`` stages (``fc1``/``bn1`` through
    ``fc5``/``bn5``) are followed by a ``q_value`` ``Linear`` layer whose
    weight matrix starts out as all zeros.

    Args:
        input_num: Input size of the first linear layer (``fc1``).
        hidden_num: Size shared by every hidden linear layer and every
            batch-normalization layer.
        num_of_actions: Output size of the ``q_value`` layer.
    """
    # Keep the layer sizes available on the instance.
    self.input_num = input_num
    self.hidden_num = hidden_num
    self.num_of_actions = num_of_actions

    # Explicit float32 zero matrix of shape (num_of_actions, hidden_num),
    # used as the initial weights of the output layer.
    zero_weights = np.zeros((num_of_actions, hidden_num), dtype=np.float32)

    # NOTE(review): ``L`` is presumably ``chainer.links`` -- confirm against
    # the file's imports. Layers are handed to the parent constructor as
    # keyword arguments, so each keyword becomes the layer's name.
    super(Q_DNN, self).__init__(
        fc1=L.Linear(input_num, hidden_num),
        bn1=L.BatchNormalization(hidden_num),
        fc2=L.Linear(hidden_num, hidden_num),
        bn2=L.BatchNormalization(hidden_num),
        fc3=L.Linear(hidden_num, hidden_num),
        bn3=L.BatchNormalization(hidden_num),
        fc4=L.Linear(hidden_num, hidden_num),
        bn4=L.BatchNormalization(hidden_num),
        fc5=L.Linear(hidden_num, hidden_num),
        bn5=L.BatchNormalization(hidden_num),
        q_value=L.Linear(hidden_num, num_of_actions, initialW=zero_weights),
    )
评论列表
文章目录