def __init__(self, input_num, hidden_num, num_of_actions):
    """Store the layer sizes and register the network's linear links.

    The input width is split into a fixed 4-wide "agent state" part and
    a "market state" part that takes the remaining
    ``input_num - 4`` features.

    Args:
        input_num: Total number of input features; must be larger
            than 4 so the market-state part is non-empty.
        hidden_num: Width of the hidden layers.
        num_of_actions: Number of outputs of the final ``q_value`` link.

    Raises:
        AssertionError: If ``input_num - 4`` is not positive (only
            while assertions are enabled).
    """
    self.input_num = input_num
    self.hidden_num = hidden_num
    self.num_of_actions = num_of_actions

    # Fixed-size agent part; whatever is left belongs to the market part.
    self.agent_state_dim = 4
    self.market_state_dim = input_num - self.agent_state_dim
    assert self.market_state_dim > 0

    agent_width = 2  # output width shared by a1, a2 and a3
    hidden = self.hidden_num
    n_actions = self.num_of_actions

    # Links are created in the same order as they are registered below.
    agent_1 = L.Linear(self.agent_state_dim, agent_width)
    agent_2 = L.Linear(agent_width, agent_width)
    agent_3 = L.Linear(agent_width, agent_width)

    market_1 = L.Linear(self.market_state_dim, hidden)
    market_2 = L.Linear(hidden, hidden)
    market_3 = L.Linear(hidden, hidden)

    # Sized for hidden + 2 inputs -- presumably the joined outputs of the
    # two stacks above; the forward pass is not visible here (TODO confirm).
    merged_1 = L.Linear(hidden + agent_width, hidden)
    merged_2 = L.Linear(hidden, hidden)

    # The output link starts from an all-zero float32 weight matrix.
    zero_weights = np.zeros((n_actions, hidden), dtype=np.float32)
    q_out = L.Linear(hidden, n_actions, initialW=zero_weights)

    super(Q_DNN, self).__init__(
        a1=agent_1,
        a2=agent_2,
        a3=agent_3,
        s1=market_1,
        s2=market_2,
        s3=market_3,
        fc4=merged_1,
        fc5=merged_2,
        q_value=q_out,
    )
评论列表
文章目录