def policy_network(observations):
    """Build the policy head and return its output tensor.

    The observations are fed through one ``tf_layers.fully_connected``
    layer with a ReLU activation, and the result is passed to
    ``tf_layers.linear``.

    Relies on names defined outside this function: ``tf``, ``tf_layers``,
    ``args.hidden_layer`` and ``env.actions``.

    Args:
        observations: Input passed unchanged as the first argument of the
            fully connected layer (presumably a batch of observation
            tensors -- confirm against the caller).

    Returns:
        The result of the final ``tf_layers.linear`` call (the original code
        named it ``logits``).
    """
    # NOTE(review): the second positional argument of each layer call looks
    # like the number of output units (hidden width, then action count) --
    # confirm against the tf_layers API in use.
    relu_features = tf_layers.fully_connected(
        observations,
        args.hidden_layer,
        activation_fn=tf.nn.relu,
    )
    return tf_layers.linear(relu_features, env.actions)