def q_network(observations):
    """Build the Q-value head as a single ``tf_layers.linear`` call.

    Forwards ``observations`` and the module-level ``env.actions`` to
    ``tf_layers.linear`` with ``biases_initializer=None`` and returns
    whatever that call produces.

    NOTE(review): presumably ``tf_layers`` is ``tf.contrib.layers``, so this
    would be a bias-free linear layer with one output per action -- confirm
    against the file's imports and the definition of ``env``.
    """
    # Resolve the layer factory first, then the output size, so attribute
    # lookups happen in the same order as a direct inline call would.
    linear_layer = tf_layers.linear
    num_outputs = env.actions
    return linear_layer(observations, num_outputs, biases_initializer=None)