|
|
|
|
|
|
|
|
|
|
with tf.variable_scope("value"): |
|
|
|
if policy.use_continuous_act: |
|
|
|
self._create_cc_critic(h_size, num_layers, vis_encode_type) |
|
|
|
self._create_cc_critic(h_size, hyperparameters.value_layers, vis_encode_type) |
|
|
|
self._create_dc_critic(h_size, num_layers, vis_encode_type) |
|
|
|
self._create_dc_critic(h_size, hyperparameters.value_layers, vis_encode_type) |
|
|
|
|
|
|
|
with tf.variable_scope("optimizer/"): |
|
|
|
self.learning_rate = ModelUtils.create_schedule( |
|
|
|