Fix policy's scoping

5 年前 · 1f094da9
--- a/ml-agents/mlagents/trainers/common/nn_policy.py
+++ b/ml-agents/mlagents/trainers/common/nn_policy.py
        """
        Builds the tensorflow graph needed for this policy.
        """
-        with tf.variable_scope("policy/"):
-            self.create_input_placeholders()
-            with self.graph.as_default():
+        with self.graph.as_default():
+            with tf.variable_scope("policy"):
+                self.create_input_placeholders()
                if self.use_continuous_act:
                    self.create_cc_actor(
                        self.h_size,
            h_size,
            num_layers,
            vis_encode_type,
-            stream_scopes=["policy/"],
        )[0]

        if self.use_recurrent:
            hidden_policy,
            self.act_size[0],
            activation=None,
+            name="mu",
            kernel_initializer=LearningModel.scaled_init(0.01),
            reuse=tf.AUTO_REUSE,
        )
            h_size,
            num_layers,
            vis_encode_type,
-            stream_scopes=["policy/"],
        )[0]

        if self.use_recurrent: