|
|
|
|
|
|
else: |
|
|
|
if self.policy.use_continuous_act: # For hybrid action buffer support |
|
|
|
feed_dict[self.policy.output] = mini_batch["continuous_action"] |
|
|
|
if self.policy.use_recurrent: |
|
|
|
feed_dict[self.policy.prev_action] = mini_batch[ |
|
|
|
"prev_continuous_action" |
|
|
|
] |
|
|
|
if self.policy.use_recurrent: |
|
|
|
feed_dict[self.policy.prev_action] = mini_batch["prev_action"] |
|
|
|
if self.policy.use_recurrent: |
|
|
|
feed_dict[self.policy.prev_action] = mini_batch[ |
|
|
|
"prev_discrete_action" |
|
|
|
] |
|
|
|
feed_dict[self.policy.action_masks] = mini_batch["action_mask"] |
|
|
|
if "vector_obs" in mini_batch: |
|
|
|
feed_dict[self.policy.vector_in] = mini_batch["vector_obs"] |
|
|
|