|
|
|
|
|
|
all_value_tensors, |
|
|
|
all_baseline_tensors, |
|
|
|
all_next_value_mem, |
|
|
|
next_value_mem, |
|
|
|
next_value_mem, |
|
|
|
next_baseline_mem, |
|
|
|
) |
|
|
|
|
|
|
|
|
|
|
) |
|
|
|
|
|
|
|
next_value_estimates, _ = self.critic.critic_pass( |
|
|
|
all_next_obs, next_value_mem, sequence_length=batch.num_experiences |
|
|
|
all_next_obs, next_value_mem, sequence_length=1 |
|
|
|
) |
|
|
|
|
|
|
|
for name, estimate in baseline_estimates.items(): |
|
|
|