浏览代码

Merge pull request #4990 from Unity-Technologies/goal-conditioning-new-vince

Tried to make improvements to the initialization of the hyperNetwork weights
/goal-conditioning/new
GitHub 4 年前
当前提交
ca8a4ae2
共有 2 个文件被更改,包括 17 次插入15 次删除
  1. 30
      ml-agents/mlagents/trainers/torch/layers.py
  2. 2
      ml-agents/mlagents/trainers/torch/networks.py

30
ml-agents/mlagents/trainers/torch/layers.py


from mlagents.torch_utils import torch
import abc
import math
from typing import Tuple
from enum import Enum

layer_in_size = layer_size
flat_output = linear_layer(
layer_size,
input_size * output_size + output_size,
input_size * output_size,
self.hypernet = torch.nn.Sequential(*layers, flat_output)
# Re-initializing the weights of the last layer of the hypernetwork
bound = math.sqrt(1 / (layer_size * self.input_size))
flat_output.weight.data.uniform_(-bound, bound)
self.hypernet = torch.nn.Sequential(*layers, LayerNorm(), flat_output)
# The hypernetwork will not generate the bias of the main network layer
self.bias = torch.nn.Parameter(torch.zeros(output_size))
flat_output_weights = self.hypernet(hyper_input)
batch_size = input_activation.size(0)
output_weights = self.hypernet(hyper_input)
output_weights, output_bias = torch.split(
flat_output_weights, self.input_size * self.output_size, dim=-1
)
output_weights = output_weights.view(
batch_size, self.input_size, self.output_size
)
output_bias = output_bias.view(batch_size, self.output_size)
output = (
output_weights = output_weights.view(-1, self.input_size, self.output_size)
return (
+ output_bias
+ self.bias
return output

2
ml-agents/mlagents/trainers/torch/networks.py


self.obs_types[idx] == ObservationType.GOAL
and self.conditioning_type != ConditioningType.DEFAULT
):
if goal_signal is not None:
raise Exception("TODO : Cannot currently handle more than one goal")
goal_signal = processed_obs
if len(encodes) == 0:

正在加载...
取消
保存