浏览代码
Merge branch 'develop-critic-optimizer' into develop-critic-op-lstm
/develop/critic-op-lstm-currentmem
Merge branch 'develop-critic-optimizer' into develop-critic-op-lstm
/develop/critic-op-lstm-currentmem
Ervin Teng
4 年前
当前提交
93a59971
共有 53 个文件被更改,包括 5162 次插入 和 115 次删除
-
3.github/workflows/pytest.yml
-
1Project/ProjectSettings/TagManager.asset
-
15com.unity.ml-agents/CHANGELOG.md
-
16com.unity.ml-agents/Editor/BehaviorParametersEditor.cs
-
6com.unity.ml-agents/Runtime/Academy.cs
-
4com.unity.ml-agents/Runtime/Agent.cs
-
15com.unity.ml-agents/Runtime/Communicator/GrpcExtensions.cs
-
5com.unity.ml-agents/Runtime/Communicator/UnityRLCapabilities.cs
-
40com.unity.ml-agents/Runtime/Grpc/CommunicatorObjects/Capabilities.cs
-
70com.unity.ml-agents/Runtime/Inference/BarracudaModelParamLoader.cs
-
6com.unity.ml-agents/Runtime/Inference/ModelRunner.cs
-
21com.unity.ml-agents/Runtime/Sensors/BufferSensor.cs
-
14com.unity.ml-agents/Runtime/Sensors/BufferSensorComponent.cs
-
17com.unity.ml-agents/Runtime/Sensors/CameraSensor.cs
-
2com.unity.ml-agents/Runtime/Sensors/IDimensionPropertiesSensor.cs
-
30com.unity.ml-agents/Tests/Editor/ParameterLoaderTest.cs
-
2docs/Installation.md
-
51docs/Learning-Environment-Design-Agents.md
-
27docs/Learning-Environment-Examples.md
-
2gym-unity/README.md
-
11ml-agents-envs/mlagents_envs/communicator_objects/capabilities_pb2.py
-
6ml-agents-envs/mlagents_envs/communicator_objects/capabilities_pb2.pyi
-
4ml-agents-envs/mlagents_envs/environment.py
-
16ml-agents-envs/mlagents_envs/rpc_utils.py
-
14ml-agents-envs/mlagents_envs/tests/test_rpc_utils.py
-
49ml-agents/mlagents/trainers/torch/attention.py
-
3protobuf-definitions/proto/mlagents_envs/communicator_objects/capabilities.proto
-
8Project/Assets/ML-Agents/Examples/Sorter.meta
-
105config/ppo/Sorter_curriculum.yaml
-
1001docs/images/sorter.png
-
8Project/Assets/ML-Agents/Examples/Sorter/Meshes.meta
-
63Project/Assets/ML-Agents/Examples/Sorter/Meshes/ArenaWalls.fbx
-
247Project/Assets/ML-Agents/Examples/Sorter/Meshes/ArenaWalls.fbx.meta
-
8Project/Assets/ML-Agents/Examples/Sorter/Prefabs.meta
-
8Project/Assets/ML-Agents/Examples/Sorter/Scenes.meta
-
8Project/Assets/ML-Agents/Examples/Sorter/Scripts.meta
-
8Project/Assets/ML-Agents/Examples/Sorter/TFModels.meta
-
15Project/Assets/ML-Agents/Examples/Sorter/TFModels/Sorter.onnx.meta
-
1001Project/Assets/ML-Agents/Examples/Sorter/TFModels/Sorter.onnx
-
7Project/Assets/ML-Agents/Examples/Sorter/Prefabs/Area.prefab.meta
-
1001Project/Assets/ML-Agents/Examples/Sorter/Prefabs/Area.prefab
-
11Project/Assets/ML-Agents/Examples/Sorter/Scripts/SorterAgent.cs.meta
-
11Project/Assets/ML-Agents/Examples/Sorter/Scripts/NumberTile.cs.meta
-
34Project/Assets/ML-Agents/Examples/Sorter/Scripts/NumberTile.cs
-
273Project/Assets/ML-Agents/Examples/Sorter/Scripts/SorterAgent.cs
-
9Project/Assets/ML-Agents/Examples/Sorter/Scenes/Sorter.unity.meta
-
1001Project/Assets/ML-Agents/Examples/Sorter/Scenes/Sorter.unity
|
|||
fileFormatVersion: 2 |
|||
guid: 5921b34611f764a849f03ecb648faaed |
|||
folderAsset: yes |
|||
DefaultImporter: |
|||
externalObjects: {} |
|||
userData: |
|||
assetBundleName: |
|||
assetBundleVariant: |
|
|||
behaviors: |
|||
Sorter: |
|||
trainer_type: ppo |
|||
hyperparameters: |
|||
batch_size: 512 |
|||
buffer_size: 40960 |
|||
learning_rate: 0.0003 |
|||
beta: 0.005 |
|||
epsilon: 0.2 |
|||
lambd: 0.95 |
|||
num_epoch: 3 |
|||
learning_rate_schedule: constant |
|||
network_settings: |
|||
normalize: False |
|||
hidden_units: 128 |
|||
num_layers: 2 |
|||
vis_encode_type: simple |
|||
reward_signals: |
|||
extrinsic: |
|||
gamma: 0.99 |
|||
strength: 1.0 |
|||
keep_checkpoints: 5 |
|||
max_steps: 5000000 |
|||
time_horizon: 256 |
|||
summary_freq: 10000 |
|||
threaded: true |
|||
environment_parameters: |
|||
num_tiles: |
|||
curriculum: |
|||
- name: Lesson0 # The '-' is important as this is a list |
|||
completion_criteria: |
|||
measure: progress |
|||
behavior: Sorter |
|||
signal_smoothing: true |
|||
min_lesson_length: 100 |
|||
threshold: 0.3 |
|||
value: 2.0 |
|||
- name: Lesson1 |
|||
completion_criteria: |
|||
measure: progress |
|||
behavior: Sorter |
|||
signal_smoothing: true |
|||
min_lesson_length: 100 |
|||
threshold: 0.4 |
|||
value: 4.0 |
|||
- name: Lesson2 |
|||
completion_criteria: |
|||
measure: progress |
|||
behavior: Sorter |
|||
signal_smoothing: true |
|||
min_lesson_length: 100 |
|||
threshold: 0.45 |
|||
value: 6.0 |
|||
- name: Lesson3 |
|||
completion_criteria: |
|||
measure: progress |
|||
behavior: Sorter |
|||
signal_smoothing: true |
|||
min_lesson_length: 100 |
|||
threshold: 0.5 |
|||
value: 8.0 |
|||
- name: Lesson4 |
|||
completion_criteria: |
|||
measure: progress |
|||
behavior: Sorter |
|||
signal_smoothing: true |
|||
min_lesson_length: 100 |
|||
threshold: 0.55 |
|||
value: 10.0 |
|||
- name: Lesson5 |
|||
completion_criteria: |
|||
measure: progress |
|||
behavior: Sorter |
|||
signal_smoothing: true |
|||
min_lesson_length: 100 |
|||
threshold: 0.6 |
|||
value: 12.0 |
|||
- name: Lesson6 |
|||
completion_criteria: |
|||
measure: progress |
|||
behavior: Sorter |
|||
signal_smoothing: true |
|||
min_lesson_length: 100 |
|||
threshold: 0.65 |
|||
value: 14.0 |
|||
- name: Lesson7 |
|||
completion_criteria: |
|||
measure: progress |
|||
behavior: Sorter |
|||
signal_smoothing: true |
|||
min_lesson_length: 100 |
|||
threshold: 0.7 |
|||
value: 16.0 |
|||
- name: Lesson8 |
|||
completion_criteria: |
|||
measure: progress |
|||
behavior: Sorter |
|||
signal_smoothing: true |
|||
min_lesson_length: 100 |
|||
threshold: 0.75 |
|||
value: 18.0 |
|||
- name: Lesson9 |
|||
value: 20.0 |
|||
env_settings: |
|||
num_envs: 8 |
1001
docs/images/sorter.png
文件差异内容过多而无法显示
查看文件
文件差异内容过多而无法显示
查看文件
|
|||
fileFormatVersion: 2 |
|||
guid: 21f2df9a3b371479883c5f6a9c1f5314 |
|||
folderAsset: yes |
|||
DefaultImporter: |
|||
externalObjects: {} |
|||
userData: |
|||
assetBundleName: |
|||
assetBundleVariant: |
|
|||
Kaydara FBX Binary � M FBXHeaderExtension\ FBXHeaderVersionI� x |
|||
FBXVersionI� � EncryptionTypeI � CreationTimeStamp� VersionI� � YearI� � MonthI DayI ' HourI ? MinuteI W SecondI t MillisecondI5 � . CreatorS) Blender (stable FBX IO) - 2.91.0 - 4.21.3@ ' |