diff --git a/.gitattributes b/.gitattributes index e32645fa4eda9e8cc5fbb6ce24c3cb806271be82..59055dbb3b9f53f4337012ebab41dcc957237a8f 100644 --- a/.gitattributes +++ b/.gitattributes @@ -49,10 +49,13 @@ com.unity.ml-agents/Tests/Editor/TestModels/hybrid0vis53vec_3c_2daction_v1_0.onn com.unity.ml-agents/Tests/Editor/TestModels/hybrid0vis8vec_2c_2_3d_v2_0.onnx filter=lfs diff=lfs merge=lfs -text docs/images/image-banner.png filter=lfs diff=lfs merge=lfs -text localized_docs/KR/docs/images/image-banner.png filter=lfs diff=lfs merge=lfs -text -results/Pyramids[[:space:]]Training/Pyramids/Pyramids-100064.onnx filter=lfs diff=lfs merge=lfs -text -results/Pyramids[[:space:]]Training/Pyramids/Pyramids-100064.pt filter=lfs diff=lfs merge=lfs -text +results/Pyramids[[:space:]]Training/Pyramids/Pyramids-1000115.onnx filter=lfs diff=lfs merge=lfs -text +results/Pyramids[[:space:]]Training/Pyramids/Pyramids-1000115.pt filter=lfs diff=lfs merge=lfs -text +results/Pyramids[[:space:]]Training/Pyramids/Pyramids-499967.onnx filter=lfs diff=lfs merge=lfs -text +results/Pyramids[[:space:]]Training/Pyramids/Pyramids-499967.pt filter=lfs diff=lfs merge=lfs -text +results/Pyramids[[:space:]]Training/Pyramids/Pyramids-999987.onnx filter=lfs diff=lfs merge=lfs -text +results/Pyramids[[:space:]]Training/Pyramids/Pyramids-999987.pt filter=lfs diff=lfs merge=lfs -text results/Pyramids[[:space:]]Training/Pyramids/checkpoint.pt filter=lfs diff=lfs merge=lfs -text -results/Pyramids[[:space:]]Training/Pyramids/events.out.tfevents.1692804545.f1fcbdb9d0a8.1697.0 filter=lfs diff=lfs merge=lfs -text results/Pyramids[[:space:]]Training/Pyramids.onnx filter=lfs diff=lfs merge=lfs -text training-envs-executables/linux/Pyramids/Pyramids_Data/Managed/System.Core.dll filter=lfs diff=lfs merge=lfs -text training-envs-executables/linux/Pyramids/Pyramids_Data/Managed/System.Data.dll filter=lfs diff=lfs merge=lfs -text diff --git a/config.json b/config.json index 412634e4c38e3f06dc7a230670f0d6445be25aa9..ef4208efa65b3f46532d0206e3d488d77e033ac7 100644 --- a/config.json +++ b/config.json @@ -1 +1 @@ -{"behaviors": {"Pyramids": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.01, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "linear"}, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple"}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0}, "rnd": {"gamma": 0.99, "strength": 0.01, "network_settings": {"hidden_units": 64, "num_layers": 3}, "learning_rate": 0.0001}}, "keep_checkpoints": 5, "max_steps": 100000, "time_horizon": 128, "summary_freq": 30000}}} \ No newline at end of file +{"behaviors": {"Pyramids": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.01, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "linear"}, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple"}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0}, "rnd": {"gamma": 0.99, "strength": 0.01, "network_settings": {"hidden_units": 64, "num_layers": 3}, "learning_rate": 0.0001}}, "keep_checkpoints": 5, "max_steps": 1000000, "time_horizon": 128, "summary_freq": 30000}}} \ No newline at end of file diff --git a/config/ppo/PyramidsRND.yaml b/config/ppo/PyramidsRND.yaml index 622413ac6534d7786e0d899b9a47b361949d75d8..cff3bc25a6adad89a250d52fdf404dc23d2cdd96 100644 --- a/config/ppo/PyramidsRND.yaml +++ b/config/ppo/PyramidsRND.yaml @@ -27,6 +27,6 @@ behaviors: num_layers: 3 learning_rate: 0.0001 keep_checkpoints: 5 - max_steps: 100000 + max_steps: 1000000 time_horizon: 128 summary_freq: 30000 diff --git a/configuration.yaml b/configuration.yaml index 622413ac6534d7786e0d899b9a47b361949d75d8..cff3bc25a6adad89a250d52fdf404dc23d2cdd96 100644 --- a/configuration.yaml +++ b/configuration.yaml @@ -27,6 +27,6 @@ behaviors: num_layers: 3 learning_rate: 0.0001 keep_checkpoints: 5 - max_steps: 100000 + max_steps: 1000000 time_horizon: 128 summary_freq: 30000 diff --git a/ml-agents-envs/mlagents_envs/__pycache__/__init__.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/__init__.cpython-310.pyc index 022673589283339c2b556b630373c8ef87a1e8c2..f1d315dcfdd639d36cb2e8511fd4f0c96c4cb5ef 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/__init__.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/__pycache__/base_env.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/base_env.cpython-310.pyc index faa6bb12e444daad76bbf20174716e2315f1d50f..1005899b1c925f1bf7e6aeb688494d0f220d1b0a 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/base_env.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/base_env.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/__pycache__/communicator.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/communicator.cpython-310.pyc index 3f1c04cb989e06e108cb2ce1f14236bac4ecadea..706fd462b58af6f7938ac503439b09affc0c0e64 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/communicator.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/communicator.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/__pycache__/env_utils.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/env_utils.cpython-310.pyc index f2fb345fe0e6e331210bba12b4b38bc40f49d350..c210ed47768088d5bcfcf5a86de43b85748c6800 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/env_utils.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/env_utils.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/__pycache__/environment.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/environment.cpython-310.pyc index dd393c6aaee9fd925b55eac72418821fbee5afaa..1a55716bf373cd4625a4b8f2de389470160ceaf7 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/environment.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/environment.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/__pycache__/exception.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/exception.cpython-310.pyc index 13049f54abdf02bb60f2900438554bcae6937a25..c16e7de96d1eb5d0f359544b1201dc8ee15cd9d5 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/exception.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/exception.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/__pycache__/logging_util.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/logging_util.cpython-310.pyc index 985b08e684489a9ec23cc5f42a21247783adc8c3..2ccaf75b6ef741cf21dec79351eb40fd686a50c7 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/logging_util.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/logging_util.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/__pycache__/rpc_communicator.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/rpc_communicator.cpython-310.pyc index 42d27730d49e918c1b01308d5d56d5e04c740bcc..aa96f781f1cfd29ee79701995455d857b1c39c09 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/rpc_communicator.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/rpc_communicator.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/__pycache__/rpc_utils.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/rpc_utils.cpython-310.pyc index 86a97987381376f078c69a120bd29756dbd624db..fcc8bdf766003363fa96cccfe53bf100a0658a23 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/rpc_utils.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/rpc_utils.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/__pycache__/timers.cpython-310.pyc b/ml-agents-envs/mlagents_envs/__pycache__/timers.cpython-310.pyc index b8c44803c7829bc55cff718099d58f5f73906efd..c0f2b962e72a797e2fa0e1abae2309b48f585dd0 100644 Binary files a/ml-agents-envs/mlagents_envs/__pycache__/timers.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/__pycache__/timers.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/__init__.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/__init__.cpython-310.pyc index b4601d313a5c6996cd0904e38deac4b79706bd7f..1f7fbe404a17d95e0cfad1f65cd5a542b3c11526 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/__init__.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_action_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_action_pb2.cpython-310.pyc index a2638b216bbe4b8929dd48487379c019bf0df823..ee8827e91f54638a650b8272f9b3f8edd35f6827 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_action_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_action_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_info_action_pair_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_info_action_pair_pb2.cpython-310.pyc index c1087c5ce8501395073f81da815e5e490143b5e0..4e57aadbc59ac69683025a603b57c90358a25175 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_info_action_pair_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_info_action_pair_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_info_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_info_pb2.cpython-310.pyc index 090dc43fd74fb8b7945ad994c0f327352c885fc8..7cb264e67b3c5d161d42aa88e0701d4f34b28bf9 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_info_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/agent_info_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/brain_parameters_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/brain_parameters_pb2.cpython-310.pyc index f0469e65f0b33216b990e4b8f7af0470b347af79..c4cdad692290223b8d72806d9c6219e1c1e2f0ed 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/brain_parameters_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/brain_parameters_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/capabilities_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/capabilities_pb2.cpython-310.pyc index dc4f70af0de23534d8f7377f44267a7b8012ded5..81fd204a7c829ccc9c23b10db3eb153ed7efc2a9 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/capabilities_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/capabilities_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/command_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/command_pb2.cpython-310.pyc index 036e99f1bb5899c6b699f03a1b36fd5207135044..a7890b4b3bf3464c25a5d3bdc83ca7999f91c65d 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/command_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/command_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/demonstration_meta_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/demonstration_meta_pb2.cpython-310.pyc index 23ec801213c5ec6f0c9543b289860553fc31e959..5dc3cdad28894d7cc4ccdfa53e7bc46028284bce 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/demonstration_meta_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/demonstration_meta_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/header_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/header_pb2.cpython-310.pyc index 55c1d53e85c22902f7a919081ad0c107ebf8d8aa..fcc45932362483fe68671b1f73d3d1a91facf396 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/header_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/header_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/observation_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/observation_pb2.cpython-310.pyc index 0d8021d35cbfa20b4c57b7954e5f6f5d0cbba933..cd3449a7b021e47eb0457bec79016f1f498c48eb 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/observation_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/observation_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/space_type_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/space_type_pb2.cpython-310.pyc index f6e1ed41ef219d245fb7d97dfdd024210f9b0ed9..8faa5a631135612f2fa6827cca4907ac027adda0 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/space_type_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/space_type_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/training_analytics_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/training_analytics_pb2.cpython-310.pyc index 8c75a132dff295c916ea37e15a653f7b14d9cff6..d05e39c3da09ba2dd0c634da8f3110f0591a877b 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/training_analytics_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/training_analytics_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_input_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_input_pb2.cpython-310.pyc index a1e263395180168349ea83cff75ee18e6005b7ad..e217a1411a1a6d61927097bcfc8abe44f35803b2 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_input_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_input_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_message_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_message_pb2.cpython-310.pyc index 41d952a1c6b0f3a98a14bfb58e35a65b31a28e0c..bb8c26e0f7a292e7dc2d48ed0b8f6956a6c4d6af 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_message_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_message_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_output_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_output_pb2.cpython-310.pyc index 123d1f3ce6f40cd9edef8eaddc6cb8cbd92356b3..64aea95b3a5d6cdd4534153edc9fa4f95f9102e3 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_output_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_output_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_initialization_input_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_initialization_input_pb2.cpython-310.pyc index b93a9ac922941fb81c10f8ec7228ce9a14d9378b..9bcf4c0e1c9029ede62f9d0335a1df537de321dd 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_initialization_input_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_initialization_input_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_initialization_output_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_initialization_output_pb2.cpython-310.pyc index cb90113375256a44933888b97fd0c5ded1a500ad..496c6ab6454aa2af7ee85789a3bfdf5aa589b6a2 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_initialization_output_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_initialization_output_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_input_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_input_pb2.cpython-310.pyc index 2edba242b8a6adb96445f4007df832ee02c7872d..eb29343ece86684636da2321678661cb104c7cd3 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_input_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_input_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_output_pb2.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_output_pb2.cpython-310.pyc index abd5fafaafb6997ad653c31f7e025050f8b64ccd..4d5b3751e024bc845025773c53fdf0057cb5ab6d 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_output_pb2.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_rl_output_pb2.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_to_external_pb2_grpc.cpython-310.pyc b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_to_external_pb2_grpc.cpython-310.pyc index 705fbf8b967eb9768913d1f1dbb852cb276a0d5f..1c690144d9e60f25bda79c369c91d95dbdcc81c0 100644 Binary files a/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_to_external_pb2_grpc.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/communicator_objects/__pycache__/unity_to_external_pb2_grpc.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/__init__.cpython-310.pyc b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/__init__.cpython-310.pyc index 769cf7cd71478dfa0051df1137ec6e8dd51269e1..8a377c4ced89f2b26db78fdf1eee095f7b9c79a7 100644 Binary files a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/__init__.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/default_training_analytics_side_channel.cpython-310.pyc b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/default_training_analytics_side_channel.cpython-310.pyc index 1a5db831e9409cd660a3491102ef3c90fae7d628..257cae1b6c55c7e8f6f0e09b21ee8176a138734c 100644 Binary files a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/default_training_analytics_side_channel.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/default_training_analytics_side_channel.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/engine_configuration_channel.cpython-310.pyc b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/engine_configuration_channel.cpython-310.pyc index b3542471c3a00d61b7200259a7950bdcb9fcaaa4..1974aae2d302e2562b68e91c2f5ea3c15abeae57 100644 Binary files a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/engine_configuration_channel.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/engine_configuration_channel.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/environment_parameters_channel.cpython-310.pyc b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/environment_parameters_channel.cpython-310.pyc index f60eb874be7bf6721f1f8f5b9903fc822831e4fb..033e715ea647bcbd62c50ca2eda3cc49fbb220c2 100644 Binary files a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/environment_parameters_channel.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/environment_parameters_channel.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/incoming_message.cpython-310.pyc b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/incoming_message.cpython-310.pyc index b7506d6dbc4f446c88f82522a7216f5adea94a97..4c19d824fd429b6794d0e51f145a313506c81a70 100644 Binary files a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/incoming_message.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/incoming_message.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/outgoing_message.cpython-310.pyc b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/outgoing_message.cpython-310.pyc index a11ae160b26be5b7ba527778f531deaea4cb6e85..8995b9adcb8c86c8f6820fefea241d9ab9cfda2f 100644 Binary files a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/outgoing_message.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/outgoing_message.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/side_channel.cpython-310.pyc b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/side_channel.cpython-310.pyc index 2cd66bc5ded1487e0a6ce2834011e27ab70b02a0..28dd3a0a27cee7bb1624a400cf70d4043d026836 100644 Binary files a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/side_channel.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/side_channel.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/side_channel_manager.cpython-310.pyc b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/side_channel_manager.cpython-310.pyc index 1405e19a2a596d8080d7647dfa7494122adf6a2a..f590a107bed8935dbfc5eda2a6f4c01a59ca01f1 100644 Binary files a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/side_channel_manager.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/side_channel_manager.cpython-310.pyc differ diff --git a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/stats_side_channel.cpython-310.pyc b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/stats_side_channel.cpython-310.pyc index d0d51f731267044a764d826c8b88c4439843760e..5709baed51d6cfe1419f9c49b04877b27da580d3 100644 Binary files a/ml-agents-envs/mlagents_envs/side_channel/__pycache__/stats_side_channel.cpython-310.pyc and b/ml-agents-envs/mlagents_envs/side_channel/__pycache__/stats_side_channel.cpython-310.pyc differ diff --git a/ml-agents/mlagents/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/__pycache__/__init__.cpython-310.pyc index 03793193ba77ae449326da5b07bbf86542ee33c5..111cb6b25ec834e79f0ea1111edfe7c9f025827c 100644 Binary files a/ml-agents/mlagents/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/plugins/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/plugins/__pycache__/__init__.cpython-310.pyc index 4fe62ca497ba24d7b8f73e435f80d24538075522..80582c71beb4a629a5922c8b07a39e009a39ec77 100644 Binary files a/ml-agents/mlagents/plugins/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/plugins/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/plugins/__pycache__/stats_writer.cpython-310.pyc b/ml-agents/mlagents/plugins/__pycache__/stats_writer.cpython-310.pyc index 221afbc45d14de242dd82ac7001278a27cbf7a73..06fb5e3c21734b86471eafe0ccd8efc09e160fc2 100644 Binary files a/ml-agents/mlagents/plugins/__pycache__/stats_writer.cpython-310.pyc and b/ml-agents/mlagents/plugins/__pycache__/stats_writer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/plugins/__pycache__/trainer_type.cpython-310.pyc b/ml-agents/mlagents/plugins/__pycache__/trainer_type.cpython-310.pyc index f3e97f669eb1ad1ae1ba0e53bdbe279d270aff4e..9be93ba197117a88cec541086f171dfddb262b04 100644 Binary files a/ml-agents/mlagents/plugins/__pycache__/trainer_type.cpython-310.pyc and b/ml-agents/mlagents/plugins/__pycache__/trainer_type.cpython-310.pyc differ diff --git a/ml-agents/mlagents/torch_utils/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/torch_utils/__pycache__/__init__.cpython-310.pyc index 99df1ef35b12880de2f7e471f993f1ce60390a12..389928b74607be0109b3bcfa7d2623344dd34e8e 100644 Binary files a/ml-agents/mlagents/torch_utils/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/torch_utils/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/torch_utils/__pycache__/cpu_utils.cpython-310.pyc b/ml-agents/mlagents/torch_utils/__pycache__/cpu_utils.cpython-310.pyc index be5700c390a5bd43647a2c150115b753fe7b029f..b2375339b71d76a64819ca0bf97c6fa2e8bd04ae 100644 Binary files a/ml-agents/mlagents/torch_utils/__pycache__/cpu_utils.cpython-310.pyc and b/ml-agents/mlagents/torch_utils/__pycache__/cpu_utils.cpython-310.pyc differ diff --git a/ml-agents/mlagents/torch_utils/__pycache__/globals.cpython-310.pyc b/ml-agents/mlagents/torch_utils/__pycache__/globals.cpython-310.pyc index aa830557489425ec9ce403f9afd2cdddc6aed948..9a762264296967a56cf17c06d157749000a6bda1 100644 Binary files a/ml-agents/mlagents/torch_utils/__pycache__/globals.cpython-310.pyc and b/ml-agents/mlagents/torch_utils/__pycache__/globals.cpython-310.pyc differ diff --git a/ml-agents/mlagents/torch_utils/__pycache__/torch.cpython-310.pyc b/ml-agents/mlagents/torch_utils/__pycache__/torch.cpython-310.pyc index 928695ac289a80d15299f0c0b6fe4f51c6a6b35b..9801d90153f486dc38ce00544ab03b189fba094e 100644 Binary files a/ml-agents/mlagents/torch_utils/__pycache__/torch.cpython-310.pyc and b/ml-agents/mlagents/torch_utils/__pycache__/torch.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/__init__.cpython-310.pyc index 39109a11ad3d9d07eca50ef03afc01065904d0cd..074575d10eec8aef226c53cdb79678539647f9f3 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/action_info.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/action_info.cpython-310.pyc index 284a8b6474db913b34387ef0bc7ea3b6a9f991f7..619f795ee4210cb8069be1309a8fde5932d4a0ec 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/action_info.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/action_info.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/agent_processor.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/agent_processor.cpython-310.pyc index a474f198a40ea5b0e1cf0f3ceb782646739a4324..a79ca40de0009cbe30d259d291dae71f6cad9de9 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/agent_processor.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/agent_processor.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/behavior_id_utils.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/behavior_id_utils.cpython-310.pyc index b03d08d925640a72c6a13b780e519bf5edf4607a..7a7f46c9fe6a9096aba6dfeeda776427184ec7ae 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/behavior_id_utils.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/behavior_id_utils.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/buffer.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/buffer.cpython-310.pyc index 40c8cf6b81a0904269275625e415fe472559f5ad..9ae63c706b4fd4a0bcac5e3a037396ecde208662 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/buffer.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/buffer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/cli_utils.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/cli_utils.cpython-310.pyc index eff85d382c20683795bd512b3c60ec3356c40ba2..94e56a325435141947e1cac5d3b53c081f1ede48 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/cli_utils.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/cli_utils.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/demo_loader.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/demo_loader.cpython-310.pyc index ef14cce1b7218e9fa57ada94bfef05d4f08bb125..e131ae1e8dbc347dead9dcb60e0488b9f19dca23 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/demo_loader.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/demo_loader.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/directory_utils.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/directory_utils.cpython-310.pyc index b2e97561f35860528800aedbf8e5f9c6fa073b62..fc3108ae1abaff3f13e25161ae8ad943a71fe521 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/directory_utils.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/directory_utils.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/env_manager.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/env_manager.cpython-310.pyc index 234f4e31fb6a86353820ace4cda9f80bc698820d..87214e6154926bac1b23c9fdf67efc8afa6c1e7b 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/env_manager.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/env_manager.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/environment_parameter_manager.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/environment_parameter_manager.cpython-310.pyc index ab5f04074e23178b8d66e967dc312375d6c99bd3..3e4124d135af2019e8a66252a3b7e627330eb52d 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/environment_parameter_manager.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/environment_parameter_manager.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/exception.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/exception.cpython-310.pyc index 030f45bf9b659ebc236ea210a92ae98fa8f75382..8facacdbc4cb9fd92b98201314b80216bea91f4c 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/exception.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/exception.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/learn.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/learn.cpython-310.pyc index 737f8d34c7535905f14f8dcbb0511e7f66b30bdf..65db2d8291572921d73efa0d376db3f285d7761a 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/learn.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/learn.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/settings.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/settings.cpython-310.pyc index d3985cc770ec7df85458bbc653f00c98cc2568a5..46623ecafaf39f6a972a9d918ba41501dddbd80c 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/settings.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/settings.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/stats.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/stats.cpython-310.pyc index 892d8094ce716f85135f20463e8ab1081f53dde4..38b12af11e7425e50611e46c14ae5af4c46b6723 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/stats.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/stats.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/subprocess_env_manager.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/subprocess_env_manager.cpython-310.pyc index 8e66bbf64a2ac9f9f8312181e6ab03f9a7fb0428..77ac2666e82a608595fce4836e1d7c97c627645f 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/subprocess_env_manager.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/subprocess_env_manager.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/trainer_controller.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/trainer_controller.cpython-310.pyc index 506e5714fe17e116ccfed358032c0624ed094d8b..9933943cd45c7a2ce59a7f10b32f73dcfdb0cced 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/trainer_controller.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/trainer_controller.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/training_analytics_side_channel.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/training_analytics_side_channel.cpython-310.pyc index 4d7e1b614447f14f7517e50f27688e3231d8e441..af941fd9680b21b7bc9d269a8d5c658c56abb246 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/training_analytics_side_channel.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/training_analytics_side_channel.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/training_status.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/training_status.cpython-310.pyc index f18d03c7796d58f19ff4fd21515abc17db0d94c5..e0a51ba4797d7788e6341aadbf6fc38a7913fa16 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/training_status.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/training_status.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/__pycache__/trajectory.cpython-310.pyc b/ml-agents/mlagents/trainers/__pycache__/trajectory.cpython-310.pyc index e497c80c5166b353f42c46fd8d635498af1ca8d5..d5e7d73c87848233d5a232a17253a5f1b457cb4e 100644 Binary files a/ml-agents/mlagents/trainers/__pycache__/trajectory.cpython-310.pyc and b/ml-agents/mlagents/trainers/__pycache__/trajectory.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/ghost/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/ghost/__pycache__/__init__.cpython-310.pyc index 993986534feb1a2715edd8995ed4d4f6da24ebe7..3510c5fb7a1bd8eb3928b6d11571acfb888e8215 100644 Binary files a/ml-agents/mlagents/trainers/ghost/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/ghost/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/ghost/__pycache__/controller.cpython-310.pyc b/ml-agents/mlagents/trainers/ghost/__pycache__/controller.cpython-310.pyc index 1c43830e6c7feb23cd89e0e32aa850c6f44d3320..d84240d9929cb875415edee22df1167203ac5c67 100644 Binary files a/ml-agents/mlagents/trainers/ghost/__pycache__/controller.cpython-310.pyc and b/ml-agents/mlagents/trainers/ghost/__pycache__/controller.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/ghost/__pycache__/trainer.cpython-310.pyc b/ml-agents/mlagents/trainers/ghost/__pycache__/trainer.cpython-310.pyc index 5edf64d5acff990ebf56595ea7cc0fbda96fcbf1..c0355fbdf698ce56aca4270afd3943371859a980 100644 Binary files a/ml-agents/mlagents/trainers/ghost/__pycache__/trainer.cpython-310.pyc and b/ml-agents/mlagents/trainers/ghost/__pycache__/trainer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/model_saver/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/model_saver/__pycache__/__init__.cpython-310.pyc index bf81b4fe13d2423dffe1cf6977c805bc840c8455..10f21d74be5c0261f33fac180ed7b3f651134d22 100644 Binary files a/ml-agents/mlagents/trainers/model_saver/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/model_saver/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/model_saver/__pycache__/model_saver.cpython-310.pyc b/ml-agents/mlagents/trainers/model_saver/__pycache__/model_saver.cpython-310.pyc index 6ae4fc8f62e4c416960ee1153545b2b7220103e6..c7b3fd8ccda9608ee30b697a8ffc18ac248891e3 100644 Binary files a/ml-agents/mlagents/trainers/model_saver/__pycache__/model_saver.cpython-310.pyc and b/ml-agents/mlagents/trainers/model_saver/__pycache__/model_saver.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/model_saver/__pycache__/torch_model_saver.cpython-310.pyc b/ml-agents/mlagents/trainers/model_saver/__pycache__/torch_model_saver.cpython-310.pyc index 960f436e215d29cbb5495a6035261e2b10308611..2afbb33f93058d1804118ca20e4ef67c37527ad3 100644 Binary files a/ml-agents/mlagents/trainers/model_saver/__pycache__/torch_model_saver.cpython-310.pyc and b/ml-agents/mlagents/trainers/model_saver/__pycache__/torch_model_saver.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/optimizer/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/optimizer/__pycache__/__init__.cpython-310.pyc index ed813048fa6eaedf31bd202ffd72c37c70f76cf9..cad6b88f8f1bf30ac140c167874488512d8b0307 100644 Binary files a/ml-agents/mlagents/trainers/optimizer/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/optimizer/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/optimizer/__pycache__/optimizer.cpython-310.pyc b/ml-agents/mlagents/trainers/optimizer/__pycache__/optimizer.cpython-310.pyc index bd7e15fc0037cfbe0843df1c15d94b0381352638..1923bac70cee50c95ad1b7301b3d6fe4e04fad22 100644 Binary files a/ml-agents/mlagents/trainers/optimizer/__pycache__/optimizer.cpython-310.pyc and b/ml-agents/mlagents/trainers/optimizer/__pycache__/optimizer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/optimizer/__pycache__/torch_optimizer.cpython-310.pyc b/ml-agents/mlagents/trainers/optimizer/__pycache__/torch_optimizer.cpython-310.pyc index 81e631f2150d08587d154fbb21c76d4c176b8737..a8f7a38e9f9ed980fb55fb0808914eec96ddcc7d 100644 Binary files a/ml-agents/mlagents/trainers/optimizer/__pycache__/torch_optimizer.cpython-310.pyc and b/ml-agents/mlagents/trainers/optimizer/__pycache__/torch_optimizer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/poca/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/poca/__pycache__/__init__.cpython-310.pyc index aab9c3a7ffc7db8ad4820225d684cd08892302c3..fd862593bea18d42b4fefaf2bea35535bbc922ed 100644 Binary files a/ml-agents/mlagents/trainers/poca/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/poca/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/poca/__pycache__/optimizer_torch.cpython-310.pyc b/ml-agents/mlagents/trainers/poca/__pycache__/optimizer_torch.cpython-310.pyc index 0be0927e0592d5e458f762b9c2b4e0b94a9f045b..7bf89453c097c92497288148c0deaf85735c695c 100644 Binary files a/ml-agents/mlagents/trainers/poca/__pycache__/optimizer_torch.cpython-310.pyc and b/ml-agents/mlagents/trainers/poca/__pycache__/optimizer_torch.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/poca/__pycache__/trainer.cpython-310.pyc b/ml-agents/mlagents/trainers/poca/__pycache__/trainer.cpython-310.pyc index 184188815680f51792508b264194813626c7433c..43bb8821d0024edaa5393d6b5df446f1171b0671 100644 Binary files a/ml-agents/mlagents/trainers/poca/__pycache__/trainer.cpython-310.pyc and b/ml-agents/mlagents/trainers/poca/__pycache__/trainer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/policy/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/policy/__pycache__/__init__.cpython-310.pyc index 8133db8d7663ac42a34804461fc3898a8ff11634..88636e8edc36f81274eb327d1eaf7694f98fa1fc 100644 Binary files a/ml-agents/mlagents/trainers/policy/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/policy/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/policy/__pycache__/checkpoint_manager.cpython-310.pyc b/ml-agents/mlagents/trainers/policy/__pycache__/checkpoint_manager.cpython-310.pyc index 8cd32418b320de2a6c7087bebd6c98c0b54c8f53..e2026997082e80f028959d628742aef7130d4700 100644 Binary files a/ml-agents/mlagents/trainers/policy/__pycache__/checkpoint_manager.cpython-310.pyc and b/ml-agents/mlagents/trainers/policy/__pycache__/checkpoint_manager.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/policy/__pycache__/policy.cpython-310.pyc b/ml-agents/mlagents/trainers/policy/__pycache__/policy.cpython-310.pyc index 7d194c1e4dd3d37329b115a641f9a1fffb461c3e..bd8ad55be30c341edd37b5d30b62b558772c5e61 100644 Binary files a/ml-agents/mlagents/trainers/policy/__pycache__/policy.cpython-310.pyc and b/ml-agents/mlagents/trainers/policy/__pycache__/policy.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/policy/__pycache__/torch_policy.cpython-310.pyc b/ml-agents/mlagents/trainers/policy/__pycache__/torch_policy.cpython-310.pyc index 771116cd644001fa31a99a547e8fae829419f008..952f8316fc460f6610a0d9a43deaf66ae9cc9218 100644 Binary files a/ml-agents/mlagents/trainers/policy/__pycache__/torch_policy.cpython-310.pyc and b/ml-agents/mlagents/trainers/policy/__pycache__/torch_policy.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/ppo/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/ppo/__pycache__/__init__.cpython-310.pyc index efbb203181f6c16eff9a6ee935c326ac460a9b8e..0d3c977fd4661b82c39806003e83c3ab28618cb3 100644 Binary files a/ml-agents/mlagents/trainers/ppo/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/ppo/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/ppo/__pycache__/optimizer_torch.cpython-310.pyc b/ml-agents/mlagents/trainers/ppo/__pycache__/optimizer_torch.cpython-310.pyc index 43259d1f08f07ba58a69ec8072cc0cb040513417..84e18cc876c79bf7f67b4a3d651406233848b9bb 100644 Binary files a/ml-agents/mlagents/trainers/ppo/__pycache__/optimizer_torch.cpython-310.pyc and b/ml-agents/mlagents/trainers/ppo/__pycache__/optimizer_torch.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/ppo/__pycache__/trainer.cpython-310.pyc b/ml-agents/mlagents/trainers/ppo/__pycache__/trainer.cpython-310.pyc index d7b09a21764d5e7b27b8bd5ff73514c3feb0839b..f55a46f3e58a06c11a68f0f2fe87b04ed78800f5 100644 Binary files a/ml-agents/mlagents/trainers/ppo/__pycache__/trainer.cpython-310.pyc and b/ml-agents/mlagents/trainers/ppo/__pycache__/trainer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/sac/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/sac/__pycache__/__init__.cpython-310.pyc index 36c5f6e48b591d9843421a7fa913dde9dd9381cd..eb312fb2b2f04fd1eb4a87823d2a283d7523fad1 100644 Binary files a/ml-agents/mlagents/trainers/sac/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/sac/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/sac/__pycache__/optimizer_torch.cpython-310.pyc b/ml-agents/mlagents/trainers/sac/__pycache__/optimizer_torch.cpython-310.pyc index 61d98796e171d9921e1f22f34e730ee5610958e5..75c6c57258bfd8712a022f6b9809eae14c23f819 100644 Binary files a/ml-agents/mlagents/trainers/sac/__pycache__/optimizer_torch.cpython-310.pyc and b/ml-agents/mlagents/trainers/sac/__pycache__/optimizer_torch.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/sac/__pycache__/trainer.cpython-310.pyc b/ml-agents/mlagents/trainers/sac/__pycache__/trainer.cpython-310.pyc index afad26ef89f672760ca5a34433c664214cb67d5a..2db6b50839535604b1a88602726f829d990ebda8 100644 Binary files a/ml-agents/mlagents/trainers/sac/__pycache__/trainer.cpython-310.pyc and b/ml-agents/mlagents/trainers/sac/__pycache__/trainer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/__init__.cpython-310.pyc index 4271756c965015f0491d21c3d343a4200b303118..dd2914af5daa354d765947e91553d6fba9e54990 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_flattener.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_flattener.cpython-310.pyc index c20226cd062229e0144462ca9b176d1ace125ca8..8c64aafb600dd624b148d44011870f56c51889ab 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_flattener.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_flattener.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_log_probs.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_log_probs.cpython-310.pyc index 543df3d9e4f6f9cfd997292340a9c62a7dc71ace..e3fe0e66943306a5fa720427f9c743b513689a6f 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_log_probs.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_log_probs.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_model.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_model.cpython-310.pyc index 364b4cbc90fcde86d6350db18bb254f7a79e69d3..f1ddd45653effb7940abcbd8c62cc2bad0be39f6 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_model.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/action_model.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/agent_action.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/agent_action.cpython-310.pyc index a94638562c3f141e62bd95a44dc76cb1bb287044..b5c61e882374d87d88f44f4746af3831a12fe8e8 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/agent_action.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/agent_action.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/attention.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/attention.cpython-310.pyc index e6371ef83f66b57f9197dccf0b4a8138fb3f3e5e..045e5be271da03f5455bff26696c29c33fb01065 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/attention.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/attention.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/conditioning.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/conditioning.cpython-310.pyc index 2cf020d9c008c4fcf0c68561f8ab9474f17e32fc..941ed23c8a53d545478a288dee70540fde7adb5a 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/conditioning.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/conditioning.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/decoders.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/decoders.cpython-310.pyc index 5b10f53819dbb3000e697475584644081f2e539a..9cc51416c24766264cbc835acd678a201486ce7a 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/decoders.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/decoders.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/distributions.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/distributions.cpython-310.pyc index 5c95681c5c7d76db06adf03f9fc3134704a170fb..dce254999f6d81494b9868ae30b5adce5b4a7e7a 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/distributions.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/distributions.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/encoders.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/encoders.cpython-310.pyc index 62dd0f60ff9cc04b4ed62e822e28a2970c0a73aa..9c2ce0d305bd597e57a1413b6184b4aee716f5d1 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/encoders.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/encoders.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/layers.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/layers.cpython-310.pyc index fe6ec627dc878df2049b63b0b781f893779159b7..0ec6dfef67547112698a0102d3950d0bdd336c1f 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/layers.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/layers.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/model_serialization.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/model_serialization.cpython-310.pyc index 0f1a78be8874d2c07ac86a343f7010f132d06274..ea8621445f67a59e4d2b90f858bf6355ab4bce66 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/model_serialization.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/model_serialization.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/networks.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/networks.cpython-310.pyc index 4768e2ba3480b95aaa7ada0b0b606a9a2fe7e0d5..5765ca09017134860393399fd136d42d7120515d 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/networks.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/networks.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/__pycache__/utils.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/__pycache__/utils.cpython-310.pyc index da3dfae66822121e6bf851454c1a7d189387b3d9..92256bcf162bbaa750c70ee5211bdde7ec709d6d 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/__pycache__/utils.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/__pycache__/utils.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/__pycache__/__init__.cpython-310.pyc index ca44b52dbf409c015bc55abc665ca9bbeaf83ade..641b72d3c813df47e069890eb9610b1f39c4a41c 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/bc/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/bc/__pycache__/__init__.cpython-310.pyc index 539473993d9dc70a0640cc67adf44e790bf4286c..4c3ea319a9dc296041a17dc94ab614319106f0c5 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/bc/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/bc/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/bc/__pycache__/module.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/bc/__pycache__/module.cpython-310.pyc index a8bde817abb5da0c0bcc941ccb2389c47958625d..5342b332e4397944598c422cc9b40a57318edbdb 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/bc/__pycache__/module.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/bc/__pycache__/module.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/__init__.cpython-310.pyc index 711fed186d269af382762aec203d4f92d0384a08..782eb4156ba88e0c263292cfe48e012b160093c6 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/base_reward_provider.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/base_reward_provider.cpython-310.pyc index 184880491f4079b39ef3a6bdd8af9434dabe2c54..73752ffa1d981310f5f50b7a4a58d70b85fccb9a 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/base_reward_provider.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/base_reward_provider.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/curiosity_reward_provider.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/curiosity_reward_provider.cpython-310.pyc index 768115c5ac6e9c2fda64e8663d08c83b4ed39492..48b50f4477bf7660f72f7857e51f66a928038416 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/curiosity_reward_provider.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/curiosity_reward_provider.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/extrinsic_reward_provider.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/extrinsic_reward_provider.cpython-310.pyc index 0f9275a0a6dca805347d21bc76d8332c3bbf889e..a6a7eebfdbc5248b72b5f87b7428c2440f587799 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/extrinsic_reward_provider.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/extrinsic_reward_provider.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/gail_reward_provider.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/gail_reward_provider.cpython-310.pyc index 55d950e2f820f2feca2d72bf85661e3743f19e4d..8f43e29f57392f68160e957723ab84078db27987 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/gail_reward_provider.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/gail_reward_provider.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/reward_provider_factory.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/reward_provider_factory.cpython-310.pyc index 69d5ad62d7518b47046b6b0d8a7e3ae8b4c0f3ae..f0352201f4972546dabc8562927a66468378d50a 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/reward_provider_factory.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/reward_provider_factory.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/rnd_reward_provider.cpython-310.pyc b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/rnd_reward_provider.cpython-310.pyc index 3a18e62bf33c182c4e0591a0350aedb59085c5b8..984aee5eb4a05e07dc2204315d1e518ffbba0696 100644 Binary files a/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/rnd_reward_provider.cpython-310.pyc and b/ml-agents/mlagents/trainers/torch_entities/components/reward_providers/__pycache__/rnd_reward_provider.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/trainer/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/trainers/trainer/__pycache__/__init__.cpython-310.pyc index 4e89c2a16ff14c37fa9d3c00399f07a53b900801..156997172eef7d27a3ec4efeca4e59d3b9215a7c 100644 Binary files a/ml-agents/mlagents/trainers/trainer/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/trainers/trainer/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/trainer/__pycache__/off_policy_trainer.cpython-310.pyc b/ml-agents/mlagents/trainers/trainer/__pycache__/off_policy_trainer.cpython-310.pyc index 139039852e469605223fc0e5e8e5c31f7e229783..9abe9765c7f1b14cd675f96d31e20763fe079116 100644 Binary files a/ml-agents/mlagents/trainers/trainer/__pycache__/off_policy_trainer.cpython-310.pyc and b/ml-agents/mlagents/trainers/trainer/__pycache__/off_policy_trainer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/trainer/__pycache__/on_policy_trainer.cpython-310.pyc b/ml-agents/mlagents/trainers/trainer/__pycache__/on_policy_trainer.cpython-310.pyc index 378becdf02f391abbab6a78c8156a600c0d570dd..baca386f92b5352f69edb9f2efe7511410061ba3 100644 Binary files a/ml-agents/mlagents/trainers/trainer/__pycache__/on_policy_trainer.cpython-310.pyc and b/ml-agents/mlagents/trainers/trainer/__pycache__/on_policy_trainer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/trainer/__pycache__/rl_trainer.cpython-310.pyc b/ml-agents/mlagents/trainers/trainer/__pycache__/rl_trainer.cpython-310.pyc index 0667b3a51ba66ccc96407398756c6bc70e2db3fe..7ef35693ff18d5f75a7ce5b1e2623882ef44de26 100644 Binary files a/ml-agents/mlagents/trainers/trainer/__pycache__/rl_trainer.cpython-310.pyc and b/ml-agents/mlagents/trainers/trainer/__pycache__/rl_trainer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/trainer/__pycache__/trainer.cpython-310.pyc b/ml-agents/mlagents/trainers/trainer/__pycache__/trainer.cpython-310.pyc index bd9d3a4468ca9b8a6e243e4bd513701ca55716e0..f5e4216be8170c6c64821d6330074dc3e9f11706 100644 Binary files a/ml-agents/mlagents/trainers/trainer/__pycache__/trainer.cpython-310.pyc and b/ml-agents/mlagents/trainers/trainer/__pycache__/trainer.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/trainer/__pycache__/trainer_factory.cpython-310.pyc b/ml-agents/mlagents/trainers/trainer/__pycache__/trainer_factory.cpython-310.pyc index 5d530179ece47b039b63c36123120cf9cfac011b..b46e7498ec66337131a1d26a1aca671730bc4c87 100644 Binary files a/ml-agents/mlagents/trainers/trainer/__pycache__/trainer_factory.cpython-310.pyc and b/ml-agents/mlagents/trainers/trainer/__pycache__/trainer_factory.cpython-310.pyc differ diff --git a/ml-agents/mlagents/trainers/trainer/__pycache__/trainer_utils.cpython-310.pyc b/ml-agents/mlagents/trainers/trainer/__pycache__/trainer_utils.cpython-310.pyc index 8853b0e0d0204389e232dfa62ad110a78bbec833..7bcb01942f52c36e406b01a4677d727c6fc1e683 100644 Binary files a/ml-agents/mlagents/trainers/trainer/__pycache__/trainer_utils.cpython-310.pyc and b/ml-agents/mlagents/trainers/trainer/__pycache__/trainer_utils.cpython-310.pyc differ diff --git a/ml-agents/mlagents/utils/__pycache__/__init__.cpython-310.pyc b/ml-agents/mlagents/utils/__pycache__/__init__.cpython-310.pyc index 5286b7cce244893951f7b12ef213f75bb1071bf3..88b3c2d1b3b28237cecfc1fbf1c3e63d1a8a6391 100644 Binary files a/ml-agents/mlagents/utils/__pycache__/__init__.cpython-310.pyc and b/ml-agents/mlagents/utils/__pycache__/__init__.cpython-310.pyc differ diff --git a/ml-agents/mlagents/utils/__pycache__/push_to_hf.cpython-310.pyc b/ml-agents/mlagents/utils/__pycache__/push_to_hf.cpython-310.pyc index b3ef5e996ac25892e9c9c81150a3f661629d55aa..b18b239d737e6ab3ee9a69633cc8f1359b0cbadd 100644 Binary files a/ml-agents/mlagents/utils/__pycache__/push_to_hf.cpython-310.pyc and b/ml-agents/mlagents/utils/__pycache__/push_to_hf.cpython-310.pyc differ diff --git a/results/Pyramids Training/Pyramids.onnx b/results/Pyramids Training/Pyramids.onnx index f9ea165567dd02a77b179b2b8af4a70f36189b1d..31afef316d7d10f51827bf553b4f002040adc602 100644 --- a/results/Pyramids Training/Pyramids.onnx +++ b/results/Pyramids Training/Pyramids.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d3d49743dbc47dfc239a581bddc3e92eeebf83852350f4c641406c16b2e894a0 +oid sha256:fd0ec5688eecb36dfc6d50b15b852b07b0480ccb3b92fc43e6b96b9b54930ac6 size 1418184 diff --git a/results/Pyramids Training/Pyramids/Pyramids-1000115.onnx b/results/Pyramids Training/Pyramids/Pyramids-1000115.onnx new file mode 100644 index 0000000000000000000000000000000000000000..31afef316d7d10f51827bf553b4f002040adc602 --- /dev/null +++ b/results/Pyramids Training/Pyramids/Pyramids-1000115.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd0ec5688eecb36dfc6d50b15b852b07b0480ccb3b92fc43e6b96b9b54930ac6 +size 1418184 diff --git a/results/Pyramids Training/Pyramids/Pyramids-1000115.pt b/results/Pyramids Training/Pyramids/Pyramids-1000115.pt new file mode 100644 index 0000000000000000000000000000000000000000..44ae617209f943a91482a3faa83e80180bbce4ac --- /dev/null +++ b/results/Pyramids Training/Pyramids/Pyramids-1000115.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50383044fe53ed1fc4901ea6c869d4f5684df293a7c4f2f8064605aa8714a5f8 +size 8650990 diff --git a/results/Pyramids Training/Pyramids/Pyramids-499967.onnx b/results/Pyramids Training/Pyramids/Pyramids-499967.onnx new file mode 100644 index 0000000000000000000000000000000000000000..394cccc46c569cc85c59bc0c1d9a79f525815c53 --- /dev/null +++ b/results/Pyramids Training/Pyramids/Pyramids-499967.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:359a5858813a136967df685c6ddc1789e9fdbcbd8ef8cc79ce0fb35be820ebfe +size 1418184 diff --git a/results/Pyramids Training/Pyramids/Pyramids-499967.pt b/results/Pyramids Training/Pyramids/Pyramids-499967.pt new file mode 100644 index 0000000000000000000000000000000000000000..964d8d3ae202bf13b8b6586ddae05515d905804a --- /dev/null +++ b/results/Pyramids Training/Pyramids/Pyramids-499967.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f3279d3bb67d07b9903ed0123175ae1f3667ed1d14b2e59d6c62b494750d2c4 +size 8650990 diff --git a/results/Pyramids Training/Pyramids/Pyramids-999987.onnx b/results/Pyramids Training/Pyramids/Pyramids-999987.onnx new file mode 100644 index 0000000000000000000000000000000000000000..31afef316d7d10f51827bf553b4f002040adc602 --- /dev/null +++ b/results/Pyramids Training/Pyramids/Pyramids-999987.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd0ec5688eecb36dfc6d50b15b852b07b0480ccb3b92fc43e6b96b9b54930ac6 +size 1418184 diff --git a/results/Pyramids Training/Pyramids/Pyramids-999987.pt b/results/Pyramids Training/Pyramids/Pyramids-999987.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a839d64b4417c4c0c339aa54891f7f3a838b70a --- /dev/null +++ b/results/Pyramids Training/Pyramids/Pyramids-999987.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2bc91d619b0608918fecb18149fae257035f5d9ac342396d3a339c2285d849 +size 8650990 diff --git a/results/Pyramids Training/Pyramids/checkpoint.pt b/results/Pyramids Training/Pyramids/checkpoint.pt index 5e2775ca5fe2b8535ecdf7b15179fe19fbcfedc3..44ae617209f943a91482a3faa83e80180bbce4ac 100644 --- a/results/Pyramids Training/Pyramids/checkpoint.pt +++ b/results/Pyramids Training/Pyramids/checkpoint.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:68ced699fa330f474c5a12cd254aac59d8872a29b4b0fe098f839f10c309bf4a +oid sha256:50383044fe53ed1fc4901ea6c869d4f5684df293a7c4f2f8064605aa8714a5f8 size 8650990 diff --git a/results/Pyramids Training/Pyramids/events.out.tfevents.1692805953.71b50ae053ce.1485.0 b/results/Pyramids Training/Pyramids/events.out.tfevents.1692805953.71b50ae053ce.1485.0 new file mode 100644 index 0000000000000000000000000000000000000000..7ad17d3d067c8892ff6930dfd2ccbb7ac8afee65 Binary files /dev/null and b/results/Pyramids Training/Pyramids/events.out.tfevents.1692805953.71b50ae053ce.1485.0 differ diff --git a/results/Pyramids Training/configuration.yaml b/results/Pyramids Training/configuration.yaml index d747af353b305feb208147f3185d0cc5223f2008..fa80105747b57afb5427d818598fb36179afbb2a 100644 --- a/results/Pyramids Training/configuration.yaml +++ b/results/Pyramids Training/configuration.yaml @@ -51,7 +51,7 @@ behaviors: init_path: null keep_checkpoints: 5 even_checkpoints: false - max_steps: 100000 + max_steps: 1000000 time_horizon: 128 summary_freq: 30000 threaded: false diff --git a/results/Pyramids Training/run_logs/Player-0.log b/results/Pyramids Training/run_logs/Player-0.log index 5145a430cd75f77e5efeb85c664a610de8274219..df9f079f00f3d4f71b876437fe92d87c018f1fc1 100644 --- a/results/Pyramids Training/run_logs/Player-0.log +++ b/results/Pyramids Training/run_logs/Player-0.log @@ -1,7 +1,7 @@ Mono path[0] = '/content/ml-agents/training-envs-executables/linux/Pyramids/Pyramids_Data/Managed' Mono config path = '/content/ml-agents/training-envs-executables/linux/Pyramids/Pyramids_Data/MonoBleedingEdge/etc' Found 1 interfaces on host : 0) 172.28.0.12 -Multi-casting "[IP] 172.28.0.12 [Port] 55029 [Flags] 2 [Guid] 2863475657 [EditorId] 764847374 [Version] 1048832 [Id] LinuxPlayer(13,172.28.0.12) [Debug] 0 [PackageName] LinuxPlayer [ProjectName] UnityEnvironment" to [225.0.0.222:54997]... +Multi-casting "[IP] 172.28.0.12 [Port] 55239 [Flags] 2 [Guid] 3434094306 [EditorId] 764847374 [Version] 1048832 [Id] LinuxPlayer(13,172.28.0.12) [Debug] 0 [PackageName] LinuxPlayer [ProjectName] UnityEnvironment" to [225.0.0.222:54997]... Preloaded 'lib_burst_generated.so' Preloaded 'libgrpc_csharp_ext.x64.so' PlayerPrefs - Creating folder: /root/.config/unity3d/Unity Technologies @@ -36,7 +36,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default FMOD failed to initialize the output device.: "Error initializing output device. " (60) FMOD initialized on nosound output Begin MonoManager ReloadAssembly -- Completed reload, in 0.146 seconds +- Completed reload, in 0.213 seconds ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable) ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable) ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable) @@ -68,7 +68,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f WARNING: Shader Unsupported: 'Standard' - All subshaders removed WARNING: Shader Did you use #pragma only_renderers and omit this platform? WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off? -UnloadTime: 1.131512 ms +UnloadTime: 1.190950 ms ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable) requesting resize 84 x 84 Setting up 1 worker threads for Enlighten. @@ -76,7 +76,7 @@ PlayerConnection::CleanupMemory Statistics: [ALLOC_TEMP_TLS] TLS Allocator StackAllocators : [ALLOC_TEMP_MAIN] - Peak usage frame count: [16.0 KB-32.0 KB]: 1556 frames, [32.0 KB-64.0 KB]: 266 frames, [64.0 KB-128.0 KB]: 54 frames, [2.0 MB-4.0 MB]: 1 frames + Peak usage frame count: [16.0 KB-32.0 KB]: 4385 frames, [32.0 KB-64.0 KB]: 11769 frames, [64.0 KB-128.0 KB]: 2616 frames, [2.0 MB-4.0 MB]: 1 frames Initial Block Size 4.0 MB Current Block Size 4.0 MB Peak Allocated Bytes 2.0 MB @@ -131,12 +131,12 @@ PlayerConnection::CleanupMemory Statistics: Current Block Size 32.0 KB Peak Allocated Bytes 0 B Overflow Count 0 - [ALLOC_TEMP_Background Job.Worker 7] + [ALLOC_TEMP_Background Job.Worker 15] Initial Block Size 32.0 KB Current Block Size 32.0 KB Peak Allocated Bytes 0 B Overflow Count 0 - [ALLOC_TEMP_Background Job.Worker 15] + [ALLOC_TEMP_Background Job.Worker 7] Initial Block Size 32.0 KB Current Block Size 32.0 KB Peak Allocated Bytes 0 B @@ -207,28 +207,28 @@ PlayerConnection::CleanupMemory Statistics: Peak Allocated Bytes 128 B Overflow Count 0 [ALLOC_MEMORYPROFILER] - Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 1578 frames + Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 18472 frames Requested Block Size 1.0 MB Peak Block count 2 Peak Allocated memory 1.6 MB Peak Large allocation bytes 0 B [ALLOC_DEFAULT] Dual Thread Allocator - Peak main deferred allocation count 12451 + Peak main deferred allocation count 12313 [ALLOC_BUCKET] Large Block size 4.0 MB Used Block count 1 Peak Allocated bytes 1.7 MB [ALLOC_DEFAULT_MAIN] - Peak usage frame count: [8.0 MB-16.0 MB]: 1 frames, [16.0 MB-32.0 MB]: 1876 frames + Peak usage frame count: [8.0 MB-16.0 MB]: 7 frames, [16.0 MB-32.0 MB]: 18764 frames Requested Block Size 16.0 MB Peak Block count 3 - Peak Allocated memory 30.7 MB + Peak Allocated memory 29.0 MB Peak Large allocation bytes 0 B [ALLOC_DEFAULT_THREAD] - Peak usage frame count: [16.0 MB-32.0 MB]: 1877 frames + Peak usage frame count: [16.0 MB-32.0 MB]: 18771 frames Requested Block Size 16.0 MB Peak Block count 1 - Peak Allocated memory 23.1 MB + Peak Allocated memory 24.7 MB Peak Large allocation bytes 16.0 MB [ALLOC_TEMP_JOB_1_FRAME] Initial Block Size 2.0 MB @@ -257,13 +257,13 @@ PlayerConnection::CleanupMemory Statistics: Used Block count 1 Peak Allocated bytes 1.7 MB [ALLOC_GFX_MAIN] - Peak usage frame count: [32.0 KB-64.0 KB]: 1876 frames, [64.0 KB-128.0 KB]: 1 frames + Peak usage frame count: [32.0 KB-64.0 KB]: 18770 frames, [64.0 KB-128.0 KB]: 1 frames Requested Block Size 16.0 MB Peak Block count 1 Peak Allocated memory 67.0 KB Peak Large allocation bytes 0 B [ALLOC_GFX_THREAD] - Peak usage frame count: [64.0 KB-128.0 KB]: 1877 frames + Peak usage frame count: [64.0 KB-128.0 KB]: 18771 frames Requested Block Size 16.0 MB Peak Block count 1 Peak Allocated memory 67.7 KB @@ -275,16 +275,16 @@ PlayerConnection::CleanupMemory Statistics: Used Block count 1 Peak Allocated bytes 1.7 MB [ALLOC_CACHEOBJECTS_MAIN] - Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 1578 frames + Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 18472 frames Requested Block Size 4.0 MB Peak Block count 1 Peak Allocated memory 1.4 MB Peak Large allocation bytes 0 B [ALLOC_CACHEOBJECTS_THREAD] - Peak usage frame count: [1.0 MB-2.0 MB]: 1876 frames, [2.0 MB-4.0 MB]: 1 frames + Peak usage frame count: [1.0 MB-2.0 MB]: 18770 frames, [4.0 MB-8.0 MB]: 1 frames Requested Block Size 4.0 MB - Peak Block count 1 - Peak Allocated memory 3.9 MB + Peak Block count 2 + Peak Allocated memory 4.4 MB Peak Large allocation bytes 0 B [ALLOC_TYPETREE] Dual Thread Allocator Peak main deferred allocation count 0 @@ -293,25 +293,25 @@ PlayerConnection::CleanupMemory Statistics: Used Block count 1 Peak Allocated bytes 1.7 MB [ALLOC_TYPETREE_MAIN] - Peak usage frame count: [0-1.0 KB]: 1877 frames + Peak usage frame count: [0-1.0 KB]: 18771 frames Requested Block Size 2.0 MB Peak Block count 1 Peak Allocated memory 1.0 KB Peak Large allocation bytes 0 B [ALLOC_TYPETREE_THREAD] - Peak usage frame count: [1.0 KB-2.0 KB]: 1877 frames + Peak usage frame count: [1.0 KB-2.0 KB]: 18771 frames Requested Block Size 2.0 MB Peak Block count 1 Peak Allocated memory 1.9 KB Peak Large allocation bytes 0 B [ALLOC_PROFILER] - Peak usage frame count: [16.0 KB-32.0 KB]: 1877 frames + Peak usage frame count: [16.0 KB-32.0 KB]: 18771 frames Requested Block Size 16.0 MB Peak Block count 1 - Peak Allocated memory 28.5 KB + Peak Allocated memory 29.1 KB Peak Large allocation bytes 0 B [ALLOC_PROFILER_BUCKET] Large Block size 4.0 MB Used Block count 1 Peak Allocated bytes 396 B -##utp:{"type":"MemoryLeaks","version":2,"phase":"Immediate","time":1692804747732,"processId":1713,"allocatedMemory":1970133,"memoryLabels":[{"Default":9033},{"Permanent":1264},{"NewDelete":12801},{"Thread":34460},{"Manager":10603},{"VertexData":12},{"Geometry":280},{"Texture":16},{"Shader":69173},{"Material":24},{"GfxDevice":35248},{"Animation":304},{"Audio":3976},{"Physics":288},{"Serialization":216},{"Input":9176},{"JobScheduler":200},{"Mono":40},{"ScriptingNativeRuntime":216},{"BaseObject":1609212},{"Resource":592},{"Renderer":1936},{"Transform":48},{"File":800},{"WebCam":24},{"Culling":40},{"Terrain":953},{"Wind":24},{"String":3447},{"DynamicArray":30868},{"HashMap":7680},{"Utility":1360},{"PoolAlloc":1160},{"TypeTree":1792},{"ScriptManager":80},{"RuntimeInitializeOnLoadManager":72},{"SpriteAtlas":112},{"GI":3272},{"Unet":16},{"Director":7760},{"WebRequest":720},{"VR":45473},{"SceneManager":424},{"Video":32},{"LazyScriptCache":32},{"NativeArray":384},{"Camera":25},{"Secure":1},{"SerializationCache":624},{"APIUpdating":5872},{"Subsystems":384},{"VirtualTexturing":57552},{"AssetReference":32}]} +##utp:{"type":"MemoryLeaks","version":2,"phase":"Immediate","time":1692808327224,"processId":1509,"allocatedMemory":1970133,"memoryLabels":[{"Default":9033},{"Permanent":1264},{"NewDelete":12801},{"Thread":34460},{"Manager":10603},{"VertexData":12},{"Geometry":280},{"Texture":16},{"Shader":69173},{"Material":24},{"GfxDevice":35248},{"Animation":304},{"Audio":3976},{"Physics":288},{"Serialization":216},{"Input":9176},{"JobScheduler":200},{"Mono":40},{"ScriptingNativeRuntime":216},{"BaseObject":1609212},{"Resource":592},{"Renderer":1936},{"Transform":48},{"File":800},{"WebCam":24},{"Culling":40},{"Terrain":953},{"Wind":24},{"String":3447},{"DynamicArray":30868},{"HashMap":7680},{"Utility":1360},{"PoolAlloc":1160},{"TypeTree":1792},{"ScriptManager":80},{"RuntimeInitializeOnLoadManager":72},{"SpriteAtlas":112},{"GI":3272},{"Unet":16},{"Director":7760},{"WebRequest":720},{"VR":45473},{"SceneManager":424},{"Video":32},{"LazyScriptCache":32},{"NativeArray":384},{"Camera":25},{"Secure":1},{"SerializationCache":624},{"APIUpdating":5872},{"Subsystems":384},{"VirtualTexturing":57552},{"AssetReference":32}]} diff --git a/results/Pyramids Training/run_logs/timers.json b/results/Pyramids Training/run_logs/timers.json index 414ea86f29620576a959bc06000a38e3e31de9d3..240808ac07796d0b4747e27f8613c62dc6a53063 100644 --- a/results/Pyramids Training/run_logs/timers.json +++ b/results/Pyramids Training/run_logs/timers.json @@ -2,189 +2,189 @@ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { - "value": 0.8312854170799255, - "min": 0.8312854170799255, - "max": 1.3563001155853271, - "count": 3 + "value": 0.44153398275375366, + "min": 0.44153398275375366, + "max": 1.3355467319488525, + "count": 33 }, "Pyramids.Policy.Entropy.sum": { - "value": 24898.66015625, - "min": 24898.66015625, - "max": 41144.71875, - "count": 3 + "value": 13281.341796875, + "min": 13281.341796875, + "max": 40515.14453125, + "count": 33 }, "Pyramids.Step.mean": { - "value": 89928.0, - "min": 29952.0, - "max": 89928.0, - "count": 3 + "value": 989934.0, + "min": 29938.0, + "max": 989934.0, + "count": 33 }, "Pyramids.Step.sum": { - "value": 89928.0, - "min": 29952.0, - "max": 89928.0, - "count": 3 + "value": 989934.0, + "min": 29938.0, + "max": 989934.0, + "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { - "value": -0.08230863511562347, - "min": -0.08230863511562347, - "max": 0.10929840058088303, - "count": 3 + "value": 0.5360538959503174, + "min": -0.09771484136581421, + "max": 0.5360538959503174, + "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { - "value": -19.754072189331055, - "min": -19.754072189331055, - "max": 25.90372085571289, - "count": 3 + "value": 147.41482543945312, + "min": -23.744707107543945, + "max": 147.41482543945312, + "count": 33 }, "Pyramids.Policy.RndValueEstimate.mean": { - "value": 0.2390647828578949, - "min": 0.2390647828578949, - "max": 0.4782101809978485, - "count": 3 + "value": 0.045880451798439026, + "min": 0.010581070557236671, + "max": 0.5021049976348877, + "count": 33 }, "Pyramids.Policy.RndValueEstimate.sum": { - "value": 57.37554931640625, - "min": 57.37554931640625, - "max": 113.3358154296875, - "count": 3 + "value": 12.617124557495117, + "min": 2.888632297515869, + "max": 118.99888610839844, + "count": 33 }, "Pyramids.Losses.PolicyLoss.mean": { - "value": 0.06781620180218115, - "min": 0.06781620180218115, - "max": 0.07437090419963259, - "count": 3 + "value": 0.06800152817611686, + "min": 0.0626208541326793, + "max": 0.07585402798444363, + "count": 33 }, "Pyramids.Losses.PolicyLoss.sum": { - "value": 0.6103458162196304, - "min": 0.5205963293974282, - "max": 0.6228010015109029, - "count": 3 + "value": 1.020022922641753, + "min": 0.5309781958911054, + "max": 1.0388171774815704, + "count": 33 }, "Pyramids.Losses.ValueLoss.mean": { - "value": 0.00028290575580746486, - "min": 0.00028290575580746486, - "max": 0.017566065812303716, - "count": 3 + "value": 0.016296319718498528, + "min": 0.0003848882069151467, + "max": 0.016296319718498528, + "count": 33 }, "Pyramids.Losses.ValueLoss.sum": { - "value": 0.0025461518022671836, - "min": 0.0025461518022671836, - "max": 0.12296246068612601, - "count": 3 + "value": 0.24444479577747794, + "min": 0.0053884348968120535, + "max": 0.24444479577747794, + "count": 33 }, "Pyramids.Policy.LearningRate.mean": { - "value": 7.47974084008889e-05, - "min": 7.47974084008889e-05, - "max": 0.0002515063018788571, - "count": 3 + "value": 7.44773751745333e-06, + "min": 7.44773751745333e-06, + "max": 0.0002952335158745429, + "count": 33 }, "Pyramids.Policy.LearningRate.sum": { - "value": 0.000673176675608, - "min": 0.000673176675608, - "max": 0.0017605441131519997, - "count": 3 + "value": 0.00011171606276179995, + "min": 0.00011171606276179995, + "max": 0.0033756046747984996, + "count": 33 }, "Pyramids.Policy.Epsilon.mean": { - "value": 0.12493244444444446, - "min": 0.12493244444444446, - "max": 0.1838354285714286, - "count": 3 + "value": 0.10248254666666669, + "min": 0.10248254666666669, + "max": 0.19841117142857143, + "count": 33 }, "Pyramids.Policy.Epsilon.sum": { - "value": 1.124392, - "min": 1.124392, - "max": 1.3864400000000001, - "count": 3 + "value": 1.5372382000000002, + "min": 1.3888782, + "max": 2.4442315, + "count": 33 }, "Pyramids.Policy.Beta.mean": { - "value": 0.0025007512, - "min": 0.0025007512, - "max": 0.008385159314285713, - "count": 3 + "value": 0.00025800641199999995, + "min": 0.00025800641199999995, + "max": 0.009841276025714286, + "count": 33 }, "Pyramids.Policy.Beta.sum": { - "value": 0.0225067608, - "min": 0.0225067608, - "max": 0.058696115199999996, - "count": 3 + "value": 0.0038700961799999992, + "min": 0.0038700961799999992, + "max": 0.11253762985000001, + "count": 33 }, "Pyramids.Losses.RNDLoss.mean": { - "value": 0.12777526676654816, - "min": 0.12777526676654816, - "max": 0.6339518427848816, - "count": 3 + "value": 0.011442345567047596, + "min": 0.011442345567047596, + "max": 0.5378549695014954, + "count": 33 }, "Pyramids.Losses.RNDLoss.sum": { - "value": 1.149977445602417, - "min": 1.149977445602417, - "max": 4.4376630783081055, - "count": 3 + "value": 0.17163518071174622, + "min": 0.1698571741580963, + "max": 3.764984607696533, + "count": 33 }, "Pyramids.Environment.EpisodeLength.mean": { - "value": 999.0, - "min": 986.3939393939394, + "value": 346.6024096385542, + "min": 331.79545454545456, "max": 999.0, - "count": 3 + "count": 33 }, "Pyramids.Environment.EpisodeLength.sum": { - "value": 31968.0, - "min": 15984.0, - "max": 32551.0, - "count": 3 + "value": 28768.0, + "min": 16737.0, + "max": 33458.0, + "count": 33 }, "Pyramids.Environment.CumulativeReward.mean": { - "value": -1.0000000521540642, - "min": -1.0000000521540642, - "max": -0.9267576264612603, - "count": 3 + "value": 1.60518793223134, + "min": -0.9999226326903989, + "max": 1.60518793223134, + "count": 33 }, "Pyramids.Environment.CumulativeReward.sum": { - "value": -32.000001668930054, - "min": -32.000001668930054, - "max": -16.000000834465027, - "count": 3 + "value": 133.23059837520123, + "min": -30.997601613402367, + "max": 140.7999990209937, + "count": 33 }, "Pyramids.Policy.ExtrinsicReward.mean": { - "value": -1.0000000521540642, - "min": -1.0000000521540642, - "max": -0.9267576264612603, - "count": 3 + "value": 1.60518793223134, + "min": -0.9999226326903989, + "max": 1.60518793223134, + "count": 33 }, "Pyramids.Policy.ExtrinsicReward.sum": { - "value": -32.000001668930054, - "min": -32.000001668930054, - "max": -16.000000834465027, - "count": 3 + "value": 133.23059837520123, + "min": -30.997601613402367, + "max": 140.7999990209937, + "count": 33 }, "Pyramids.Policy.RndReward.mean": { - "value": 1.4460240851622075, - "min": 1.4460240851622075, - "max": 13.75953196361661, - "count": 3 + "value": 0.04125872459115337, + "min": 0.04125872459115337, + "max": 10.914842418011498, + "count": 33 }, "Pyramids.Policy.RndReward.sum": { - "value": 46.27277072519064, - "min": 46.27277072519064, - "max": 220.15251141786575, - "count": 3 + "value": 3.42447414106573, + "min": 3.42447414106573, + "max": 185.55232110619545, + "count": 33 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, - "count": 3 + "count": 33 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, - "count": 3 + "count": 33 } }, "metadata": { "timer_format_version": "0.1.0", - "start_time_seconds": "1692804543", + "start_time_seconds": "1692805951", "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "0.31.0.dev0", @@ -192,59 +192,59 @@ "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", - "end_time_seconds": "1692804747" + "end_time_seconds": "1692808327" }, - "total": 204.19198903099993, + "total": 2375.802249766, "count": 1, - "self": 0.4899939809998841, + "self": 0.5414836889999606, "children": { "run_training.setup": { - "total": 0.06392974700003151, + "total": 0.08603750300000002, "count": 1, - "self": 0.06392974700003151 + "self": 0.08603750300000002 }, "TrainerController.start_learning": { - "total": 203.63806530300002, + "total": 2375.174728574, "count": 1, - "self": 0.11630722500376578, + "self": 1.6104274699587222, "children": { "TrainerController._reset_env": { - "total": 5.664806805000012, + "total": 6.435223317000009, "count": 1, - "self": 5.664806805000012 + "self": 6.435223317000009 }, "TrainerController.advance": { - "total": 197.68372270599633, - "count": 6256, - "self": 0.12858404899691322, + "total": 2367.0318223880404, + "count": 63669, + "self": 1.6474626610411178, "children": { "env_step": { - "total": 128.0640337120036, - "count": 6256, - "self": 117.52189123600681, + "total": 1656.2595894459862, + "count": 63669, + "self": 1529.6149483669933, "children": { "SubprocessEnvManager._take_step": { - "total": 10.468025390996502, - "count": 6256, - "self": 0.460955429995181, + "total": 125.62256894601364, + "count": 63669, + "self": 5.285052924938384, "children": { "TorchPolicy.evaluate": { - "total": 10.00706996100132, - "count": 6256, - "self": 10.00706996100132 + "total": 120.33751602107526, + "count": 62568, + "self": 120.33751602107526 } } }, "workers": { - "total": 0.0741170850002959, - "count": 6256, + "total": 1.02207213297919, + "count": 63669, "self": 0.0, "children": { "worker_root": { - "total": 202.8067307250015, - "count": 6256, + "total": 2369.5006298850412, + "count": 63669, "is_parallel": true, - "self": 96.13989460700554, + "self": 970.9220600870476, "children": { "run_training.setup": { "total": 0.0, @@ -253,48 +253,48 @@ "self": 0.0, "children": { "steps_from_proto": { - "total": 0.007218233000003238, + "total": 0.006806372999960786, "count": 1, "is_parallel": true, - "self": 0.005098795999913364, + "self": 0.004339678999883745, "children": { "_process_rank_one_or_two_observation": { - "total": 0.0021194370000898743, + "total": 0.002466694000077041, "count": 8, "is_parallel": true, - "self": 0.0021194370000898743 + "self": 0.002466694000077041 } } }, "UnityEnvironment.step": { - "total": 0.048321342999997796, + "total": 0.05508127199999535, "count": 1, "is_parallel": true, - "self": 0.0006320440000422423, + "self": 0.0006543889999761632, "children": { "UnityEnvironment._generate_step_input": { - "total": 0.0004916980000189142, + "total": 0.0005038240000203587, "count": 1, "is_parallel": true, - "self": 0.0004916980000189142 + "self": 0.0005038240000203587 }, "communicator.exchange": { - "total": 0.04510858199995482, + "total": 0.05190107900000385, "count": 1, "is_parallel": true, - "self": 0.04510858199995482 + "self": 0.05190107900000385 }, "steps_from_proto": { - "total": 0.0020890189999818176, + "total": 0.002021979999994983, "count": 1, "is_parallel": true, - "self": 0.00039074199986544045, + "self": 0.0003985949999218974, "children": { "_process_rank_one_or_two_observation": { - "total": 0.0016982770001163772, + "total": 0.0016233850000730854, "count": 8, "is_parallel": true, - "self": 0.0016982770001163772 + "self": 0.0016233850000730854 } } } @@ -303,34 +303,34 @@ } }, "UnityEnvironment.step": { - "total": 106.66683611799596, - "count": 6255, + "total": 1398.5785697979936, + "count": 63668, "is_parallel": true, - "self": 3.402988120983821, + "self": 38.27181555097968, "children": { "UnityEnvironment._generate_step_input": { - "total": 2.3105800810022856, - "count": 6255, + "total": 24.648736908995204, + "count": 63668, "is_parallel": true, - "self": 2.3105800810022856 + "self": 24.648736908995204 }, "communicator.exchange": { - "total": 90.51425783600394, - "count": 6255, + "total": 1218.9988498530163, + "count": 63668, "is_parallel": true, - "self": 90.51425783600394 + "self": 1218.9988498530163 }, "steps_from_proto": { - "total": 10.439010080005914, - "count": 6255, + "total": 116.65916748500229, + "count": 63668, "is_parallel": true, - "self": 2.016303890011045, + "self": 23.363543891041104, "children": { "_process_rank_one_or_two_observation": { - "total": 8.42270618999487, - "count": 50040, + "total": 93.29562359396118, + "count": 509344, "is_parallel": true, - "self": 8.42270618999487 + "self": 93.29562359396118 } } } @@ -343,24 +343,31 @@ } }, "trainer_advance": { - "total": 69.49110494499581, - "count": 6256, - "self": 0.1492662109924936, + "total": 709.1247702810131, + "count": 63669, + "self": 3.075229964958453, "children": { "process_trajectory": { - "total": 10.805358220003086, - "count": 6256, - "self": 10.805358220003086 + "total": 118.341159932057, + "count": 63669, + "self": 118.128314521057, + "children": { + "RLTrainer._checkpoint": { + "total": 0.21284541099998933, + "count": 2, + "self": 0.21284541099998933 + } + } }, "_update_policy": { - "total": 58.53648051400023, - "count": 28, - "self": 39.11264502799969, + "total": 587.7083803839976, + "count": 450, + "self": 383.09043097799736, "children": { "TorchPPOOptimizer.update": { - "total": 19.42383548600054, - "count": 2286, - "self": 19.42383548600054 + "total": 204.6179494060002, + "count": 22770, + "self": 204.6179494060002 } } } @@ -369,19 +376,19 @@ } }, "trainer_threads": { - "total": 1.4109999710854026e-06, + "total": 9.660002433520276e-07, "count": 1, - "self": 1.4109999710854026e-06 + "self": 9.660002433520276e-07 }, "TrainerController._save_models": { - "total": 0.173227155999939, + "total": 0.09725443300021652, "count": 1, - "self": 0.002028516999871499, + "self": 0.001454587000353058, "children": { "RLTrainer._checkpoint": { - "total": 0.1711986390000675, + "total": 0.09579984599986346, "count": 1, - "self": 0.1711986390000675 + "self": 0.09579984599986346 } } } diff --git a/results/Pyramids Training/run_logs/training_status.json b/results/Pyramids Training/run_logs/training_status.json index 381327128fed52188fc009e6e6603f2b70aa4cd3..1c529c021d7ccc4cc41f2d1c323408e533bd6ec9 100644 --- a/results/Pyramids Training/run_logs/training_status.json +++ b/results/Pyramids Training/run_logs/training_status.json @@ -2,22 +2,40 @@ "Pyramids": { "checkpoints": [ { - "steps": 100064, - "file_path": "results/Pyramids Training/Pyramids/Pyramids-100064.onnx", - "reward": null, - "creation_time": 1692804747.3104196, + "steps": 499967, + "file_path": "results/Pyramids Training/Pyramids/Pyramids-499967.onnx", + "reward": -0.9992000460624695, + "creation_time": 1692807092.771054, "auxillary_file_paths": [ - "results/Pyramids Training/Pyramids/Pyramids-100064.pt" + "results/Pyramids Training/Pyramids/Pyramids-499967.pt" + ] + }, + { + "steps": 999987, + "file_path": "results/Pyramids Training/Pyramids/Pyramids-999987.onnx", + "reward": 1.7710000028212864, + "creation_time": 1692808326.6422815, + "auxillary_file_paths": [ + "results/Pyramids Training/Pyramids/Pyramids-999987.pt" + ] + }, + { + "steps": 1000115, + "file_path": "results/Pyramids Training/Pyramids/Pyramids-1000115.onnx", + "reward": 1.7710000028212864, + "creation_time": 1692808326.7511857, + "auxillary_file_paths": [ + "results/Pyramids Training/Pyramids/Pyramids-1000115.pt" ] } ], "final_checkpoint": { - "steps": 100064, + "steps": 1000115, "file_path": "results/Pyramids Training/Pyramids.onnx", - "reward": null, - "creation_time": 1692804747.3104196, + "reward": 1.7710000028212864, + "creation_time": 1692808326.7511857, "auxillary_file_paths": [ - "results/Pyramids Training/Pyramids/Pyramids-100064.pt" + "results/Pyramids Training/Pyramids/Pyramids-1000115.pt" ] } }, diff --git a/training-envs-executables/linux/Pyramids/Pyramids_Data/ML-Agents/Timers/Pyramids_timers.json b/training-envs-executables/linux/Pyramids/Pyramids_Data/ML-Agents/Timers/Pyramids_timers.json index 85e4fe6eaaf777921a68031e2485fba90262a7a2..06ed8e551a5fa7fe51fe506e3ba3e4608963504a 100644 --- a/training-envs-executables/linux/Pyramids/Pyramids_Data/ML-Agents/Timers/Pyramids_timers.json +++ b/training-envs-executables/linux/Pyramids/Pyramids_Data/ML-Agents/Timers/Pyramids_timers.json @@ -1 +1 @@ -{"count":1,"self":50.060537599999996,"total":203.155656,"children":{"InitializeActuators":{"count":16,"self":0.005065,"total":0.005065,"children":null},"InitializeSensors":{"count":16,"self":0.006683,"total":0.006683,"children":null},"AgentSendState":{"count":31284,"self":12.0318872,"total":17.368325,"children":{"CollectObservations":{"count":100112,"self":0.151332,"total":0.151332,"children":null},"WriteActionMask":{"count":100112,"self":0.052844999999999996,"total":0.052844999999999996,"children":null},"RequestDecision":{"count":100112,"self":0.33597,"total":5.132261,"children":{"AgentInfo.ToProto":{"count":100112,"self":0.24107299999999998,"total":4.796291,"children":{"GenerateSensorData":{"count":100112,"self":3.7408192,"total":4.555218,"children":{"RayPerceptionSensor.Perceive":{"count":300336,"self":0.814399,"total":0.814399,"children":null}}}}}}}}},"DecideAction":{"count":31284,"self":133.736896,"total":133.736896,"children":null},"AgentAct":{"count":31284,"self":1.9630349999999999,"total":1.972497,"children":{"AgentInfo.ToProto":{"count":95,"self":0.000377,"total":0.009462,"children":{"GenerateSensorData":{"count":95,"self":0.008309,"total":0.009085,"children":{"RayPerceptionSensor.Perceive":{"count":285,"self":0.000776,"total":0.000776,"children":null}}}}}}},"AgentInfo.ToProto":{"count":1,"self":1.8E-05,"total":5.6999999999999996E-05,"children":{"GenerateSensorData":{"count":1,"self":3.2E-05,"total":3.9E-05,"children":{"RayPerceptionSensor.Perceive":{"count":3,"self":7E-06,"total":7E-06,"children":null}}}}}},"gauges":{"Pyramids.CumulativeReward":{"count":96,"max":1.41700387,"min":-0.99994123,"runningAverage":-0.9747646,"value":-0.99994123,"weightedAverage":-0.9999411}},"metadata":{"timer_format_version":"0.1.0","start_time_seconds":"1692804544","unity_version":"2021.3.5f1","command_line_arguments":".\/training-envs-executables\/linux\/Pyramids\/Pyramids -nographics -batchmode --mlagents-port 5005 -logFile \/content\/ml-agents\/results\/Pyramids Training\/run_logs\/Player-0.log","communication_protocol_version":"1.5.0","com.unity.ml-agents_version":"2.2.1-exp.1","scene_name":"Pyramids","end_time_seconds":"1692804747"}} \ No newline at end of file +{"count":1,"self":756.56862719999992,"total":2374.527123,"children":{"InitializeActuators":{"count":16,"self":0.005064,"total":0.005064,"children":null},"InitializeSensors":{"count":16,"self":0.01224,"total":0.01224,"children":null},"AgentSendState":{"count":312851,"self":141.232832,"total":197.48497899999998,"children":{"CollectObservations":{"count":1001136,"self":1.719525,"total":1.719525,"children":null},"WriteActionMask":{"count":1001136,"self":0.56162099999999993,"total":0.56162099999999993,"children":null},"RequestDecision":{"count":1001136,"self":3.5670319999999998,"total":53.970999,"children":{"AgentInfo.ToProto":{"count":1001136,"self":2.2894419999999998,"total":50.403966999999994,"children":{"GenerateSensorData":{"count":1001136,"self":38.931926399999995,"total":48.114525,"children":{"RayPerceptionSensor.Perceive":{"count":3003408,"self":9.1825992,"total":9.182599,"children":null}}}}}}}}},"DecideAction":{"count":312851,"self":1401.1147263999999,"total":1401.114732,"children":null},"AgentAct":{"count":312851,"self":19.241404799999998,"total":19.278015,"children":{"AgentInfo.ToProto":{"count":580,"self":0.0030199999999999997,"total":0.03661,"children":{"GenerateSensorData":{"count":580,"self":0.028381,"total":0.03359,"children":{"RayPerceptionSensor.Perceive":{"count":1740,"self":0.005209,"total":0.005209,"children":null}}}}}}},"AgentInfo.ToProto":{"count":1015,"self":0.0056089999999999994,"total":0.057657999999999994,"children":{"GenerateSensorData":{"count":1015,"self":0.043011,"total":0.052049,"children":{"RayPerceptionSensor.Perceive":{"count":3045,"self":0.009038,"total":0.009038,"children":null}}}}}},"gauges":{"Pyramids.CumulativeReward":{"count":1595,"max":1.97380006,"min":-0.99994123,"runningAverage":0.6491522,"value":1.74499679,"weightedAverage":1.725136}},"metadata":{"timer_format_version":"0.1.0","start_time_seconds":"1692805952","unity_version":"2021.3.5f1","command_line_arguments":".\/training-envs-executables\/linux\/Pyramids\/Pyramids -nographics -batchmode --mlagents-port 5005 -logFile \/content\/ml-agents\/results\/Pyramids Training\/run_logs\/Player-0.log","communication_protocol_version":"1.5.0","com.unity.ml-agents_version":"2.2.1-exp.1","scene_name":"Pyramids","end_time_seconds":"1692808326"}} \ No newline at end of file