diff --git a/results/tau_agent_D11_110M/Tau-D11-110M.onnx b/results/tau_agent_D11_110M/Tau-D11-110M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..4130772df0baeb9e7b26bfcce16676b3009948b2 --- /dev/null +++ b/results/tau_agent_D11_110M/Tau-D11-110M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93447a483234592c5c6d2f6e07ebb06808404eb7e515eed33b962a4e51b2e7c +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-10002300.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-10002300.onnx new file mode 100644 index 0000000000000000000000000000000000000000..4130772df0baeb9e7b26bfcce16676b3009948b2 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-10002300.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93447a483234592c5c6d2f6e07ebb06808404eb7e515eed33b962a4e51b2e7c +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-10002300.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-10002300.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec822e45e1ed47cb9d6a08b906651bbbd626300 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-10002300.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5af120cf500b57847cc4b0c87c869cd3c0ea9cd82f7953a98aeaa49acfe4ba7 +size 15534410 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..4dd7ef2dbb5308ffcbe14f7170385e600e3c93db --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbaf9d29599e6a0ad3c52797d9ebe24fe094e4cf5bca45905f5732c5258821bb +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b1ef21f1ea56171528d5049ca2171e4616dffc4 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51cd707dfb14da5a691d2d067be095ec47795b2e1394977f928adb5c39f98a43 +size 15534256 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-2999867.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-2999867.onnx new file mode 100644 index 0000000000000000000000000000000000000000..3996d7d0096bf16ab573ba088dd08dcc34cd8694 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-2999867.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e928e87c579da58f3acf43dc04527748440c0d6fe3e269ba0315f6cd010d8a8 +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-2999867.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-2999867.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbc6f3ae3f03da13e0114deff40e9f6bc21ede25 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-2999867.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b24a7c85d1ba619c7e632c966480ba26c102f2423f182c80289a466394671e6 +size 15534256 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-3999723.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-3999723.onnx new file mode 100644 index 0000000000000000000000000000000000000000..5548d2bcb2917fc91f3eb97444735e77976dbecc --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-3999723.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:285ab7ad09379ae7e0b21fd96855335f5f4d9fdd5d1891869b1139492be98d5f +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-3999723.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-3999723.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2e4a9ca2d022e7507d195d727cf0c6e79ef9d58 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-3999723.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41d651a581239a502cab88d4bb3a124f7b8c0f4e058e9656de42cdd4e9374e37 +size 15534256 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-4999878.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-4999878.onnx new file mode 100644 index 0000000000000000000000000000000000000000..7eb0a7e7a7be0733da35bb4a54992d6f52dd8902 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-4999878.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af5aabc2cbd8d111d2915f9b548fe372cb2cb0cd93668a344bad88babefdc3d5 +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-4999878.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-4999878.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d447cebeb4fe8ec2df3af4569fff3791eafae87 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-4999878.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f93d188769652ecaf6ddb5227325bb051365c4ee4b9f90779b148f5acbfbd406 +size 15534256 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-5999734.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-5999734.onnx new file mode 100644 index 0000000000000000000000000000000000000000..ebcd5199e69071473a1b6d6538ecbba498ae3ca5 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-5999734.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:813079a68d2bcac62e02e72eb3b07aa763683a2fa23e877bb1411b6d846275d7 +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-5999734.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-5999734.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ca9e649b4473d6f62ea1c45439418f392372e8e --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-5999734.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae7ed6bd0234f292efe98c9043fe846f48c5534b2287588efd6079b04f1b52c2 +size 15534256 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-6999889.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-6999889.onnx new file mode 100644 index 0000000000000000000000000000000000000000..8ddeb9c66ffc71cb37e93627dcc35780a46299f8 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-6999889.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a3e383c2594092bbbe85af9dd7e59978f2ad78b7709dc85746fef1e1eb876c6 +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-6999889.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-6999889.pt new file mode 100644 index 0000000000000000000000000000000000000000..a696ac103fb9da1801b832804b186c52cefb4e2a --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-6999889.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f8666e681aa6946cfb92385c7d79016d44aec7401c95da85fd0e628db106de3 +size 15534256 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-7999745.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-7999745.onnx new file mode 100644 index 0000000000000000000000000000000000000000..b889c911c3dfe658525deb3ae8ce33bc5b4a0fc7 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-7999745.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e8a8fd7a1189818dd6b341fc6c5e0cbf6849244b0c0e7b965cab3b6a858ddc2 +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-7999745.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-7999745.pt new file mode 100644 index 0000000000000000000000000000000000000000..c775877249582f8db31dc24d3a2f9c6c6e934b9b --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-7999745.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4175b42c47aa01a2039706c8dca7eccbb5e398d262a223ce6162507e337afdbc +size 15534256 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-8999900.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-8999900.onnx new file mode 100644 index 0000000000000000000000000000000000000000..692a5ba0fddc8ed3bd1e87d457173a5f46c9ca4b --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-8999900.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5daf549a19d3d4812f6976e5dd3075650f4286b278f6ca614ff864715b5e70f +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-8999900.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-8999900.pt new file mode 100644 index 0000000000000000000000000000000000000000..773d490c3596dd9c36b960430ef2b5382ddd0b30 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-8999900.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef8736eb4ab8c0bbaef28d38d67ebbd8669d72095b18aac5129b4ffb61d0204f +size 15534256 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-9999900.onnx b/results/tau_agent_D11_110M/TauAgent/TauAgent-9999900.onnx new file mode 100644 index 0000000000000000000000000000000000000000..aaa69451a6265864ef599a5a6653dcc0ca6f93fe --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-9999900.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:914160a68717d3a4964d0c8f29b039f7f50e86e738a90847439fb5c1abc3a059 +size 2186395 diff --git a/results/tau_agent_D11_110M/TauAgent/TauAgent-9999900.pt b/results/tau_agent_D11_110M/TauAgent/TauAgent-9999900.pt new file mode 100644 index 0000000000000000000000000000000000000000..74eefba21ab9af3be14ee4a825a227d276e8811f --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/TauAgent-9999900.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d3d34c850f86eeb36355007d3048a0a0f05cfae9075b5a6c5704a23bb35d05e +size 15534256 diff --git a/results/tau_agent_D11_110M/TauAgent/checkpoint.pt b/results/tau_agent_D11_110M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..df578b2eb2c8628380ba7e083ac8fbfbc0527710 --- /dev/null +++ b/results/tau_agent_D11_110M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8031a423bd447f01590d6859f903ad169581ed6a7c81a34969d5778440ee58e0 +size 15533332 diff --git a/results/tau_agent_D11_110M/configuration.yaml b/results/tau_agent_D11_110M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..d954ab110e3eefcb77357f42d619eaa56136cf0c --- /dev/null +++ b/results/tau_agent_D11_110M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D10\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Build + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D11 + initialize_from: tau_agent_D10 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false diff --git a/results/tau_agent_D12_120M/Tau-D12-120M.onnx b/results/tau_agent_D12_120M/Tau-D12-120M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..57b7e784993620d033bb366165aa38bf74a547d2 --- /dev/null +++ b/results/tau_agent_D12_120M/Tau-D12-120M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9bbb49c2fb1448abfff70421ef63826da0400df1de1900c24ccde55ce57d13 +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-10015005.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-10015005.onnx new file mode 100644 index 0000000000000000000000000000000000000000..57b7e784993620d033bb366165aa38bf74a547d2 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-10015005.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9bbb49c2fb1448abfff70421ef63826da0400df1de1900c24ccde55ce57d13 +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-10015005.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-10015005.pt new file mode 100644 index 0000000000000000000000000000000000000000..16035fb8e185cdd1024634ede4feaf3432a46180 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-10015005.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31488e308c5ece73d8118e73cdac38f7622044276bee3b28104f7b15d8a85d8b +size 15534410 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..7b197de628f2aa9bd98d588b91820004c3a163ad --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:334a037a38160272804cb79b9034385fedfd2346f7dadb5c20e8aa3a40ed716b +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16efc04a7bd48299839b1254bfbc4166e144e89 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bc2fdba71d65d7e6bbe3d36bb73cd330166129db275cd00dfb419f2c82488b6 +size 15534256 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-2999867.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-2999867.onnx new file mode 100644 index 0000000000000000000000000000000000000000..6a8397a991557a5ae799f73dfb5eb1749a772a03 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-2999867.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:640f7fd8cefe5973f3e4eb4ce305ddaecf023f92eb85e53a842ed8fec1b91cfb +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-2999867.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-2999867.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4106ea078f427d0097929ea98161c369b34e7af --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-2999867.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4a0f10b3160a3bebb7831d050c37d34d3115832b14e48e6f04464455970090f +size 15534256 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-3999723.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-3999723.onnx new file mode 100644 index 0000000000000000000000000000000000000000..955d4f5809a569970a02c11a64434fee1a9fb9e5 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-3999723.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:306a63a4b24afd397cf2606decec6b54b8674846d19ab29ef7982f9edc8b5b73 +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-3999723.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-3999723.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae6092d5bdca128a195f599f6726fbb519ea9aa8 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-3999723.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:465771084c0c7090124a5fbb21cea536fd7579ce49c4fef0d4f98da0af032c39 +size 15534256 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-4999878.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-4999878.onnx new file mode 100644 index 0000000000000000000000000000000000000000..7bd1b06ea54971d9f9cbf3a6b98dd5f2455c6bf5 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-4999878.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f624483fd08603871fcf8c34e7fe94dbf07811bf52504f0353b3c8120d3b7e39 +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-4999878.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-4999878.pt new file mode 100644 index 0000000000000000000000000000000000000000..44db2b043bff165acbca3ff57f9feb0803cc5d99 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-4999878.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e45557347c222ee1e3374007e154096814b3db3f4cdb6c8aeb5039bc25d43bb +size 15534256 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-5999734.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-5999734.onnx new file mode 100644 index 0000000000000000000000000000000000000000..a5dc77de35a74a835f1fc64c35618d134af3f25f --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-5999734.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a3276271aec9c6e4731da7b4bbc55a9d96a5734d0cb27ca77a4a205a23a7731 +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-5999734.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-5999734.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf4a3d9adcbc527d43b9be5d82cd4eb97264a54a --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-5999734.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a5508bd0cfd541bd472ca36297fb82a03de701ad212e10cb11b385bbe6e044c +size 15534256 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-657800.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-657800.onnx new file mode 100644 index 0000000000000000000000000000000000000000..193b1f7dfea7ed094d954be1fa804408febe54f1 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-657800.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9209eaec6d31cf6fb04e4c44350c0f8a96296580748e93f455f2784c7916531d +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-657800.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-657800.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec49cda8d3b098444a391b5a33e93e06cda2166a --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-657800.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f44f14c760052cd3702e789f8278287e958eb94a58e53983b8c4f505e24349 +size 15534102 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-6999889.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-6999889.onnx new file mode 100644 index 0000000000000000000000000000000000000000..415a980deb6d46a1576c26e8b6491ec03759d56a --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-6999889.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40311cb454c6a053bfdafde3a9b87f89d1635e39e3574ccac5c651efb13ebe56 +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-6999889.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-6999889.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3d5b836d0c4eed9ad9349a45b542166c398b74 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-6999889.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76f3f3364bcff7ce5a86533e3c27f2303d7ce94cd28c8539f6d18d8a8207f5ef +size 15534256 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-7999745.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-7999745.onnx new file mode 100644 index 0000000000000000000000000000000000000000..4ffe6b3f737777f28070cefead355dbdd99563a9 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-7999745.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13acccd224287a412f1e7d0044ea66e84567202b332b50f51e12f17195ba65de +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-7999745.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-7999745.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5b14868e019449e7eaa96fc5c03b42c10762c6f --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-7999745.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2bc9302228e9db24bae4318bc827c68907abccd83751a611a177975a0126b58 +size 15534256 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-8999900.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-8999900.onnx new file mode 100644 index 0000000000000000000000000000000000000000..5128efde4f65d031972e2084167bd895f9268aa3 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-8999900.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e470a80060920e1229dcdca7ad54bead837a630b06bf36e6c85b7b388413439b +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-8999900.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-8999900.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3dd739f1e7e7dd16fc81693af307acecf6a6911 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-8999900.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf4c652142bcb1c1afac8bc5d0f9c1af90ec63fe187ad4bfbbeb01732ed72722 +size 15534256 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-9999756.onnx b/results/tau_agent_D12_120M/TauAgent/TauAgent-9999756.onnx new file mode 100644 index 0000000000000000000000000000000000000000..5f980e567887ac36a692d0bd932798a54236a838 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-9999756.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c656665d645c34b3d7a8e5df2f77f726300b674f4fe6c2d3144ea9471118e9c4 +size 2186395 diff --git a/results/tau_agent_D12_120M/TauAgent/TauAgent-9999756.pt b/results/tau_agent_D12_120M/TauAgent/TauAgent-9999756.pt new file mode 100644 index 0000000000000000000000000000000000000000..9beb207a67fa30db27c31664fd78007454e1a775 --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/TauAgent-9999756.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948794047d26d7d4e43bae12f3ea2bc161e41a8dc70c9fcd443446ffeff57427 +size 15534256 diff --git a/results/tau_agent_D12_120M/TauAgent/checkpoint.pt b/results/tau_agent_D12_120M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ac20195a0b5cb1ed4f881ec53a9b046e1cdc9da --- /dev/null +++ b/results/tau_agent_D12_120M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167da69a09bfbaf0b2c24e6016140699791cc439c437f0f04fb586c1eda82207 +size 15533332 diff --git a/results/tau_agent_D12_120M/configuration.yaml b/results/tau_agent_D12_120M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..b3abd446e03b964ee88dc968994d4b1d00c30421 --- /dev/null +++ b/results/tau_agent_D12_120M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D11\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Build + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D12 + initialize_from: tau_agent_D11 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false diff --git a/results/tau_agent_D13_130M/Tau-D13-130M.onnx b/results/tau_agent_D13_130M/Tau-D13-130M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..0f8343f9b1099932d40d9e6564d1082dce7725a4 --- /dev/null +++ b/results/tau_agent_D13_130M/Tau-D13-130M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f23c84a698d6fa0ce22f2fcdff4b7591e26e635aa7b82074034b3bc5eaf19e1b +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-10030875.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-10030875.onnx new file mode 100644 index 0000000000000000000000000000000000000000..0f8343f9b1099932d40d9e6564d1082dce7725a4 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-10030875.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f23c84a698d6fa0ce22f2fcdff4b7591e26e635aa7b82074034b3bc5eaf19e1b +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-10030875.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-10030875.pt new file mode 100644 index 0000000000000000000000000000000000000000..814d58d7dc0a0e74bdb10c80b07e1929366c93be --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-10030875.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c24058f0486fdeb91e13fa7da4e335365ba1749eb604b577bd1907eb417a10a +size 15534410 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..7566a30f7dea68477b6afa4b7bcd7b6360366f16 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7070a8321cf3469bbc7b99acc46307ce62bbc80aad3e50d001299b38310b3e9 +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..b501affbf54ddd5a3970d1958ae9eb6ee21c99bd --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8f9cb04668d83680d7e94a7f8be3e30d6c1b7bc3f0f8e3babff5227687f6278 +size 15534256 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-2999867.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-2999867.onnx new file mode 100644 index 0000000000000000000000000000000000000000..554b6c477638249925fae05a499b2e40276318c3 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-2999867.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e6aff8f99aa8c9edc7195a7605585589b948b3bcca645397dbafc7532e69e7 +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-2999867.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-2999867.pt new file mode 100644 index 0000000000000000000000000000000000000000..83f05bcd676112c912a72a9f96eb6aff9dde2c58 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-2999867.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c4fa8339901416f7ddbf4abf45ab495048f12d49018e6cb1438e242488aebe3 +size 15534256 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-3999723.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-3999723.onnx new file mode 100644 index 0000000000000000000000000000000000000000..678a1a6817da901c2396aa8fb96767275953aff7 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-3999723.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a771a84f09fa04f94fd183e883819f3ba6d387240099d273c61808c91a16a00 +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-3999723.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-3999723.pt new file mode 100644 index 0000000000000000000000000000000000000000..40aa771eeb3e33e76deee55ee4ee92ba4a4463b1 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-3999723.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631858304a7e54c30837a2748f93b1af19ef8339769b76212a7ce1ea00e7cd8b +size 15534256 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-4999878.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-4999878.onnx new file mode 100644 index 0000000000000000000000000000000000000000..e61bee40acc5e922911195ab9c1d2f8e876978a2 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-4999878.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:419865f8dc5177b51ac9df2b9a9d61473ec5b36b13f66a7dd15ea9b3222d1397 +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-4999878.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-4999878.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdf70c8e9aaad6e78a56d43208a3d9827ff0b926 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-4999878.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ce038c9e98192272d028c2cc9039fe7cef58fb3a2d953ed227c7794e2e81e83 +size 15534256 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-5999775.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-5999775.onnx new file mode 100644 index 0000000000000000000000000000000000000000..1e960f56f13fe6d2f10409f361c1f3717bf0daba --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-5999775.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eff6748402168c1cbe8283c603afe77c704b855ff8bbc596cdda0beb41c3828 +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-5999775.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-5999775.pt new file mode 100644 index 0000000000000000000000000000000000000000..176440243240af7cca91b50c2e75989e5803b00a --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-5999775.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac56af43e00cbb9db52273b4e7dfec87ce0e784e3a00c28bd62f45080a8e2673 +size 15534256 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-6999975.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-6999975.onnx new file mode 100644 index 0000000000000000000000000000000000000000..ca9024346313ac546442a11bd6ad913932a88b87 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-6999975.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2852a88751b73462557c5e6060bd04306b0c729b862f6c6bcf89239f154ab2 +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-6999975.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-6999975.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c6e3abfa85d4ed968f0b9972771db2b09f31316 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-6999975.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43327563aa53cb6d4336c533ed436122d9477b48382277f7bf713f0147938b68 +size 15534256 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-7999875.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-7999875.onnx new file mode 100644 index 0000000000000000000000000000000000000000..342c7152bd65229fbe8ad9dac55f99f02058c6cf --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-7999875.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb638c9dd8e50475522a99660f7d796771316e5092474bf52086b219ae62b3c6 +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-7999875.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-7999875.pt new file mode 100644 index 0000000000000000000000000000000000000000..58d98e87c91d95c26825b050ed32c57ec2da9bf6 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-7999875.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28b8f86f40cf0a9139c0160c240c468faac0df8f44f66078966fd8ab5543f36b +size 15534256 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-8999775.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-8999775.onnx new file mode 100644 index 0000000000000000000000000000000000000000..c80528bea52f7adab6fc3566eac7c7fb3c690c9d --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-8999775.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06dc9a594e6b143cbd1d078d9377db8333c8d29ab6550d73352babf093867252 +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-8999775.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-8999775.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ae849aea6b47f0eaba82f2b590101dfec9cbce7 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-8999775.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d36837021d95a4c04f89eec398be41fe51298a252745da605c8d8e5e8d1397 +size 15534256 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-9999975.onnx b/results/tau_agent_D13_130M/TauAgent/TauAgent-9999975.onnx new file mode 100644 index 0000000000000000000000000000000000000000..fff58c0c145022def4a30369a4027f26ac667204 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-9999975.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8418bef3922a4a896e9b08939e570808a3a79279cc11dce335497364c94e870 +size 2186395 diff --git a/results/tau_agent_D13_130M/TauAgent/TauAgent-9999975.pt b/results/tau_agent_D13_130M/TauAgent/TauAgent-9999975.pt new file mode 100644 index 0000000000000000000000000000000000000000..c42e300784eda0eb293576b5e8934f64bb39750a --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/TauAgent-9999975.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7bbb10dbdc84050bb2a3d0fe5d646dd39220b359c523b082f3f15bb19966c3 +size 15534256 diff --git a/results/tau_agent_D13_130M/TauAgent/checkpoint.pt b/results/tau_agent_D13_130M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..fccb07e790d1dee9862c68d241c7a6e3f2d56340 --- /dev/null +++ b/results/tau_agent_D13_130M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:779b0a59f1bf07f13fed641ed3a112f5ac5631788f705bc58f7c52b21fae9417 +size 15533332 diff --git a/results/tau_agent_D13_130M/configuration.yaml b/results/tau_agent_D13_130M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..4d1fa08fa97cf6cd8e7ac9711b437e6a2cbe15d9 --- /dev/null +++ b/results/tau_agent_D13_130M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D12\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Build + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D13 + initialize_from: tau_agent_D12 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false diff --git a/results/tau_agent_D14_140M/Tau-D14-140M.onnx b/results/tau_agent_D14_140M/Tau-D14-140M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..9cc6083984616339e2566ca157fc3cd878d07e68 --- /dev/null +++ b/results/tau_agent_D14_140M/Tau-D14-140M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d997d52482df54f04b306e77bfc5415f3d8f93f2abd8cb2b2bb66d3d5efb40c +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-10029500.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-10029500.onnx new file mode 100644 index 0000000000000000000000000000000000000000..9cc6083984616339e2566ca157fc3cd878d07e68 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-10029500.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d997d52482df54f04b306e77bfc5415f3d8f93f2abd8cb2b2bb66d3d5efb40c +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-10029500.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-10029500.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f3ce6351338ce8d3df3845231027a695cee697f --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-10029500.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c5face27532448f5901a4441c071e6f9ff07e7d0b8f02e24f834de00517474a +size 15534410 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..a33742b6442e8062f228438ad99098deacc134ca --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8f4e85035e5716c868896de4d8034820b2a216025300cb5c22f3288ba8e1910 +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..d37c923e32bc84b59b77ce9ca912ec88c1bdfe77 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39629cf8fadb1e43d2d3fd30cd01543f131a2d555f4e41423959b3dfcc770d2c +size 15534256 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-2999867.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-2999867.onnx new file mode 100644 index 0000000000000000000000000000000000000000..17006dcc6b78d64521a52701543be2c5b74fc498 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-2999867.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07a6970da877068ace5e1e1627134008bc048e2b7b3a1f6d26579eb2d02c9bd5 +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-2999867.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-2999867.pt new file mode 100644 index 0000000000000000000000000000000000000000..28aad5f0f21151fd0c9605ba5f3c728cb3836a85 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-2999867.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f23506678ced610c7f586b32e691e19f3bfda2b7d9727d0ced21c4403fcf67 +size 15534256 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-3999723.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-3999723.onnx new file mode 100644 index 0000000000000000000000000000000000000000..ac02314f02d5ff2f44d45e94a25d531738b1318a --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-3999723.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73803e366604cef2e89840caef647af273ddc195499f7bd35a834a8101bb8b1a +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-3999723.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-3999723.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b685597325beffa80785464110a0aac1a64c43 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-3999723.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df326c74119f3650fd5249278340fa520874f18720dd582e702555fa04c4177f +size 15534256 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-4999878.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-4999878.onnx new file mode 100644 index 0000000000000000000000000000000000000000..f4fda026718a0d63b935949ad1a14e1287478892 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-4999878.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4007891438ac609fb39e08e4ef3c14ce7ed6db7e595bdfc32dde3b8f3e13928f +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-4999878.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-4999878.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e924ba4891810089cbae4f7c7fa30bdc6ae1a19 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-4999878.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21e77de5af4f4edb8c3ccafcf8a78648923b7bb53a2209c12d51a0f772499f4a +size 15534256 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-5999900.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-5999900.onnx new file mode 100644 index 0000000000000000000000000000000000000000..9453090c851dde7e1b3bcf1f3418274da6f12090 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-5999900.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3714c3ce63222728a7f3885d2a09ad73b207bf671371f744bfe62632b945803f +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-5999900.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-5999900.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b7fbe69eaa7f801b38c37a8434d4e0f6e6f9142 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-5999900.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0be48e292b3539d91d245458edbb9a9bab555278be745059911febe1ff6e0f4b +size 15534256 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-6999800.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-6999800.onnx new file mode 100644 index 0000000000000000000000000000000000000000..ab261061fb98fa4a4833299d7b83e3957201b754 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-6999800.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb29a48df84c470aaf62205b9623dc81fca531ae68e234883e0648224c439f1 +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-6999800.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-6999800.pt new file mode 100644 index 0000000000000000000000000000000000000000..da331813166b65b5ded25c17e165d1621cfc8b51 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-6999800.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cf5d0b82936dc64f5a62f5a72272e14e2d98a0ada73392bc5d70e2bfca43fd2 +size 15534256 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-7999700.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-7999700.onnx new file mode 100644 index 0000000000000000000000000000000000000000..885a55c260a1d03f7503ede93931879b6cd6fa05 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-7999700.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c64fcf0c48f0a65bfbf6a851e5ec18675a83196594c455979e225dfcb7b0b9f9 +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-7999700.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-7999700.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd3ba5fbd102125258cdcc3f01bc291a7ceea9bb --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-7999700.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2ec4d9ea45716f3425426a7d6d0286cadcc678f055b92fb8db1066854f57e89 +size 15534256 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-8999900.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-8999900.onnx new file mode 100644 index 0000000000000000000000000000000000000000..217ecc7f9b7bc943048cf9b9cc00245a010675be --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-8999900.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3109ad5add6f8b16d306f3cbd34251f0d1fa0349a43c2ccc38dca56bc5373194 +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-8999900.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-8999900.pt new file mode 100644 index 0000000000000000000000000000000000000000..5be21700b0e389bbb9cdcb3961032525c60d815e --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-8999900.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1329022fc1307dfd7853798957e8c90b3c5b326b1b92771663f77bcaf793aac +size 15534256 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-9999800.onnx b/results/tau_agent_D14_140M/TauAgent/TauAgent-9999800.onnx new file mode 100644 index 0000000000000000000000000000000000000000..551a639e8d5d9c1f7b6f855b280e49919f39c83c --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-9999800.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0a1038faa46394a665300934894a5fe19fac1c2f0fd61ed6bceb1c96de449c7 +size 2186395 diff --git a/results/tau_agent_D14_140M/TauAgent/TauAgent-9999800.pt b/results/tau_agent_D14_140M/TauAgent/TauAgent-9999800.pt new file mode 100644 index 0000000000000000000000000000000000000000..a311e77526393fcc5914a967112a4e2fc78872b6 --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/TauAgent-9999800.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:405340b18c4515921886d5145bc4e322e8332145c19a3368dc2fe976440622b0 +size 15534256 diff --git a/results/tau_agent_D14_140M/TauAgent/checkpoint.pt b/results/tau_agent_D14_140M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..89183fbc041e3e15958951949c2a820d9db2880e --- /dev/null +++ b/results/tau_agent_D14_140M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fa12df9f45661c5f0591227f95d91485796184fc8437841d8acd9667264eeca +size 15533332 diff --git a/results/tau_agent_D14_140M/configuration.yaml b/results/tau_agent_D14_140M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..0346ae213db032d460fc83ae887eea028106149b --- /dev/null +++ b/results/tau_agent_D14_140M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D13\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Build + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D14 + initialize_from: tau_agent_D13 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false diff --git a/results/tau_agent_D15_150M/Tau-D15-150M.onnx b/results/tau_agent_D15_150M/Tau-D15-150M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..803a402e78a515dd5f7d0bfd9ad5cd2fab0906e8 --- /dev/null +++ b/results/tau_agent_D15_150M/Tau-D15-150M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5571e846f826a4ebdb719459a1ccb3ce2380eb8c65363dc3535510fabb6a0ff +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-10003000.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-10003000.onnx new file mode 100644 index 0000000000000000000000000000000000000000..803a402e78a515dd5f7d0bfd9ad5cd2fab0906e8 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-10003000.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5571e846f826a4ebdb719459a1ccb3ce2380eb8c65363dc3535510fabb6a0ff +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-10003000.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-10003000.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee9bd9610512cb3c82ac10efeaf44cf5f02e8d33 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-10003000.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b51ee7b9f537097f9e18d42ae679f9e3bdd2c95a5c75a5e330ba351c39029ea4 +size 15534410 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..e49494fb80d2224515f296e4b40811097511a242 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16221c36d15681fd3926ba1c276391c810e72fd8c6742b2d49d2bdaefbe1af98 +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8146e09a03a48688aef56662c9c9aa1ff4f1ff5 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:decd1fe4b711e950ceaa264b0b5a032831dd08f80ec643e7323aca3926d2ce8d +size 15534256 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-2999800.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-2999800.onnx new file mode 100644 index 0000000000000000000000000000000000000000..0b0c86e9e1c61960ff8311bf93e60f7b92413dee --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-2999800.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef72697982943cfed82208c2732fdee26001879a7d5818299f9c4b4ca1b95482 +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-2999800.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-2999800.pt new file mode 100644 index 0000000000000000000000000000000000000000..008cb058dd6d7c1426829fe0e78c0b7e7b7e78f7 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-2999800.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9dda03429fe83bf2acb739cda8221423747f71f8fb44204c3d5eb0437c04ab +size 15534256 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-3999700.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-3999700.onnx new file mode 100644 index 0000000000000000000000000000000000000000..0af9777c85a3535f3b48ae136386c637145a24af --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-3999700.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2b46be088d3d1122626b6d15b6551fd8dcaa2d4a789ffd85d5ef39c68f447e4 +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-3999700.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-3999700.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ba72556583086e3f8ce2d83f50cec727bb22ca3 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-3999700.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea7bd415b9b70d8f8e0156a567c2b5af1ed5bb181351761c99e89127cba410c +size 15534256 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-4999900.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-4999900.onnx new file mode 100644 index 0000000000000000000000000000000000000000..b8260f48bbd55a7aaf58e8bca1510107aebef9de --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-4999900.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6d13b7e45bb46b8510fc4a043b5fdbed2718c2323ce95e3ef65f52ab7800b5 +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-4999900.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-4999900.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c1532bbfdd6b125c562c0c52d7680ab2c8cde4e --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-4999900.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c8bfa15e591e3553625920c4aaf742b00d5b042273c570eebb6ebfb40a75f85 +size 15534256 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-5999800.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-5999800.onnx new file mode 100644 index 0000000000000000000000000000000000000000..5dba483ce94d52228349beb9c0ea102d636642cf --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-5999800.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9399038165a6c23a3b13a80c5b4066a3769257bb2742388fe12c4fd36ad0f0b8 +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-5999800.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-5999800.pt new file mode 100644 index 0000000000000000000000000000000000000000..023637b396c4392007a1d8fcf412a543893ccf32 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-5999800.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08e98b44c809b7222c49a1c50cc4b1cdc40f1db51a0224aaff02e01d161a3bf +size 15534256 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-6999700.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-6999700.onnx new file mode 100644 index 0000000000000000000000000000000000000000..2b2e2cd839d6393d1ec779cfc70ab7ffb89d4a54 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-6999700.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2f0dfd22418c4acf03759d5f4a35de09b593190e925bb88e69d8f47a173ec5f +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-6999700.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-6999700.pt new file mode 100644 index 0000000000000000000000000000000000000000..a07e2063df1027f6801e2d0648d848407310d456 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-6999700.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a08f28a791d22599e92a4c6bce6618f1db1e0107f67b05e0893ac4ef06d4483 +size 15534256 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-7999900.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-7999900.onnx new file mode 100644 index 0000000000000000000000000000000000000000..b87dfbe5d2cdf6f58b78f20d32a4fa20517de856 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-7999900.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b60be9b66b4ca19b51e046863fe5d705454919c02f677043bafbaecd4bb8abf7 +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-7999900.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-7999900.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6dfb5a04d86cd14c5f96be7c456b7050c69f89 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-7999900.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf711602fa60d5a7bab4dac350139f34bcd954432ae623905ddd1454c1cd74d1 +size 15534256 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-8999800.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-8999800.onnx new file mode 100644 index 0000000000000000000000000000000000000000..bac03552d1583ffae09c295723f473918398ae54 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-8999800.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c9666361646d7f87d2543ca17714fcff6974de3d40d896970afcf646636b0d +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-8999800.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-8999800.pt new file mode 100644 index 0000000000000000000000000000000000000000..966c430d4a4d08581993c03fea141d18921936f8 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-8999800.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb71e5fa2a8d41d1af470c2b8a583d5b45b2329f68bc7e136c9f694aef65fcfb +size 15534256 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-9999700.onnx b/results/tau_agent_D15_150M/TauAgent/TauAgent-9999700.onnx new file mode 100644 index 0000000000000000000000000000000000000000..8b6e26c9b0d61f7aa43867525660cc75b5d6df54 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-9999700.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc86860f80bc706e8a242c2b6a60ad099fd8136c227840ff8e8025b0acc79035 +size 2186395 diff --git a/results/tau_agent_D15_150M/TauAgent/TauAgent-9999700.pt b/results/tau_agent_D15_150M/TauAgent/TauAgent-9999700.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ccdc975ada645520b759e996bf33a06a340c201 --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/TauAgent-9999700.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:112fc4455518ca57099291c028cd3c8dba51361cfea68f842f62b751f3586359 +size 15534256 diff --git a/results/tau_agent_D15_150M/TauAgent/checkpoint.pt b/results/tau_agent_D15_150M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..e75fb483a58f03ddee211aa1a86db6fe9326329f --- /dev/null +++ b/results/tau_agent_D15_150M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:717477ab4843280fe74aca23d55eba4bf42bf192b63e71960c7a0055146f407b +size 15533332 diff --git a/results/tau_agent_D15_150M/configuration.yaml b/results/tau_agent_D15_150M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..d9443d8dc04dc1195cfc0ffb77b83f110b438824 --- /dev/null +++ b/results/tau_agent_D15_150M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D14\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Build + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D15 + initialize_from: tau_agent_D14 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false diff --git a/results/tau_agent_D16_160M/Tau-D16-160M.onnx b/results/tau_agent_D16_160M/Tau-D16-160M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..6df503223c8fbd3e12c62413e79db1e71ac64ed8 --- /dev/null +++ b/results/tau_agent_D16_160M/Tau-D16-160M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea30bb71ec0882e3f2c6964f4c9bc55b139c72429eeb8a3817d35186427b7f5 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-10001375.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-10001375.onnx new file mode 100644 index 0000000000000000000000000000000000000000..6df503223c8fbd3e12c62413e79db1e71ac64ed8 --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-10001375.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea30bb71ec0882e3f2c6964f4c9bc55b139c72429eeb8a3817d35186427b7f5 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-10001375.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-10001375.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a901b37cfd832aa2435aa00f49e4cae11d63fcd --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-10001375.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fac4b00af8d9f3f52895466aa63dcb6b4868c860e1c01470e3dbcfeca166827 +size 15534410 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..786e77b1c3f2fc722e349adaaf5ab853cc09707c --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f00f7867f1a5c286ebeb38c54a6c75da9d1d03e1b9ceda4515e383842ec0430 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f97bcdb474ddddaa28989809959356e242993ac --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c179214f63def0d23ee52a3f8b09166124aeaf7ca33ee8f42dc38bb1d1ef00a7 +size 15534256 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-2999975.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-2999975.onnx new file mode 100644 index 0000000000000000000000000000000000000000..4865cf927c14fb6af61730884ddb178cdbc4cead --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-2999975.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977444588acef30a529683c6e701b5502067271af5a773b77dafa546003d6666 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-2999975.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-2999975.pt new file mode 100644 index 0000000000000000000000000000000000000000..da42a670bedd422c151887864819db97f2a09cc2 --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-2999975.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf00d94d7ef159e3181ba7d7571b8cbea8613b5926579d7679b53a60fbd5eebd +size 15534256 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-3999875.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-3999875.onnx new file mode 100644 index 0000000000000000000000000000000000000000..07e6e2947282f52f3706b6513f75ca0f193543c7 --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-3999875.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81059df955f8c0d621c9e0c965a2483a78607012d73a4c30a717e4da4881b283 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-3999875.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-3999875.pt new file mode 100644 index 0000000000000000000000000000000000000000..893a1996870100c3ad065fb074faebf49bce406a --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-3999875.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc6d866465396646d4f783c633b8cc743ccb1f96d77fb85d1dd604a9bbfd912f +size 15534256 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-4999775.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-4999775.onnx new file mode 100644 index 0000000000000000000000000000000000000000..6f76e27c61d164a5bfaf83379c31cf813bae2e4a --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-4999775.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af8eb5ef86d3d96dfd3d24886236e61885efe3f7bf7edb2781235f487af6275 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-4999775.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-4999775.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb15cc0c0615848350ce4bf335263c455f6498cb --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-4999775.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b04055e99e1afc778143ab04fb60d6415f0e3dde29e6757daa56746bf0434e0 +size 15534256 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-5999975.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-5999975.onnx new file mode 100644 index 0000000000000000000000000000000000000000..d3ae7cf280d53ddadd488a8256d6924e5eb2d63f --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-5999975.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:692e43ca39ffd63ca165174ef48466fbde5a0434ab50138d0712ce9d870573f7 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-5999975.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-5999975.pt new file mode 100644 index 0000000000000000000000000000000000000000..e801fd7ce3d407dbb7d33d912bb0f1be254ce3b7 --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-5999975.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80f852ebca63e4fab629531878c747194a5f7c6a047ac9d94692f5d8601a4ece +size 15534256 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-6999875.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-6999875.onnx new file mode 100644 index 0000000000000000000000000000000000000000..83c69b98bb2343be1a73afdcb63ca6eac27082c0 --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-6999875.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0f9c78076492a337753ce8a3ec6d8778a18bd40cc8a5376f98bcb51026c572 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-6999875.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-6999875.pt new file mode 100644 index 0000000000000000000000000000000000000000..11b14bc0451f3606da4bd984a65af4269c2237d9 --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-6999875.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff3b6c347e6b9168e9b1e9ad10e930c245e71e9cb5601d22c3c0c47e3bd7ff9 +size 15534256 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-7999775.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-7999775.onnx new file mode 100644 index 0000000000000000000000000000000000000000..eb3f7e543ec15f3c7b6c0cda9c4bad4b47087088 --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-7999775.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac4f552d130880740a140eb7318e24f72c8978252ff1627e30c894ad9171a25 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-7999775.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-7999775.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e58e39cd182a3fe8a4f2362332f1c55ca6140ca --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-7999775.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8af7a6721d37a49a079b54e2bb1bd2e68dc15362c3fb5095ff08e89f1d40584a +size 15534256 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-8999975.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-8999975.onnx new file mode 100644 index 0000000000000000000000000000000000000000..8ab6d8618b95eb24d715e7b6ac3c5aa01687bd4b --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-8999975.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58476611a1cb6f43de698a2bf303fbcafa61a9e9a88d4397321bd0a75c2aac98 +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-8999975.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-8999975.pt new file mode 100644 index 0000000000000000000000000000000000000000..75117094a19ca084b988ccf15bfe7e29ba8e0d0c --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-8999975.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:605295f88bb69255245dfd13b56a1f413f140748a0ac910134dbc106fdfe700d +size 15534256 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-9999875.onnx b/results/tau_agent_D16_160M/TauAgent/TauAgent-9999875.onnx new file mode 100644 index 0000000000000000000000000000000000000000..12f40dfb8eb9010b7a425f381f61e194449fde84 --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-9999875.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c160911af4a41bf65b6f4ee29155961fa503489e90deb5c57da5d2352abc56dd +size 2186395 diff --git a/results/tau_agent_D16_160M/TauAgent/TauAgent-9999875.pt b/results/tau_agent_D16_160M/TauAgent/TauAgent-9999875.pt new file mode 100644 index 0000000000000000000000000000000000000000..f16257c74d6aec8adfe700873474c31b5001d99d --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/TauAgent-9999875.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:102c4e8fd1b4072205f0201b37cbe8e3cc05576e461cd9834e7f2a8aacd9225c +size 15534256 diff --git a/results/tau_agent_D16_160M/TauAgent/checkpoint.pt b/results/tau_agent_D16_160M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..29ca3c149cb4cddc3c9162099c331006cc358a88 --- /dev/null +++ b/results/tau_agent_D16_160M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36be1502d22796d1c141e274882b265fcdfe9b135865dcced5b4bbbb6d2315a6 +size 15533332 diff --git a/results/tau_agent_D16_160M/configuration.yaml b/results/tau_agent_D16_160M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..34deddb94dd0c19729215acb16f342f6af6c210b --- /dev/null +++ b/results/tau_agent_D16_160M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D15\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Build + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D16 + initialize_from: tau_agent_D15 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false diff --git a/results/tau_agent_D17_170M/Tau-D17-170M.onnx b/results/tau_agent_D17_170M/Tau-D17-170M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..78e4b2a204df5cf6a3f80212480becb509c7d8db --- /dev/null +++ b/results/tau_agent_D17_170M/Tau-D17-170M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d57898cd90b0e39f1e5e08219007b9cf40d4f2b58076fe18ccb924959906c70 +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-10015375.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-10015375.onnx new file mode 100644 index 0000000000000000000000000000000000000000..78e4b2a204df5cf6a3f80212480becb509c7d8db --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-10015375.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d57898cd90b0e39f1e5e08219007b9cf40d4f2b58076fe18ccb924959906c70 +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-10015375.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-10015375.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bc5c369d6506ce5067cd1dda9386ddf2744531c --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-10015375.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fed01a8ff1ab68ec9e9dfbb0561fbfeefd325db962cb7e2f6d261f215af4f42b +size 15534410 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..2a7b1c03832a3b56c60d1b39e82ce9ae9daa95c4 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80e6bdcc7f70a63e06a3aa37bf4704a099f44c810f45de5e05ee25aa6c794e7b +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5e02efaf4292681b811311512c83fce94d3e6a1 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b89b78b76c8ff4ef89a5e50d4f6b412468233734fb47fff1425f254b60b19af +size 15534256 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-2999867.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-2999867.onnx new file mode 100644 index 0000000000000000000000000000000000000000..2daaf866ab414af10a765ee4e2d393d1ba4b75fd --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-2999867.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56bc948d63fc8cf9ef9a54bbc338bb3243ff053e56859d8bb66a73e24178090 +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-2999867.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-2999867.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d6b3b8691a94a72c50e231a46e56790fca37871 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-2999867.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea76ede10e2d49690a6fbb0a4c5922ef0911ef75a7a2e2af5e1a38e813ee4f7 +size 15534256 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-3999723.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-3999723.onnx new file mode 100644 index 0000000000000000000000000000000000000000..ee8f13508abee4ec0a87b9ddb4dec4d66e5a7d1e --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-3999723.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1be5943b37eb21426d410fbe9fd540161f520789f1453157c86ff12706494304 +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-3999723.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-3999723.pt new file mode 100644 index 0000000000000000000000000000000000000000..44231abbd2744589c62f72626e53fd34fdca26df --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-3999723.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d38eced6ae1dcd0617b5efa350337d132bdcc7c00a6adac869e19220658f681 +size 15534256 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-4999878.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-4999878.onnx new file mode 100644 index 0000000000000000000000000000000000000000..b1421dcee5d324c399ac4696e2f0e20e88dfae98 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-4999878.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74a249496b10c1c26b1811dc540caf9b1c316acd5bb89e6c1ac236f48408d34f +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-4999878.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-4999878.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c2ddbf0cbef9cd208550075a772f3ffb6e7e492 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-4999878.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3123e828d32157f7c2d59753d8b8756c5cbcc2368f232b6db302c42b6403a881 +size 15534256 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-5999734.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-5999734.onnx new file mode 100644 index 0000000000000000000000000000000000000000..deb87e823f84af421135bb1b3fadd7e95f9f043e --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-5999734.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af5727f4d1de384c14c65f6cbb1c981ebaf35a67ef11ac6a0dc3257ddc2ce2f +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-5999734.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-5999734.pt new file mode 100644 index 0000000000000000000000000000000000000000..80fb1032296620efcbad38cfab843d1dc386e309 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-5999734.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5becb75044f8cf858c1e6ff466529025a59421e3c0571b1177b5fb7e3135b6df +size 15534256 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-6999889.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-6999889.onnx new file mode 100644 index 0000000000000000000000000000000000000000..791894bae87887e2793ffee7fa8cee1619bd9369 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-6999889.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb3e9f36175572c8ba668a25f777410a93304aaad90793cf64c50fb2b763f77 +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-6999889.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-6999889.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd4693405f3df7baacfb0193f93b645946aa046d --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-6999889.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd2411d29b035badf1da5558d87bf94660d8ffb3737d243150c333dbd43bf0a +size 15534256 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-7999745.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-7999745.onnx new file mode 100644 index 0000000000000000000000000000000000000000..beb568a47081ecbcd88d30abb6b5d7b35df47262 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-7999745.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85b782df8dacc838c2f8018c058966ac57bad249f4945529c8f6d8f6f3b818a9 +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-7999745.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-7999745.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c0388d78f40a5c5ba069cbdbc98eb4978dd6f97 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-7999745.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c78ea11cc4ea2cd44575135c5fad9b0afbdf0c3ed7ecbb962685747b54fd9e3f +size 15534256 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-8999900.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-8999900.onnx new file mode 100644 index 0000000000000000000000000000000000000000..78c08fba5496412a32052a9a5861bb268981f758 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-8999900.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95ef8a1e3edb45703a83e96de199f45303a5b086b05cf6055d048bf71a649d7e +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-8999900.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-8999900.pt new file mode 100644 index 0000000000000000000000000000000000000000..90ffa2083d68a248dd99d0237a8c6927250c0f94 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-8999900.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56aa62e0a290f00b0531329989b82463a02d278e874a3d99459ac68b751136f +size 15534256 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-9999775.onnx b/results/tau_agent_D17_170M/TauAgent/TauAgent-9999775.onnx new file mode 100644 index 0000000000000000000000000000000000000000..9c63cef7f19f966430504a97472aedd6406dbcb8 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-9999775.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1f6e4531e338537318d74e1b77a684761c02932f904f63754fedfbe5dc81174 +size 2186395 diff --git a/results/tau_agent_D17_170M/TauAgent/TauAgent-9999775.pt b/results/tau_agent_D17_170M/TauAgent/TauAgent-9999775.pt new file mode 100644 index 0000000000000000000000000000000000000000..952dd9f9970b32f13fc33c512227f81598ccdcd0 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/TauAgent-9999775.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f475dc605b3fe456294d3a387ca5d7201ec8cad99560e66d57c24115fa694519 +size 15534256 diff --git a/results/tau_agent_D17_170M/TauAgent/checkpoint.pt b/results/tau_agent_D17_170M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..74a6e5a7dec5534856689e35166c9fcf1e446b70 --- /dev/null +++ b/results/tau_agent_D17_170M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f982d1544f6f45213b7631f260e7fdced596bd9728c92dc99696fa062429b0 +size 15533332 diff --git a/results/tau_agent_D17_170M/configuration.yaml b/results/tau_agent_D17_170M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..d5d0ebc091122f4508960e3432b3d41f8fe7ac48 --- /dev/null +++ b/results/tau_agent_D17_170M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D16\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Build + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D17 + initialize_from: tau_agent_D16 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false diff --git a/results/tau_agent_D18_180M/Tau-D18-180M.onnx b/results/tau_agent_D18_180M/Tau-D18-180M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..df6ff79acbd867417d48e9863594288445100da5 --- /dev/null +++ b/results/tau_agent_D18_180M/Tau-D18-180M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513b038233be14556d7eadc6200fbe50498231d66b2bdb53d2e1d1f495c18456 +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-10022625.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-10022625.onnx new file mode 100644 index 0000000000000000000000000000000000000000..df6ff79acbd867417d48e9863594288445100da5 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-10022625.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513b038233be14556d7eadc6200fbe50498231d66b2bdb53d2e1d1f495c18456 +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-10022625.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-10022625.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebeb1edc299582b2ea1b1c12eee65129f0dd1ed6 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-10022625.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37a05a79cad727c14dd63fad44364bf36c5930370a77ad4c88115f2c221b972c +size 15534410 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..77ae5bf5e77da8eb23607d7dccfd4d188fc893bb --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a5fa77f7bdaf77f3470f7732d7bb2fb5f27276d7214de8848a69d604d2f6e34 +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..8937633c27b00ff9c9ef35187f308a6d30b1a0e8 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd20ade02685adc06658b8c811402791ba068a57e4eadfee35a02dc89fdb9ef +size 15534256 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-2999867.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-2999867.onnx new file mode 100644 index 0000000000000000000000000000000000000000..14edf72dcaec45ed74fb567217a529af2370b479 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-2999867.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e2593c138bb79719c76f7078168eef018fefc8f3203b5302a2ce430018600f +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-2999867.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-2999867.pt new file mode 100644 index 0000000000000000000000000000000000000000..128d96aa3cd2d8d4194c16d26a5b0c134cb90a5e --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-2999867.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:388a3f1b0db0349d586283fce919ed25c1f0be310aa414090772491185452054 +size 15534256 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-3999723.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-3999723.onnx new file mode 100644 index 0000000000000000000000000000000000000000..b4afd1f5666ca617e52d8b8f257261a54d55d35e --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-3999723.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6780d994bce7d709166cf00cbea24c0db7c9e3bd2a0fd5bbcbd3139026d848c2 +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-3999723.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-3999723.pt new file mode 100644 index 0000000000000000000000000000000000000000..d30e8e09b43e394f690e1bef8a8a44b5afa7bee1 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-3999723.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b08e408a9f5915f0b7f8b33164299358a325f060210521b1af93eff6f7601f11 +size 15534256 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-4999878.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-4999878.onnx new file mode 100644 index 0000000000000000000000000000000000000000..a5432e3f2bb0a5bdde8cdc3899c3a25ba05958b2 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-4999878.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59672db9e27e0ab02e9e0e2996608338f63b0b0343d7a307556be4fb834b5f90 +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-4999878.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-4999878.pt new file mode 100644 index 0000000000000000000000000000000000000000..c36819d8e51bc64c710b6cc97eb8b1004542ac79 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-4999878.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6583f639d2475c2199231c37135fb43545161ac00c4076bbc54a425c9a47c808 +size 15534256 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-5999734.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-5999734.onnx new file mode 100644 index 0000000000000000000000000000000000000000..79c7d9ab9691412b0d969bfd2597293c509828ee --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-5999734.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79943ac9e5e8c17024c5e3d05f353e7714db6284941570c55495c9fa1d96315d +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-5999734.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-5999734.pt new file mode 100644 index 0000000000000000000000000000000000000000..795e55babb72cadb056c5c8782bb9f1573e999ef --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-5999734.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ea02e560901c164f95aa5488114f08ee9042e76832357ec9d9219cedea65a9 +size 15534256 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-6999889.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-6999889.onnx new file mode 100644 index 0000000000000000000000000000000000000000..d32d7688f13adffdb6d0b221ed10d69326b81336 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-6999889.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2e9d4c50d9528bd0df1604904c9265accd3bf30aebe3a2ba609ee19028e3c15 +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-6999889.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-6999889.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed2e8acf9eff52b7d4b83edcb9068f107f4bd5c --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-6999889.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53a47ed2825df2780a4a176ef64c9757cf8bd13db91f2ad3b032e6d7165987dd +size 15534256 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-7999725.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-7999725.onnx new file mode 100644 index 0000000000000000000000000000000000000000..786cd45c531cac04e0d7bad81ce30e59a1215138 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-7999725.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9fccf024e321c9e445a7067cb940af1516e8414a5f3bad892c1df6b2730d78 +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-7999725.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-7999725.pt new file mode 100644 index 0000000000000000000000000000000000000000..65c1bdcfbcc43c8f5deefa4b5e8aae358a9d49fc --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-7999725.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96569afe1594676d82ae3df35c65c2dacba3b14cafb48fc8839e43e913b38c37 +size 15534256 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-8999925.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-8999925.onnx new file mode 100644 index 0000000000000000000000000000000000000000..080febdeb58696378de121440fe8961ba99b24ab --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-8999925.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb20970651d58960ef9aab83b069a9eea970325ef29e597ad63f633328d3d52 +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-8999925.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-8999925.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bb5f4f8b8e5f65565232de6fcac0e58e065feda --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-8999925.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d440cab3201652a7ed0954ceb64e1389a2d0bcba078a55c8b7d033d5f305e538 +size 15534256 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-9999825.onnx b/results/tau_agent_D18_180M/TauAgent/TauAgent-9999825.onnx new file mode 100644 index 0000000000000000000000000000000000000000..e3b7bb6b21f9d44e8d9c9628eede8da4aa8a9f70 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-9999825.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f5b4270e247b026111edddb90c4db2d66c9dc2c6e3daa3897f8a860d59046f +size 2186395 diff --git a/results/tau_agent_D18_180M/TauAgent/TauAgent-9999825.pt b/results/tau_agent_D18_180M/TauAgent/TauAgent-9999825.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0f2e6a0d29921632ff65b002004fff5fbe9071 --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/TauAgent-9999825.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56f9d4ec3ea35bafb2ade08ff52ea721d987f3089d8d07bd4d40253b539ea199 +size 15534256 diff --git a/results/tau_agent_D18_180M/TauAgent/checkpoint.pt b/results/tau_agent_D18_180M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5111e9a7c74764ecdfca8c57204761efec1183e --- /dev/null +++ b/results/tau_agent_D18_180M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610a5d207454617b71f0e8aafb971c9b975ae1c7afcbe4887955a790639bb7e4 +size 15533332 diff --git a/results/tau_agent_D18_180M/configuration.yaml b/results/tau_agent_D18_180M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..02e5ed63159739ba4288960bcebe91fb8b27c4b1 --- /dev/null +++ b/results/tau_agent_D18_180M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D17\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Build + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D18 + initialize_from: tau_agent_D17 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false diff --git a/results/tau_agent_D19_190M/Tau-D19-190M.onnx b/results/tau_agent_D19_190M/Tau-D19-190M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..a375669dd4c443ec09ea5afd87b6a8475cc6b31a --- /dev/null +++ b/results/tau_agent_D19_190M/Tau-D19-190M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a710b7ac67f4d21e32bc3ce914bc694b470cfb179d3f0058b8e7b3685979ca +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-0.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-0.onnx new file mode 100644 index 0000000000000000000000000000000000000000..df6ff79acbd867417d48e9863594288445100da5 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-0.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513b038233be14556d7eadc6200fbe50498231d66b2bdb53d2e1d1f495c18456 +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-0.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-0.pt new file mode 100644 index 0000000000000000000000000000000000000000..741dd63c914f014dd00628daab8958ae3dcb6df5 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2987f9a834f7956cbe464268383b3dc322354ab8490970a81211f7e99ec9c369 +size 15533332 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-10026875.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-10026875.onnx new file mode 100644 index 0000000000000000000000000000000000000000..a375669dd4c443ec09ea5afd87b6a8475cc6b31a --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-10026875.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a710b7ac67f4d21e32bc3ce914bc694b470cfb179d3f0058b8e7b3685979ca +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-10026875.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-10026875.pt new file mode 100644 index 0000000000000000000000000000000000000000..7df2465f7203b71c4aef97f14164fba76ff2b7ee --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-10026875.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce32f7a4d798dd57f7920d4654deba9db087de122b391e6c0a35b7bee5fecab0 +size 15534410 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..377f60e9fe4a5e7b3fc5bba5e0694083df67bf86 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df7f4a94ee32f36c1866b032abee670b58a1cdad4d199c24e4eaa74b700ffaa1 +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0efaae739eb958fc8c3a679d821c79569758579 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e7e0ed4f2b1de0aeb3c5f7bba4b4f7e96ecfd60870c38964f0738e2266b0c9f +size 15534256 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-2999867.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-2999867.onnx new file mode 100644 index 0000000000000000000000000000000000000000..1c888ce7657d108ec3c9427bcf78bc47465dc1a1 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-2999867.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7490b672a2627da3848c5f480b37d6c41ad11da13591f39e11a29a7331b229df +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-2999867.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-2999867.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f90949dc71991709fddf6fe070c368d8e957286 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-2999867.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a4dd903d5029d08a47737614e6b91a9116518fd8c9c6a8497b2567fc749add2 +size 15534256 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-3999723.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-3999723.onnx new file mode 100644 index 0000000000000000000000000000000000000000..b16a1d8fbbb4c07538d9353aaa66ba9275715623 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-3999723.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3939e94bde49091c0a635ad189fa6a5643f54efeb0ced079a253b5a2c2abf43b +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-3999723.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-3999723.pt new file mode 100644 index 0000000000000000000000000000000000000000..af3a5de782bc3576bc313f3ebf51fd88fd08ca3d --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-3999723.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a88f96df3256666a949604f3dfe396491a8353e60246972e75406e5e94dc9385 +size 15534256 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-4999878.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-4999878.onnx new file mode 100644 index 0000000000000000000000000000000000000000..7f7ce7aac5e85ffd84a4d3c1f90bcbfaa395d5a0 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-4999878.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f9f944fe72e6a496893afb3dea1a767006861117fd7a2710a11ffa4441f9a90 +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-4999878.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-4999878.pt new file mode 100644 index 0000000000000000000000000000000000000000..975077faa9025c5bdfb9d2fc9b3366da19eed5b5 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-4999878.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3376788bb286c1b05fd2ca52e974aa1aba8796e4e9f9d39a7d36a809873bb57b +size 15534256 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-5999734.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-5999734.onnx new file mode 100644 index 0000000000000000000000000000000000000000..a6e4a322f509758e1c7344f7f6724cb907968cac --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-5999734.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5abffd1abada69cbc630943dd23735c2b288036e566706f5473b60cce6064f65 +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-5999734.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-5999734.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ca4991876b44b4169e3105fe43c256a4aa4aefc --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-5999734.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4758f352f42846847dc5df1716ab18e97c9855204a1e2503344aaf0b0e29866 +size 15534256 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-6999875.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-6999875.onnx new file mode 100644 index 0000000000000000000000000000000000000000..ea598b97b12e36e0a1d83e0828268b5b5df3fc60 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-6999875.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9173e41395fb132b9f7862261979b075adbbe4609b104511b8417c2028fe0d9e +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-6999875.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-6999875.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a3581499eec919b6a8dba71e0acc6b04f3e208d --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-6999875.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb4fae39b597f37e69f754b79daa0b9c6b22f80076b6d0fd79e40c2e8934376 +size 15534256 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-7999775.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-7999775.onnx new file mode 100644 index 0000000000000000000000000000000000000000..3359c213db091fbbfd702690eefe0d853ecd22e1 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-7999775.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:798badc233e85b616c830f164790c3e65a2963206e027afd93598d9f8c4cd5f2 +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-7999775.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-7999775.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d7586795248664717e9694de2036dbf9109d745 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-7999775.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2991e60950eca9572310001a741a9ba2ee0152c3153253eff3e81b8819847a02 +size 15534256 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-8999975.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-8999975.onnx new file mode 100644 index 0000000000000000000000000000000000000000..63feb570e414a7bce87af3edea64d023933d676f --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-8999975.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6d7d19c7e450fd67ddc7d4ed88158fedfd9dc2efab144b2b7d1a4a1d830d0f0 +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-8999975.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-8999975.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbb7d528c95409406ac05a450fa6aacb2b51ec4e --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-8999975.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:036a7a9c58aa7c566a554d54ca39a6a06616709278a1121ab471e15cbf2f0267 +size 15534256 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-9999875.onnx b/results/tau_agent_D19_190M/TauAgent/TauAgent-9999875.onnx new file mode 100644 index 0000000000000000000000000000000000000000..79c83dba678981a9eb24d361209503faccc1fec8 --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-9999875.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda96adca818ef202def6d90a0b70f112e8c705018242ee568434b146039061a +size 2186395 diff --git a/results/tau_agent_D19_190M/TauAgent/TauAgent-9999875.pt b/results/tau_agent_D19_190M/TauAgent/TauAgent-9999875.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f1505c0a240502d74fb67b242255f38ef5c513d --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/TauAgent-9999875.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:450e95f5b041ffac70883db79b3d6e138b88dd5b89d4e76761424b11133e72a3 +size 15534256 diff --git a/results/tau_agent_D19_190M/TauAgent/checkpoint.pt b/results/tau_agent_D19_190M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e47835d71fdaad1dabb64afb215e95e61b448dc --- /dev/null +++ b/results/tau_agent_D19_190M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac63b23b69f92c1f7416214990bf5d271bef6257d2ab304f8ec1a0498abb0981 +size 15533332 diff --git a/results/tau_agent_D19_190M/configuration.yaml b/results/tau_agent_D19_190M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..7011eda41afe805f855c3827225516dc8719d48e --- /dev/null +++ b/results/tau_agent_D19_190M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D18\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Builds\001 + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D19 + initialize_from: tau_agent_D18 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false diff --git a/results/tau_agent_D20_200M/Tau-D20-200M.onnx b/results/tau_agent_D20_200M/Tau-D20-200M.onnx new file mode 100644 index 0000000000000000000000000000000000000000..fabd2693416e574e7b8968d149c69696d0acbeba --- /dev/null +++ b/results/tau_agent_D20_200M/Tau-D20-200M.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53fa9d458d87b79d4e2144923ae9cebee8fbe666229521e976ca84cea8fd04ab +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-10020375.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-10020375.onnx new file mode 100644 index 0000000000000000000000000000000000000000..fabd2693416e574e7b8968d149c69696d0acbeba --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-10020375.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53fa9d458d87b79d4e2144923ae9cebee8fbe666229521e976ca84cea8fd04ab +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-10020375.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-10020375.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6cf3f9bedc974895f5526d04c0850c95f3f3520 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-10020375.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd5fbd4dd5cbd2956ea8b063ce2b3451ed1b54ae89405c22ca7cf96a11ff533 +size 15534410 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-1999712.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-1999712.onnx new file mode 100644 index 0000000000000000000000000000000000000000..aa93f86f024e7a197302b0f00f324d033f71ab0a --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-1999712.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590cc10764078a6a8f3e1abbc8d4677ba0809390b4d39ee4914675e110910c7a +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-1999712.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-1999712.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b7b73002cc9112fd65db8461a309c9e8ab6f838 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-1999712.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6da3bbed08798c5c5dda37dc399103efc4120fa3f9a684628d386a2594c0d77 +size 15534256 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-2999867.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-2999867.onnx new file mode 100644 index 0000000000000000000000000000000000000000..c5d3e58aaf7f70d5cf9346d7be622b8b41110d16 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-2999867.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7bb88df0eb55b2d0fdd62857af5dac066595a154db096640566e4e7fcd8199 +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-2999867.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-2999867.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cefafec2c67c3c663acc972d985af1c699e5bb2 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-2999867.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac2c1fc7e7b5eb4cdd6fd17b70fc8f06aeacb4abb3095c4343034d64a160ef3 +size 15534256 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-3999723.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-3999723.onnx new file mode 100644 index 0000000000000000000000000000000000000000..debac8059cd22be99434e68dd07f801dbea9b556 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-3999723.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d66057bcc560b61451ba57a02f973cbc6568ff5ab002dd1b0cfdc02985736c3e +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-3999723.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-3999723.pt new file mode 100644 index 0000000000000000000000000000000000000000..eed5e9f866d8bf279b5275d09120ab81338cac8b --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-3999723.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88fe50f07677ed032599f732f5f5f2d11987f679184d68ce6cb5b1ecbd1e9a31 +size 15534256 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-4999878.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-4999878.onnx new file mode 100644 index 0000000000000000000000000000000000000000..87d7e17bb5efc0c01a1f77c0b58878de902be028 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-4999878.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7b983c466363521c08c41e69475d6471aa1bfe133695f0f6d6786f7e7d58c9 +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-4999878.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-4999878.pt new file mode 100644 index 0000000000000000000000000000000000000000..288929ad7c8c47a9feaadeee9e88663b8bc9bb8f --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-4999878.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced8fd53281a8005729b5a8df8a4dfdc981b65fdd6eb86c55acfa2085fe10251 +size 15534256 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-5999734.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-5999734.onnx new file mode 100644 index 0000000000000000000000000000000000000000..a9d80b5e9dbd448261cf92fdba06288002205adf --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-5999734.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67b669b6e2f283e1e80c887910af77c08108609af5921f76a5fae273e38cc5dc +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-5999734.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-5999734.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d20663b0c8f64a6aa7fb95d6615b2a178d5a81b --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-5999734.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed8e83f96cf4fb67d300ee5727328e7630dce0a1fefd8fd6cb7a33e27f9767e3 +size 15534256 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-6999889.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-6999889.onnx new file mode 100644 index 0000000000000000000000000000000000000000..701e5905e9e81b89753555dc8e394e94ce169898 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-6999889.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4181abaabb7767ce8dba062e457c5c2078397959d000a77b21c12afac487a43 +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-6999889.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-6999889.pt new file mode 100644 index 0000000000000000000000000000000000000000..da2f6bb0d9fdd340fbf092cb91e0312d6e20a2d2 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-6999889.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdd4ec77c8b6f9f357d9c11170b4e0e7e0b8b1538ef1f6722a73c2daeba4ca4c +size 15534256 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-7999745.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-7999745.onnx new file mode 100644 index 0000000000000000000000000000000000000000..0f9c9a1186016e8a653c268ad70320f29e0fe972 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-7999745.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6bd6d5de8ecfcb39bbd65c79391024fa163feab48e0128fa847badabf717296 +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-7999745.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-7999745.pt new file mode 100644 index 0000000000000000000000000000000000000000..66924b3fd9d441257ceb1f0e44959645419b7310 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-7999745.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:334daaf1ea345269be5f59049890ec4b6d2bc8840708bc373965f64d5279c2e6 +size 15534256 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-8999775.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-8999775.onnx new file mode 100644 index 0000000000000000000000000000000000000000..cfe4e649b260785dd81c483112a6c23f472557e9 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-8999775.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e2be3d3225da52892e1109e1f93d0337a3f44a99d4275d1721c2b46bb5074fb +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-8999775.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-8999775.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f981a859d88b88c2d09fc79173e2f242e04eb31 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-8999775.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbf771148dbb90fe2eb6254486ff15c50b66e4f22dea4afc8e2f83a626f10360 +size 15534256 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-9999975.onnx b/results/tau_agent_D20_200M/TauAgent/TauAgent-9999975.onnx new file mode 100644 index 0000000000000000000000000000000000000000..7a19cfa051f04003f6d1b759f3b4c91fc98186c6 --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-9999975.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4f12a8ec7744f5f11a2f95af3a232259b50effa1f78e751054177f5ccabdf3b +size 2186395 diff --git a/results/tau_agent_D20_200M/TauAgent/TauAgent-9999975.pt b/results/tau_agent_D20_200M/TauAgent/TauAgent-9999975.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fea68705d1dedf2f1148f00577b73683451b52a --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/TauAgent-9999975.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:070dba7a160f5bab1373a65e20b2073e07413a86f7a8c4359471a414016f9398 +size 15534256 diff --git a/results/tau_agent_D20_200M/TauAgent/checkpoint.pt b/results/tau_agent_D20_200M/TauAgent/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebf9cee9a6c3de9972065438bcb370cf012effec --- /dev/null +++ b/results/tau_agent_D20_200M/TauAgent/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b48ca6e6e3e91b84601a9d3f49303a0c5c96bc352fee3093a98bc48bf497f0 +size 15533332 diff --git a/results/tau_agent_D20_200M/configuration.yaml b/results/tau_agent_D20_200M/configuration.yaml new file mode 100644 index 0000000000000000000000000000000000000000..a1b99bbfefa9b8e1c0ccdc9c25d370ec1cec8361 --- /dev/null +++ b/results/tau_agent_D20_200M/configuration.yaml @@ -0,0 +1,95 @@ +default_settings: null +behaviors: + TauAgent: + trainer_type: ppo + hyperparameters: + batch_size: 512 + buffer_size: 4096 + learning_rate: 3.0e-05 + beta: 0.005 + epsilon: 0.2 + lambd: 0.95 + num_epoch: 3 + shared_critic: false + learning_rate_schedule: linear + beta_schedule: linear + epsilon_schedule: linear + checkpoint_interval: 1000000 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + reward_signals: + extrinsic: + gamma: 0.99 + strength: 1.0 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: + sequence_length: 128 + memory_size: 256 + goal_conditioning_type: hyper + deterministic: false + curiosity: + gamma: 0.995 + strength: 0.1 + network_settings: + normalize: true + hidden_units: 256 + num_layers: 4 + vis_encode_type: simple + memory: null + goal_conditioning_type: hyper + deterministic: false + learning_rate: 3.0e-05 + encoding_size: null + init_path: results\tau_agent_D19\TauAgent\checkpoint.pt + keep_checkpoints: 10 + even_checkpoints: true + max_steps: 10000000 + time_horizon: 512 + summary_freq: 100000 + threaded: true + self_play: null + behavioral_cloning: null +env_settings: + env_path: .\Builds\001 + env_args: null + base_port: 5005 + num_envs: 1 + num_areas: 1 + timeout_wait: 300 + seed: -1 + max_lifetime_restarts: 10 + restarts_rate_limit_n: 1 + restarts_rate_limit_period_s: 60 +engine_settings: + width: 84 + height: 84 + quality_level: 5 + time_scale: 20 + target_frame_rate: -1 + capture_frame_rate: 60 + no_graphics: false +environment_parameters: null +checkpoint_settings: + run_id: tau_agent_D20 + initialize_from: tau_agent_D19 + load_model: false + resume: false + force: true + train_model: false + inference: false + results_dir: results +torch_settings: + device: cuda +debug: false