croumegous
commited on
Commit
•
76a8a04
1
Parent(s):
00d2fd0
Better model performance
Browse files- README.md +1 -1
- args.yml +7 -7
- ppo-Swimmer-v3.zip +2 -2
- ppo-Swimmer-v3/data +21 -21
- ppo-Swimmer-v3/policy.optimizer.pth +1 -1
- ppo-Swimmer-v3/policy.pth +1 -1
- ppo-Swimmer-v3/system_info.txt +3 -3
- replay.mp4 +2 -2
- results.json +1 -1
- train_eval_metrics.zip +2 -2
- vec_normalize.pkl +2 -2
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: Swimmer-v3
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: Swimmer-v3
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 366.72 +/- 0.68
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
args.yml
CHANGED
@@ -10,7 +10,7 @@
|
|
10 |
- - env_kwargs
|
11 |
- null
|
12 |
- - eval_episodes
|
13 |
-
-
|
14 |
- - eval_freq
|
15 |
- 25000
|
16 |
- - gym_packages
|
@@ -18,13 +18,13 @@
|
|
18 |
- - hyperparams
|
19 |
- null
|
20 |
- - log_folder
|
21 |
-
- logs
|
22 |
- - log_interval
|
23 |
- -1
|
24 |
- - max_total_trials
|
25 |
- null
|
26 |
- - n_eval_envs
|
27 |
-
-
|
28 |
- - n_evaluations
|
29 |
- null
|
30 |
- - n_jobs
|
@@ -54,15 +54,15 @@
|
|
54 |
- - save_replay_buffer
|
55 |
- false
|
56 |
- - seed
|
57 |
-
-
|
58 |
- - storage
|
59 |
- null
|
60 |
- - study_name
|
61 |
- null
|
62 |
- - tensorboard_log
|
63 |
-
-
|
64 |
- - track
|
65 |
-
-
|
66 |
- - trained_agent
|
67 |
- ''
|
68 |
- - truncate_last_trajectory
|
@@ -74,7 +74,7 @@
|
|
74 |
- - verbose
|
75 |
- 1
|
76 |
- - wandb_entity
|
77 |
-
-
|
78 |
- - wandb_project_name
|
79 |
- sb3
|
80 |
- - wandb_tags
|
|
|
10 |
- - env_kwargs
|
11 |
- null
|
12 |
- - eval_episodes
|
13 |
+
- 20
|
14 |
- - eval_freq
|
15 |
- 25000
|
16 |
- - gym_packages
|
|
|
18 |
- - hyperparams
|
19 |
- null
|
20 |
- - log_folder
|
21 |
+
- logs
|
22 |
- - log_interval
|
23 |
- -1
|
24 |
- - max_total_trials
|
25 |
- null
|
26 |
- - n_eval_envs
|
27 |
+
- 5
|
28 |
- - n_evaluations
|
29 |
- null
|
30 |
- - n_jobs
|
|
|
54 |
- - save_replay_buffer
|
55 |
- false
|
56 |
- - seed
|
57 |
+
- 3324951722
|
58 |
- - storage
|
59 |
- null
|
60 |
- - study_name
|
61 |
- null
|
62 |
- - tensorboard_log
|
63 |
+
- runs/Swimmer-v3__ppo__3324951722__1673946687
|
64 |
- - track
|
65 |
+
- true
|
66 |
- - trained_agent
|
67 |
- ''
|
68 |
- - truncate_last_trajectory
|
|
|
74 |
- - verbose
|
75 |
- 1
|
76 |
- - wandb_entity
|
77 |
+
- croumegous
|
78 |
- - wandb_project_name
|
79 |
- sb3
|
80 |
- - wandb_tags
|
ppo-Swimmer-v3.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ddeb385d47f4b117cc084e52fb50236603f5f7ff926f779e8c62bafc2b97664
|
3 |
+
size 151380
|
ppo-Swimmer-v3/data
CHANGED
@@ -4,20 +4,20 @@
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
11 |
-
"_build": "<function ActorCriticPolicy._build at
|
12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
13 |
-
"extract_features": "<function ActorCriticPolicy.extract_features at
|
14 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
15 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
16 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
17 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
18 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
19 |
"__abstractmethods__": "frozenset()",
|
20 |
-
"_abc_impl": "<_abc_data object at
|
21 |
},
|
22 |
"verbose": 1,
|
23 |
"policy_kwargs": {},
|
@@ -36,7 +36,7 @@
|
|
36 |
},
|
37 |
"action_space": {
|
38 |
":type:": "<class 'gym.spaces.box.Box'>",
|
39 |
-
":serialized:": "
|
40 |
"dtype": "float32",
|
41 |
"_shape": [
|
42 |
2
|
@@ -53,15 +53,15 @@
|
|
53 |
"_num_timesteps_at_start": 0,
|
54 |
"seed": 0,
|
55 |
"action_noise": null,
|
56 |
-
"start_time":
|
57 |
"learning_rate": {
|
58 |
":type:": "<class 'function'>",
|
59 |
-
":serialized:": "
|
60 |
},
|
61 |
-
"tensorboard_log":
|
62 |
"lr_schedule": {
|
63 |
":type:": "<class 'function'>",
|
64 |
-
":serialized:": "
|
65 |
},
|
66 |
"_last_obs": null,
|
67 |
"_last_episode_starts": {
|
@@ -70,7 +70,7 @@
|
|
70 |
},
|
71 |
"_last_original_obs": {
|
72 |
":type:": "<class 'numpy.ndarray'>",
|
73 |
-
":serialized:": "
|
74 |
},
|
75 |
"_episode_num": 0,
|
76 |
"use_sde": false,
|
@@ -78,7 +78,7 @@
|
|
78 |
"_current_progress_remaining": -0.0035199999999999676,
|
79 |
"ep_info_buffer": {
|
80 |
":type:": "<class 'collections.deque'>",
|
81 |
-
":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////
|
82 |
},
|
83 |
"ep_success_buffer": {
|
84 |
":type:": "<class 'collections.deque'>",
|
@@ -95,7 +95,7 @@
|
|
95 |
"n_epochs": 10,
|
96 |
"clip_range": {
|
97 |
":type:": "<class 'function'>",
|
98 |
-
":serialized:": "
|
99 |
},
|
100 |
"clip_range_vf": null,
|
101 |
"normalize_advantage": true,
|
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7f2e940d0a60>",
|
8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f2e940d0af0>",
|
9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f2e940d0b80>",
|
10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f2e940d0c10>",
|
11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7f2e940d0ca0>",
|
12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7f2e940d0d30>",
|
13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x7f2e940d0dc0>",
|
14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f2e940d0e50>",
|
15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7f2e940d0ee0>",
|
16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f2e940d0f70>",
|
17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f2e940d6040>",
|
18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7f2e940d60d0>",
|
19 |
"__abstractmethods__": "frozenset()",
|
20 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f2e9442bec0>"
|
21 |
},
|
22 |
"verbose": 1,
|
23 |
"policy_kwargs": {},
|
|
|
36 |
},
|
37 |
"action_space": {
|
38 |
":type:": "<class 'gym.spaces.box.Box'>",
|
39 |
+
":serialized:": "gAWVDgwAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLAoWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAAAAIC/AACAv5RoCksChZSMAUOUdJRSlIwEaGlnaJRoEiiWCAAAAAAAAAAAAIA/AACAP5RoCksChZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolgIAAAAAAAAAAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLAoWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYCAAAAAAAAAAEBlGghSwKFlGgVdJRSlIwKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwSX19yYW5kb21zdGF0ZV9jdG9ylJOUjAdNVDE5OTM3lGgtjBRfX2JpdF9nZW5lcmF0b3JfY3RvcpSTlIaUUpR9lCiMDWJpdF9nZW5lcmF0b3KUjAdNVDE5OTM3lIwFc3RhdGWUfZQojANrZXmUaBIolsAJAAAAAAAAAAAAgFPCs5yHA7WTcuyrW+jmsvLPtoHa1QbvYaExTaBrtczZE+YYn3SceS/IpRuAxHkBSZ4PQ+Rd4BiTkhNVzNRKKWTSCJW+NNCeRHJ6A/Ctvwpzm3s+6WCxBtp1A0ULbn3WFmrrBDRmg7fz9aUvae9CY0O1XPfCd1LMRkQ3LQiJbtCOrnf7GLaAT3ue+U8y7BLYuY5ehakZyq49di1nK0KAnsXuxx/1IgFdS88kD8wZUmREV5hwnQr1Ehe16VreO8T/Qc86sV+2h90z2FiJqqLNf3s/yZS3bA9DHzGZfRtgkKu3Bx0ZTN7I+466APXPqRreJf4gBqUW/NB248FO9cpD0wFaed9QV63NqpiFOs/RYeEwD8e32dZFRfi9SK5aLvuApJMu2LOfZweypHIkyPjeY5W+tsm2bdPmVoCAOiyi73cf5k0LQeJNWqZU/wuy/f8myghZ9qrjf+2JSJMaB9VNMXWmxuq4Dq0fkhzJr1ML7SgftfSG29O5koFUMozQL58gAzyX96ZMcpWbZ+3/zlaVhGln5egXC8MtIK6xIFCvh/vD/F1jLgYIp14MM597MuPmTpa+OaKek7bql9Cp8/0skhg5QSCvCaijm8wenxrfqLyRxDPCpS+L3isJC5LrjFgWnsdxQXVrJK8uaobJcTIJ5NrYYfA2l5gH27iPI9EqhzFtZJXiE4vXpH18f3kouYV9RowPzOtmYsbmstR/Mx/VY7E0XBmnMidL4dYTUXgxaDbFxWy3y6miL2yw0I2O09vPWV7LqbwMbthlU26lrLfnJDz88B+7y4pFCwvsHgCsMWq6pvroAF4Ms+++JnhzrL0GLrtfJ7667p42Vg78GirmKIRMFH0p6aLRPV4V/fclE3PLBj0InU315M5v7fDFj/IreJeFUhIAy5/BlvLdgwIfBMBWvyjhqGRBo2KmdiDAO9BPhdi6oGmZUCxTDjUyMd8rjeRdntTE+L9sHQUSvUfpRjKcSIjZXcjsMMSwwU0QzIXewD4nZg8EAZ72iHnChWveW7cB5EQRFE+YPvvyNAw4OvORF+DjDtmLUz6jNz0JbkuKbhIQEEVbpDRkoeIGA4HATymZeE4TX/hvhOxJfX5liXD9/Uon8OjJ/hhIrDNUYR2NOV2R1L+VuK/JA9o0izGPiCC9vi7UK1u4re8tvPrBInC6BH2DpMvWSRepdH0frFxGsH/kRB/S77USeMs38a+yorDaa9Wsb9WnuQg10vl087jhvwSZx77fGq52NV1h/UnZAjnqJOjCPBgQrY0wsSeSW6SOSdItAOupiWkVvSzHz+gopd/3FUUPbjdik7Vd6O6ycGOFwp4+wyZqq1MKHww5exJND6De8NB4fGBzsvKoT8O1fAC3Y2Z+3mLYwkCJXULx2zNSO90bQi0L0BhTF1AidNtqRkak72V+V1kos6m4F+kyZiOiwxfcHKWHmpQe3A8HpX6nacx0Zso0WyF/W/sOLo//2g0YD9koIjgKvw//f9Em4CvxNBUMnJYTVQJGysF4QMShnM6byaMNJhRVALf+X0+SgLJkEwLfKdBbKxjA035OEc2YKmUpvooVUUt+9U8d7cKRgNYKKPwCHyYfLJSQt4ZEdThgjeywDxgsGzPax5SklOLroSYn39feofatZDzJXevfPTHyi1ZLwpe6Hwkbqz1FuOnHiShPedbEA9b/HCtBytSZrgUwlwHpQlAiBTSxpN7TFzVZrrhRd6N8W+FeE9SAGCHwXchFR4SCGThPyRGO/XWkMPJ42BLUOmMGepDQgWH646tjoJSE3EXcA5iDS+Nq6Oh521oC2UPAnvxIj1QbVh8IbxlBytRTTjc0c14E9cyhIPlgIoHriuEFSMXSEzOGL1MmL6UCbiXfsRg9Z6OwWCCl3VeGg5bEZ1kjJkvs08k7wtPk4ATAjaTL3QoY2gf106zFbJtL4D5gmLMJ9OuzE2Fn5uaAqqpjXIqqEXxS9jtpsRU9VTHCg68RwXQVIUhuVJgHq8fOigBMrW7Am5+jjo/GNNlcFcp813dFiXy4qHhjGSEjNXp3ln03NZkOgqXQ8SalJlPOvyrAS9wW9EtjQKhcrBSWSsQ8C3o/Mc/sR/CMRB85ZIojR/tiCKtOutxQMIusIOnYHK8g6kPpTQ8J/PfJ8pa3GEoYoA67axQTXsysd2Y6ZDwpz1HkAeISVK2AlCcuQssrQv8dVLAcins/2kjRFp5Vp82HSX9j6Ci9GH5mkdyqV84vWsdwRz4JNXHZoHVZKnrxSdA1HUwRUI/5oWiqnGk9KyiS4Mv9dQIVluJ1+/pAHYEdG9YgLHiNE2zA7aIQbqqlGX6jH1CrHSPL9mnlHdPiKjozwRXu02UQuzlGJn+/PUkU6cPYLLeLc8e7S2qfCZxbdpHioand7wYKqb5bMb8dA3Dwvm6P6iJXSogJ+Q+0z43li8ydYJqZNZlSjsljr/2c5UU33vMhLDLEXIHT8WzrsS45TsKNbhYfTYx6Ds/8W5yOtiOPWc0+fRlAjbQC++FKo5UaMl2eRCxI4U5/heX2HxJGNk50rICjuFsG/8Q+NUuJgS+y3FMhe+sm1e2MdC+ldkBqEn8oRxajECbP4Wizz1tfJliW/1A5fdGTfUxM3HV72bJgnqswmoAumAx6d36KfuZwEEp0/wcrdo+8/unJ5f2mYeqCrOcaxDJrs6SxW1zVaH/YTZl+RNA0NjPLgaqnlveaes/MkpzsVEQDtvKGFrG1cnmGjZVi2azrSDGQ0Y423nEksDC5awYcOJmVYbeA4DkMSNfj+7Dx2SzH/PVPuXLX9aw9K9QF4Ml48zsSrwsVjIa8+gIdffs2pf2wCKcPtFez6vOT0UDuFHknJjMDg0fI3DnyC7jJqO8V4XpmPyarTp3JJRGhmqTHhpZInn70JMfS+RFry5+rLSOM0T+KWV8fYjs9eyCiZijlR4AiADooXm9G8JIzZCLZX2Dty83iyz7gQzSxYO7ULuTT1stvGuJwbBP4LMhLXkbxdhAmBSDiYNOnc3O+yFsO6Ps9UOQD8S4Pbr8hZ4mFjbicpO635SwpmHINYDeuewln3/GHz69LpCjmpnKPeF9ZxXcq6MR4kJUV2j/dQzqjLniNaQmrMkULdI7W1sMXRFcsz9xs1GVwVqmtMVws8HtvXMYNmosCrrgAFX2ghPz7dXCV6vML5YhfNbDAzzG6MHffrslrhMav3vtlt8Fnld4VaH6IhMkowayT1lSVvfvlKHCWwtKaTcOZrR5LZGalJOpFbVIFUOAo+LnY/25bmc3KloyLzgiTudjPsXEGPNPBIvE/5cMEvU4Lrs0N3tCke4abYDXF9f14QrwLlGgHjAJ1NJSJiIeUUpQoSwNoC05OTkr/////Sv////9LAHSUYk1wAoWUaBV0lFKUjANwb3OUTXACdYwJaGFzX2dhdXNzlEsAjAVnYXVzc5RHAAAAAAAAAAB1YnViLg==",
|
40 |
"dtype": "float32",
|
41 |
"_shape": [
|
42 |
2
|
|
|
53 |
"_num_timesteps_at_start": 0,
|
54 |
"seed": 0,
|
55 |
"action_noise": null,
|
56 |
+
"start_time": 1673946689743340401,
|
57 |
"learning_rate": {
|
58 |
":type:": "<class 'function'>",
|
59 |
+
":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Q6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
|
60 |
},
|
61 |
+
"tensorboard_log": "runs/Swimmer-v3__ppo__3324951722__1673946687/Swimmer-v3",
|
62 |
"lr_schedule": {
|
63 |
":type:": "<class 'function'>",
|
64 |
+
":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Q6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
|
65 |
},
|
66 |
"_last_obs": null,
|
67 |
"_last_episode_starts": {
|
|
|
70 |
},
|
71 |
"_last_original_obs": {
|
72 |
":type:": "<class 'numpy.ndarray'>",
|
73 |
+
":serialized:": "gAWVdQEAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAQAAAAAAABa9QeFgerI/UAa1YDeihb/URHCAd8CwPzjKq7/YhZo/MuDaa/T8sD9SiHDyml64P/bVsPKxLLE/RNZj2Pl7ub9wk7mFMbe4P/SIVXlLebe/bMV8kVTGmL/WyxKLPc+2P49JdUYZ4be/l5UKpnyFrb+AsxNUmte2vyDbdXBEYXC/UEBhpB0+ez/dN0TesuSovzDKRuO9XIg/lrSb9L3csD99HnU/l96vv7BuhYt+LbK/AGd/D+77lD80YFi4skOZP3j+VaIWLZ4/1CrsP4mpoz+YBowyXcmgPzA/U1THTrA/pwbEI1i5pr8YHUB+xfSwP2fuPTOnNK+//oIyAohItj+UjAVudW1weZSMBWR0eXBllJOUjAJmOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLCIaUjAFDlHSUUpQu"
|
74 |
},
|
75 |
"_episode_num": 0,
|
76 |
"use_sde": false,
|
|
|
78 |
"_current_progress_remaining": -0.0035199999999999676,
|
79 |
"ep_info_buffer": {
|
80 |
":type:": "<class 'collections.deque'>",
|
81 |
+
":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIs5jYfBwrdkCUhpRSlIwBbJRN6AOMAXSUR0Ce0qEzO5avdX2UKGgGaAloD0MIGH0FaUZrdkCUhpRSlGgVTegDaBZHQJ7Smc4HX3B1fZQoaAZoCWgPQwjWxAJfEV52QJSGlFKUaBVN6ANoFkdAntKTshPj43V9lChoBmgJaA9DCIj1Rq3wTnZAlIaUUpRoFU3oA2gWR0Ce0o29tdiVdX2UKGgGaAloD0MIZ0Rpb3BBdkCUhpRSlGgVTegDaBZHQJ7zMsCkoF51fZQoaAZoCWgPQwigbwuW6lx2QJSGlFKUaBVN6ANoFkdAnvMq3y7PIHV9lChoBmgJaA9DCK4SLA6nT3ZAlIaUUpRoFU3oA2gWR0Ce8yQ6p5u7dX2UKGgGaAloD0MI+mAZG7pkdkCUhpRSlGgVTegDaBZHQJ7zHcBU70Z1fZQoaAZoCWgPQwjR6uQMhXd2QJSGlFKUaBVN6ANoFkdAnxO0bDMvAXV9lChoBmgJaA9DCP2C3bAtNXZAlIaUUpRoFU3oA2gWR0CfE60VafSQdX2UKGgGaAloD0MIle6us+GKdkCUhpRSlGgVTegDaBZHQJ8TppUPxx11fZQoaAZoCWgPQwjfh4OEqIJ2QJSGlFKUaBVN6ANoFkdAnxOgLiMo+nV9lChoBmgJaA9DCDoGZK93dXZAlIaUUpRoFU3oA2gWR0CfNLrQgLZ0dX2UKGgGaAloD0MIeJrMeJuddkCUhpRSlGgVTegDaBZHQJ80s3EQ5FR1fZQoaAZoCWgPQwit2jUh7aB2QJSGlFKUaBVN6ANoFkdAnzStQoCuEHV9lChoBmgJaA9DCK1rtBzom3ZAlIaUUpRoFU3oA2gWR0CfNKdHUc4pdX2UKGgGaAloD0MII4Wy8DV3dkCUhpRSlGgVTegDaBZHQJ9SzsiSq2l1fZQoaAZoCWgPQwiV7q6zIXh2QJSGlFKUaBVN6ANoFkdAn1LHcpLEk3V9lChoBmgJaA9DCNALdy4MaHZAlIaUUpRoFU3oA2gWR0CfUsFGoaUBdX2UKGgGaAloD0MItvY+VcVXdkCUhpRSlGgVTegDaBZHQJ9Su0gKWs11fZQoaAZoCWgPQwic+kDyDjt2QJSGlFKUaBVN6ANoFkdAn3KyAxzq8nV9lChoBmgJaA9DCJ3Ul6XdO3ZAlIaUUpRoFU3oA2gWR0Cfcqo86mwadX2UKGgGaAloD0MI0/caguNBdkCUhpRSlGgVTegDaBZHQJ9yo6RyOrB1fZQoaAZoCWgPQwhyi/m5IZN2QJSGlFKUaBVN6ANoFkdAn3KdNvfj0nV9lChoBmgJaA9DCIhkyLG1V3ZAlIaUUpRoFU3oA2gWR0Cfqac0cfeUdX2UKGgGaAloD0MIpnwIqgZpdkCUhpRSlGgVTegDaBZHQJ+pn3i704B1fZQoaAZoCWgPQwjmriXkA5p2QJSGlFKUaBVN6ANoFkdAn6mY5PuXu3V9lChoBmgJaA9DCKN1VDXBMXZAlIaUUpRoFU3oA2gWR0CfqZJ40Mw2dX2UKGgGaAloD0MIv7m/epw3dkCUhpRSlGgVTegDaBZHQJ/KNJ5E+gV1fZQoaAZoCWgPQwgSpb3BV152QJSGlFKUaBVN6ANoFkdAn8osynDR+nV9lChoBmgJaA9DCH3ogvoWiXZAlIaUUpRoFU3oA2gWR0CfyiYsunMudX2UKGgGaAloD0MI41MAjKdZdkCUhpRSlGgVTegDaBZHQJ/KH8yeqaR1fZQoaAZoCWgPQwhTWn9LAHx2QJSGlFKUaBVN6ANoFkdAn+oYybhFVnV9lChoBmgJaA9DCPSpY5XSi3ZAlIaUUpRoFU3oA2gWR0Cf6hDneSB9dX2UKGgGaAloD0MIP1OvW4RRdkCUhpRSlGgVTegDaBZHQJ/qCkbgjyF1fZQoaAZoCWgPQwj52F2gpIt2QJSGlFKUaBVN6ANoFkdAn+oD9fkWAXV9lChoBmgJaA9DCAn9TL1ubHZAlIaUUpRoFU3oA2gWR0CgBPGGucMFdX2UKGgGaAloD0MI7zhFR/KAdkCUhpRSlGgVTegDaBZHQKAE7ZQpF1B1fZQoaAZoCWgPQwh7vJAOD3d2QJSGlFKUaBVN6ANoFkdAoATqQcPvrnV9lChoBmgJaA9DCEjCvp0EZHZAlIaUUpRoFU3oA2gWR0CgBOcE3bVSdX2UKGgGaAloD0MIX2Is0y96dkCUhpRSlGgVTegDaBZHQKAUK7GvOhV1fZQoaAZoCWgPQwgpJQSrqpB2QJSGlFKUaBVN6ANoFkdAoBQnustCiXV9lChoBmgJaA9DCKeTbHV5Z3ZAlIaUUpRoFU3oA2gWR0CgFCRoh6jWdX2UKGgGaAloD0MIe9l22hp9dkCUhpRSlGgVTegDaBZHQKAUITBZZB91fZQoaAZoCWgPQwisb2ByI3N2QJSGlFKUaBVN6ANoFkdAoCOPRXwLE3V9lChoBmgJaA9DCNmwprJolXZAlIaUUpRoFU3oA2gWR0CgI4uTRplCdX2UKGgGaAloD0MIQs77/zhhdkCUhpRSlGgVTegDaBZHQKAjiH0se4l1fZQoaAZoCWgPQwij6lc6X212QJSGlFKUaBVN6ANoFkdAoCOFgYxcmnV9lChoBmgJaA9DCDKwjuNHj3ZAlIaUUpRoFU3oA2gWR0CgP0wc5sCUdX2UKGgGaAloD0MIEMr7OJqldkCUhpRSlGgVTegDaBZHQKA/SCtA9mp1fZQoaAZoCWgPQwhbQ6m9CKl2QJSGlFKUaBVN6ANoFkdAoD9E5dWyT3V9lChoBmgJaA9DCFFpxMz+k3ZAlIaUUpRoFU3oA2gWR0CgP0G0NSZSdX2UKGgGaAloD0MIrB+b5AdUdkCUhpRSlGgVTegDaBZHQKBPzt2LYPJ1fZQoaAZoCWgPQwgXLquwmVx2QJSGlFKUaBVN6ANoFkdAoE/K7GvOhXV9lChoBmgJaA9DCFQ3F39ba3ZAlIaUUpRoFU3oA2gWR0CgT8eaz/p/dX2UKGgGaAloD0MIcCNli+RjdkCUhpRSlGgVTegDaBZHQKBPxGDL8rJ1fZQoaAZoCWgPQwgQkZp28Tp2QJSGlFKUaBVN6ANoFkdAoGAsenyd4HV9lChoBmgJaA9DCGpMiLmkV3ZAlIaUUpRoFU3oA2gWR0CgYCjohY/3dX2UKGgGaAloD0MI5pE/GDgxdkCUhpRSlGgVTegDaBZHQKBgJfCQ9zR1fZQoaAZoCWgPQwjlQXqK3EJ2QJSGlFKUaBVN6ANoFkdAoGAjEm6XjXV9lChoBmgJaA9DCDiGAOCYMnZAlIaUUpRoFU3oA2gWR0CgcE2VVxS6dX2UKGgGaAloD0MIm+eIfFdKdkCUhpRSlGgVTegDaBZHQKBwSaaTfSB1fZQoaAZoCWgPQwglehnFckR2QJSGlFKUaBVN6ANoFkdAoHBGVX3g1nV9lChoBmgJaA9DCD60jxX8VXZAlIaUUpRoFU3oA2gWR0CgcEMfaHsUdX2UKGgGaAloD0MIt7JEZxmVdkCUhpRSlGgVTegDaBZHQKB/QzImw7l1fZQoaAZoCWgPQwj9EBss3Jp2QJSGlFKUaBVN6ANoFkdAoH8/QUpNK3V9lChoBmgJaA9DCHAofLZOrXZAlIaUUpRoFU3oA2gWR0CgfzvyLAHndX2UKGgGaAloD0MID5ccd0qCdkCUhpRSlGgVTegDaBZHQKB/OLofSx91fZQoaAZoCWgPQwjKNQUye492QJSGlFKUaBVN6ANoFkdAoI4LEvTPSnV9lChoBmgJaA9DCBR3vMlviXZAlIaUUpRoFU3oA2gWR0CgjgddVvMsdX2UKGgGaAloD0MISG+4j1x2dkCUhpRSlGgVTegDaBZHQKCOBEpAlfJ1fZQoaAZoCWgPQwj60XDKHIt2QJSGlFKUaBVN6ANoFkdAoI4BT4tYjnV9lChoBmgJaA9DCKIMVTGVQnZAlIaUUpRoFU3oA2gWR0CgqWSM98qndX2UKGgGaAloD0MI53Pudr1ndkCUhpRSlGgVTegDaBZHQKCpYJdjXnR1fZQoaAZoCWgPQwhH/8u16IF2QJSGlFKUaBVN6ANoFkdAoKldRFZxJnV9lChoBmgJaA9DCJ2f4jhwX3ZAlIaUUpRoFU3oA2gWR0CgqVoMz/IbdX2UKGgGaAloD0MIW18ktOWRdkCUhpRSlGgVTegDaBZHQKC5wADJU5x1fZQoaAZoCWgPQwix+bg2FEV2QJSGlFKUaBVN6ANoFkdAoLm8VYZEUnV9lChoBmgJaA9DCET5ghbSpHZAlIaUUpRoFU3oA2gWR0CgublC1JDmdX2UKGgGaAloD0MIy0dS0oNGdkCUhpRSlGgVTegDaBZHQKC5tkdV/+d1fZQoaAZoCWgPQwhJTbuY5np2QJSGlFKUaBVN6ANoFkdAoMpDTrmhd3V9lChoBmgJaA9DCImV0chnfXZAlIaUUpRoFU3oA2gWR0Cgyj9ytFKDdX2UKGgGaAloD0MI4dHGEStJdkCUhpRSlGgVTegDaBZHQKDKPDVH4Gl1fZQoaAZoCWgPQwjZk8DmnIB2QJSGlFKUaBVN6ANoFkdAoMo5AKOT7nV9lChoBmgJaA9DCNCzWfU5pXZAlIaUUpRoFU3oA2gWR0Cg2muPeYUndX2UKGgGaAloD0MIX2Is029HdkCUhpRSlGgVTegDaBZHQKDaZ+PRzBB1fZQoaAZoCWgPQwhRhqqYyqx2QJSGlFKUaBVN6ANoFkdAoNpkzMzMzXV9lChoBmgJaA9DCLN+MzHdl3ZAlIaUUpRoFU3oA2gWR0Cg2mHM2WIHdX2UKGgGaAloD0MI91j60MVcdkCUhpRSlGgVTegDaBZHQKDqWsz2vjh1fZQoaAZoCWgPQwhmFTYD3HB2QJSGlFKUaBVN6ANoFkdAoOpW4EwFknV9lChoBmgJaA9DCIJ0sWllbXZAlIaUUpRoFU3oA2gWR0Cg6lOSGJvYdX2UKGgGaAloD0MIDMufb0tydkCUhpRSlGgVTegDaBZHQKDqUF2V3Ux1fZQoaAZoCWgPQwhweEFEqnl2QJSGlFKUaBVN6ANoFkdAoPn8zVMEinV9lChoBmgJaA9DCF5jl6hecnZAlIaUUpRoFU3oA2gWR0Cg+fjhcZ+AdX2UKGgGaAloD0MIx0eLMwZrdkCUhpRSlGgVTegDaBZHQKD59ZVXFLp1fZQoaAZoCWgPQwh4tHHEWmp2QJSGlFKUaBVN6ANoFkdAoPnyXjU/fXV9lChoBmgJaA9DCN83vvaMrXZAlIaUUpRoFU3oA2gWR0ChCHUth/iHdX2UKGgGaAloD0MIOh4zUFl/dkCUhpRSlGgVTegDaBZHQKEIcX7+DOF1fZQoaAZoCWgPQwh55XrbDJF2QJSGlFKUaBVN6ANoFkdAoQhubCrLhnV9lChoBmgJaA9DCNfCLLSzinZAlIaUUpRoFU3oA2gWR0ChCGtvn8sMdWUu"
|
82 |
},
|
83 |
"ep_success_buffer": {
|
84 |
":type:": "<class 'collections.deque'>",
|
|
|
95 |
"n_epochs": 10,
|
96 |
"clip_range": {
|
97 |
":type:": "<class 'function'>",
|
98 |
+
":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
|
99 |
},
|
100 |
"clip_range_vf": null,
|
101 |
"normalize_advantage": true,
|
ppo-Swimmer-v3/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 87280
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92683882c52462ee4f66ca28a87a2071f1b98024eb9aeb333eea90a81e63da5d
|
3 |
size 87280
|
ppo-Swimmer-v3/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43070
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c3a460ccff6cda88f73391aeaa6e4d76ed52f9b73e7cbdc3f364ee8450424c1
|
3 |
size 43070
|
ppo-Swimmer-v3/system_info.txt
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
-
- OS: Linux-5.
|
2 |
-
- Python: 3.
|
3 |
- Stable-Baselines3: 1.7.0
|
4 |
- PyTorch: 1.13.1+cu117
|
5 |
- GPU Enabled: False
|
6 |
-
- Numpy: 1.
|
7 |
- Gym: 0.21.0
|
|
|
1 |
+
- OS: Linux-5.10.0-20-cloud-amd64-x86_64-with-glibc2.31 # 1 SMP Debian 5.10.158-2 (2022-12-13)
|
2 |
+
- Python: 3.9.2
|
3 |
- Stable-Baselines3: 1.7.0
|
4 |
- PyTorch: 1.13.1+cu117
|
5 |
- GPU Enabled: False
|
6 |
+
- Numpy: 1.24.1
|
7 |
- Gym: 0.21.0
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf848ac0c087f299e24d2e8c38b29508b7fc34c4f2ceeb36d2df24d0f69035ef
|
3 |
+
size 1422054
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 366.7220337, "std_reward": 0.6844751029888642, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-01-17T11:49:19.302237"}
|
train_eval_metrics.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ae218db88e3aff350507ba2a75479f3d4a2ea104c3305d161120890e6dadf4e
|
3 |
+
size 42875
|
vec_normalize.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f23a17e06f188b9b7bb976cadca53bf241a89e2193ca03872e4fada69ced049
|
3 |
+
size 4552
|