Quentin Gallouédec commited on
Commit
d64f459
·
1 Parent(s): 3befa29

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: CartpoleDMC-v0
17
  metrics:
18
  - type: mean_reward
19
- value: 991.74 +/- 0.45
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -62,7 +62,12 @@ python -m rl_zoo3.push_to_hub --algo ddpg --env CartpoleDMC-v0 -f logs/ -orga qg
62
 
63
  ## Hyperparameters
64
  ```python
65
- OrderedDict([('n_timesteps', 1000000.0),
 
 
 
 
 
66
  ('policy', 'MlpPolicy'),
67
  ('policy_kwargs',
68
  'dict(net_arch=dict(pi=[300, 200], qf=[400, 300]))'),
 
16
  type: CartpoleDMC-v0
17
  metrics:
18
  - type: mean_reward
19
+ value: 885.50 +/- 4.94
20
  name: mean_reward
21
  verified: false
22
  ---
 
62
 
63
  ## Hyperparameters
64
  ```python
65
+ OrderedDict([('batch_size', 64),
66
+ ('gamma', 0.99),
67
+ ('learning_rate', 0.0001),
68
+ ('n_timesteps', 1000000.0),
69
+ ('noise_std', 0.3),
70
+ ('noise_type', 'ornstein-uhlenbeck'),
71
  ('policy', 'MlpPolicy'),
72
  ('policy_kwargs',
73
  'dict(net_arch=dict(pi=[300, 200], qf=[400, 300]))'),
args.yml CHANGED
@@ -10,11 +10,11 @@
10
  - - env_kwargs
11
  - null
12
  - - eval_episodes
13
- - 5
14
  - - eval_freq
15
  - 25000
16
  - - gym_packages
17
- - - dmc_gym
18
  - - hyperparams
19
  - null
20
  - - log_folder
@@ -24,7 +24,7 @@
24
  - - max_total_trials
25
  - null
26
  - - n_eval_envs
27
- - 1
28
  - - n_evaluations
29
  - null
30
  - - n_jobs
@@ -54,15 +54,15 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 1840051874
58
  - - storage
59
  - null
60
  - - study_name
61
  - null
62
  - - tensorboard_log
63
- - ''
64
  - - track
65
- - false
66
  - - trained_agent
67
  - ''
68
  - - truncate_last_trajectory
@@ -74,9 +74,9 @@
74
  - - verbose
75
  - 1
76
  - - wandb_entity
77
- - null
78
  - - wandb_project_name
79
- - sb3
80
  - - wandb_tags
81
  - []
82
  - - yaml_file
 
10
  - - env_kwargs
11
  - null
12
  - - eval_episodes
13
+ - 20
14
  - - eval_freq
15
  - 25000
16
  - - gym_packages
17
+ - []
18
  - - hyperparams
19
  - null
20
  - - log_folder
 
24
  - - max_total_trials
25
  - null
26
  - - n_eval_envs
27
+ - 5
28
  - - n_evaluations
29
  - null
30
  - - n_jobs
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 3757117300
58
  - - storage
59
  - null
60
  - - study_name
61
  - null
62
  - - tensorboard_log
63
+ - runs/CartpoleDMC-v0__ddpg__3757117300__1673811016
64
  - - track
65
+ - true
66
  - - trained_agent
67
  - ''
68
  - - truncate_last_trajectory
 
74
  - - verbose
75
  - 1
76
  - - wandb_entity
77
+ - qgallouedec
78
  - - wandb_project_name
79
+ - dmc
80
  - - wandb_tags
81
  - []
82
  - - yaml_file
config.yml CHANGED
@@ -1,6 +1,16 @@
1
  !!python/object/apply:collections.OrderedDict
2
- - - - n_timesteps
 
 
 
 
 
 
3
  - 1000000.0
 
 
 
 
4
  - - policy
5
  - MlpPolicy
6
  - - policy_kwargs
 
1
  !!python/object/apply:collections.OrderedDict
2
+ - - - batch_size
3
+ - 64
4
+ - - gamma
5
+ - 0.99
6
+ - - learning_rate
7
+ - 0.0001
8
+ - - n_timesteps
9
  - 1000000.0
10
+ - - noise_std
11
+ - 0.3
12
+ - - noise_type
13
+ - ornstein-uhlenbeck
14
  - - policy
15
  - MlpPolicy
16
  - - policy_kwargs
ddpg-CartpoleDMC-v0.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:923cb4e841cb805d69a220f0c0498569eb2abfb1a3713001d96a7662b47f5826
3
- size 3010029
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:877cd406d523ea85172a4a93ff71c81e540dec32903d4bc68f23d8a1f8873e9a
3
+ size 3011980
ddpg-CartpoleDMC-v0/actor.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb20b1fe7bab4e0da2512800c8914f14964df922fc5e0eac9e6ab98deefea832
3
  size 502319
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:166c4143263a24cdd9d3cd802ff4559bff80a9b7965a1a7d7e73ebc2a5428b3b
3
  size 502319
ddpg-CartpoleDMC-v0/critic.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d120ee30a9e4a1c5c8d20f75573f83f7ad0261a31f55c9bb2ca16f22df0c6441
3
  size 991855
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b00f7c9cecf7772b2df007c1577f2f50d5b7e298708baed00becbb269abe6a3f
3
  size 991855
ddpg-CartpoleDMC-v0/data CHANGED
@@ -4,16 +4,16 @@
4
  ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnRkMy5wb2xpY2llc5SMCVREM1BvbGljeZSTlC4=",
5
  "__module__": "stable_baselines3.td3.policies",
6
  "__doc__": "\n Policy class (with both actor and critic) for TD3.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
7
- "__init__": "<function TD3Policy.__init__ at 0x153e1c700>",
8
- "_build": "<function TD3Policy._build at 0x153e1c790>",
9
- "_get_constructor_parameters": "<function TD3Policy._get_constructor_parameters at 0x153e1c820>",
10
- "make_actor": "<function TD3Policy.make_actor at 0x153e1c8b0>",
11
- "make_critic": "<function TD3Policy.make_critic at 0x153e1c940>",
12
- "forward": "<function TD3Policy.forward at 0x153e1c9d0>",
13
- "_predict": "<function TD3Policy._predict at 0x153e1ca60>",
14
- "set_training_mode": "<function TD3Policy.set_training_mode at 0x153e1caf0>",
15
  "__abstractmethods__": "frozenset()",
16
- "_abc_impl": "<_abc._abc_data object at 0x153e15e80>"
17
  },
18
  "verbose": 1,
19
  "policy_kwargs": {
@@ -31,7 +31,7 @@
31
  },
32
  "observation_space": {
33
  ":type:": "<class 'gym.spaces.box.Box'>",
34
- ":serialized:": "gAWVMgwAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBYWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWFAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/5RoC0sFhZSMAUOUdJRSlIwEaGlnaJRoEyiWFAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAf5RoC0sFhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolgUAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBYWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYFAAAAAAAAAAAAAAAAlGgiSwWFlGgWdJRSlIwKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwSX19yYW5kb21zdGF0ZV9jdG9ylJOUjAdNVDE5OTM3lGgujBRfX2JpdF9nZW5lcmF0b3JfY3RvcpSTlIaUUpR9lCiMDWJpdF9nZW5lcmF0b3KUjAdNVDE5OTM3lIwFc3RhdGWUfZQojANrZXmUaBMolsAJAAAAAAAAAAAAgPyvMR0jzuf33p6KWaKEEdF5TV9qkgLWaKbF34cjJHvwV92wv7gsUSLwr38i0G9vi5NBuuqlN7ZDGBuAz11m0vRkDoDT2qad2gr2brCw3sJ3Z8LPQWWpTA5HgiW7bdTJv/rPpwK+PM0XYOiJ9Cn8i+eSbMXWZKbGrRQeGevQ7XoO8js1VHts1JZFRpNbW+8zjvREq5rEvA508h4tgqAENKa2PKr0+fb13bxaQJ5LH5r1loSfaQfdt18AJKtKHGhLEpoQf3DC3ZBc6v7hmMiAzCLa1T6oaEPs8hlPz/tJ/Hksnh4M0xlxZQLRgWdBADXYG8uvdD/eYl+JWWnl/K7RI4u+L/r925+sqYLxFwmbtJ3znMSo16z78K45NNA7/XSqGJtCXJ5PNETzBl+1SB8Vwv1wooQK5SkbT/WHiorzJ+V5042SemA2NPSFHRudsSDKfjX4xq2biVUmFwXmzkoVvoVMSnRM6RkdmmGn3/rKdFq3noR43w9DrgUXzcwrpQ6QF4z/ScmAUgTd/rP1+3kiK6O6woQzn1SBALDlsNa1L6yg5OCvnd8QK3Kivaeu9ukWxE/Z/9vfdlEtIXkCFj0h/fO7h0GO/M/VVQ3nVNpZblVdLPbRwXS/RhQUCKRVwUbYod1vipOG+JGSIb/TasYogZKxDd+m++1oaQBCFDK8W0jlYvxowxJnBJMDAN7irQP68T8uULTs8CeiePBDpVnx1HaEPHGHJDpscId/yokrdKUvJQ2FJzbjBXs/owDC48zyt3eHXuJCU/nduRXLDgrD5glYLoLwBdjWkLmv+Vy7zCWYnhQsq7FLQeczzeNYSI9KoWmHZ4pEy1DOJAxOTQi1pDzEBpplUOaOtzTxRxZnq++o5o6yGqSvZUMkXe5vk/RfGp8JQz0lVR74LczTZqWPQuPwGi6AXb2d8ICqTlAzPfRQyxEEI+DFhIdvIptSOfTplM1CK1liQYSK9q4vVc6xJC/C4tqNYasLpaNPGfJIKD+yPN1U9Htn34+kh4h1ctLkDEQZtmSl4OBGmMvZHB4fQie0PasmUuOBcanGYIfBFh2SsdXuRol2JvGtSjJbS6zAZl4pWjI/PVHxhB5V7zK/mjwdgYy2jdCu9u5KJBy4DRvsOPzOLU+tUtE8x1tvcR2e+SXwSz5G3AVyn2xsMxarZJttX5ZkX9RXkopgRTWMHUIwt6/sZ6kA/EuengjqFAeKw1RhbNDH1S7K8pwlRpvHbYCogHS80aC0PxxbCWzsPlAUPqopyD5XwKi23/NVvvP3YeY7DzUGMyHdj2JxDwBEjDgPI+2dRohqBoDVziR4g0O0f/y3rP0bMGY4AJInnHdu5sSyfIAvcL1BKGcnDF2FwBwk75wh/UfMSU2LAbSqGAMaeMD4jLhR/H4zZOAFOzHptaVyMx1t4hu17PmHnfWZT/FYyFV4AjXMbgpuryRj9vl+a0hw8VpeaUz9RDSWUDWTsFNnwXqTYIOV3/44ESj6ZP4Fv9HzCUPrXkN4QD4zVYskNCQWDeBljMgfTFk8lmmE5hHCK9szpeGZcgCAc5DqeyB3qg09CFJWkACCSHmeHwKF8FeCWlE4pYHfdxy0jTiK4QjLLWNftj16KNNHPnMmZjoc53m0X+VHzM+dzBruRQ5W94RN9D+YNcIPqs13zsNCoJQxxYlH6lDzdGDs/sefpfjqd/oxKHERr4fnWzxTVuQXmEJArYO67gOljuEkG3XKS/AgiVTogyk4AIop+klB7Q4HDzfau/IwAdcoYAMViijMrtoS2cjLe6RkQNp/+oRGqkRHHQlbzqG7p+rNOfUyPPUZTgz5bMoIXLHwn9Uv/WWHayNq7WgMCegypVBgR6Rw9xj7wJhyAslYuPlx47HhzFPT5EEUtnlkp6INo646+tDpSkR3PM3uuvNT0SkOUDluB3f74XypKRj3xyCPRu2t3C0vlCI54t0ICLHaz+ijbHHpjADIq4nhNvOTU/aud4o8s2dUBoQ35K3Tm7B3IcDgFtCaflDL4YOPfmrI6DHz5skf01V5Qa5W2yWl8B5qmYQ5ow17403FaKrRKMEZSgsEUAXZoQRXtlusyr/CW0BQG5wicpFWbCuOsDfSZZXu7CUAuv6421q8Aqt/GkPkISAl6AcnTPk3ufG8ZaLl8lRQmD3w5k8vfRXi7MM/vPduBfdyYpgwc5CpcoSoWvBmoh0WDO4G+yvA9inNrZDeDImKQxXgnyJLm1fKPo9U/L+/i1D3D+Oi8ab1io4CYXGafde5kROQudxsRhqDzqodjE6PsIbfxd855SV7WF0MArI9aQfa2LUvpddtRkA8l12mtPDdi+zkoWbMx3i5sRjoAUg0ikCKGXaaC/yYN/WwDZl+XpYYVuSXE1IRswv6KmKiJHzbjVKiXNPFfzpRDemi7x3TNfE6Ihya4ZR9yNpHpWZuxBJl8tmG3xuzpPUVYPGbdC42BWI9Dd5SWFUqTDgU6GZTgif1iht2Iz/IciXG3AwrO9F96WUp6DbXaiDAVm/YJjfVgtWlbOA6vfj9SjUFbGYOj7XudraSz7Q5jC34Bc9ff/O05mlbOreThcMLQrxfOG9PQJEjxEWQ/ZL1QpJH2oi6gAqeEkZmOhKXJ/xOX3GWLFjx7jgv96KZPm15M0raA72hy1eZo2AymbeSIFYdgiCnvQ+zhS7h93oEW+1W1ViAAjn5mXHIgfQE/fRXzH3flm1TU0NleaaKR9ZpLHEugFllAFzHY+PzNJsCcr92SYeFEIZ5/O6K8wEaIj9kRSnxOr5vcXcyteEtMuASGiUYzfU+jp7U7pqvg4x7Td/1KmoR6gS5F+0I0ERTlsqzGlbF7Ni0zf1MNevodEqDQRnbNbnwmC79JB1E4jO7IN7atEYt2gCM3PTTJaDdJrzS44e0YympSqOU3i3YCKUEejxP/X6WohfZQEcV3nfsFOH0QJugsGMed3bbfE0+jyGofpJBXbgLkNHYvUSci9xp+TD9AYHcjl4dPcBH1o3sqM5tWlGNUaq7rgUVHrnIUh1C1wus+PG6bVe6/yQDg1yIAQQ9g0nwmxGTfFV+qfA3LLbmdQ58pGPnsBvxRAOHPblPR+N6t619+IXeXTGza2SyimwHo+gPdP4k9StVUZHPBiRJiiBDXxbXm5ankcnvqzaFZ1o3zmCi03R5gTeoiJr4NA681tZgpVJsxgW2po6c2NdNwoBZPoXzcN0wJk38Z23dQKQELeUaXPNUzimTHfKhyGPM0HIkK8cUNc9Z8jGHfFRh2RwBMorVqgzR5SrMXP+4CsKnv3qhR8T87fCSbBpnSu62wFYDvUPLm27JMIo+z/U0QE6nlGgIjAJ1NJSJiIeUUpQoSwNoDE5OTkr/////Sv////9LAHSUYk1wAoWUaBZ0lFKUjANwb3OUTXACdYwJaGFzX2dhdXNzlEsAjAVnYXVzc5RHAAAAAAAAAAB1YnViLg==",
35
  "dtype": "float32",
36
  "_shape": [
37
  5
@@ -60,13 +60,25 @@
60
  "_total_timesteps": 1000000,
61
  "_num_timesteps_at_start": 0,
62
  "seed": 0,
63
- "action_noise": null,
64
- "start_time": 1673793870909720000,
65
- "learning_rate": 0.001,
66
- "tensorboard_log": null,
 
 
 
 
 
 
 
 
 
 
 
 
67
  "lr_schedule": {
68
  ":type:": "<class 'function'>",
69
- ":serialized:": "gAWV+QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMYy9Vc2Vycy9xdWVudGluZ2FsbG91ZWRlYy9kbWNfZ3ltL2Vudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMYy9Vc2Vycy9xdWVudGluZ2FsbG91ZWRlYy9kbWNfZ3ltL2Vudi9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/UGJN0vGp/IWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
70
  },
71
  "_last_obs": null,
72
  "_last_episode_starts": {
@@ -75,7 +87,7 @@
75
  },
76
  "_last_original_obs": {
77
  ":type:": "<class 'numpy.ndarray'>",
78
- ":serialized:": "gAWViQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYUAAAAAAAAAOnQ376k/38/exNZu9j9Tb15GzE8lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksBSwWGlIwBQ5R0lFKULg=="
79
  },
80
  "_episode_num": 1000,
81
  "use_sde": false,
@@ -83,7 +95,7 @@
83
  "_current_progress_remaining": 0.0,
84
  "ep_info_buffer": {
85
  ":type:": "<class 'collections.deque'>",
86
- ":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIborHRfUzj0CUhpRSlIwBbJRN6AOMAXSUR0CjoaoHC4z8dX2UKGgGaAloD0MIlbn5RvR7iUCUhpRSlGgVTegDaBZHQKOnd8l5WzZ1fZQoaAZoCWgPQwi8XS9NUYyIQJSGlFKUaBVN6ANoFkdAo60o4Ia99XV9lChoBmgJaA9DCMr+eRqw645AlIaUUpRoFU3oA2gWR0CjsuSp71IzdX2UKGgGaAloD0MIidNJtvrbjkCUhpRSlGgVTegDaBZHQKO4fkELYwt1fZQoaAZoCWgPQwj9LQH4JzyIQJSGlFKUaBVN6ANoFkdAo74TufEn9nV9lChoBmgJaA9DCK2E7pL4545AlIaUUpRoFU3oA2gWR0Cjw5em3vx6dX2UKGgGaAloD0MIC/Dd5s39jkCUhpRSlGgVTegDaBZHQKPJLo7FKkF1fZQoaAZoCWgPQwiRe7q6wyWPQJSGlFKUaBVN6ANoFkdAo867wYtQK3V9lChoBmgJaA9DCEoJwapaI49AlIaUUpRoFU3oA2gWR0Cj1FVmSQo1dX2UKGgGaAloD0MICvSJPClVi0CUhpRSlGgVTegDaBZHQKPZ6BT4tYl1fZQoaAZoCWgPQwhNaf0tga+OQJSGlFKUaBVN6ANoFkdAo998OmR/3HV9lChoBmgJaA9DCOCBAYTv9Y5AlIaUUpRoFU3oA2gWR0Cj5Qsz2vjfdX2UKGgGaAloD0MIR450BkbNeUCUhpRSlGgVTegDaBZHQKPqoCJXQt11fZQoaAZoCWgPQwjCTUaVAYqCQJSGlFKUaBVN6ANoFkdAo/Au9YfW+XV9lChoBmgJaA9DCOV8sffiJo9AlIaUUpRoFU3oA2gWR0Cj9bmO2iL3dX2UKGgGaAloD0MIwLFnz4VjgUCUhpRSlGgVTegDaBZHQKP7UtVaOgh1fZQoaAZoCWgPQwgjopi8gTuJQJSGlFKUaBVN6ANoFkdApADbofSx7nV9lChoBmgJaA9DCKpHGtyWNo9AlIaUUpRoFU3oA2gWR0CkBnFL39JjdX2UKGgGaAloD0MIs7PonSphhECUhpRSlGgVTegDaBZHQKQL+U0Nz8x1fZQoaAZoCWgPQwi0klZ8wyqPQJSGlFKUaBVN6ANoFkdApBGKbtqpLnV9lChoBmgJaA9DCLIRiNdVaYVAlIaUUpRoFU3oA2gWR0CkFxyKekHldX2UKGgGaAloD0MIHzAPmfI4j0CUhpRSlGgVTegDaBZHQKQcouq3mV91fZQoaAZoCWgPQwg6deWzvDePQJSGlFKUaBVN6ANoFkdApCIrBKtga3V9lChoBmgJaA9DCAkVHF6wyo1AlIaUUpRoFU3oA2gWR0CkJ8TZxrBTdX2UKGgGaAloD0MIXp1jQHbgjUCUhpRSlGgVTegDaBZHQKQvbmqYJE91fZQoaAZoCWgPQwiXqUnwhsOJQJSGlFKUaBVN6ANoFkdApDUDlYEGJXV9lChoBmgJaA9DCIYBS67i24xAlIaUUpRoFU3oA2gWR0CkOopxNqQBdX2UKGgGaAloD0MIFO0qpJzXjECUhpRSlGgVTegDaBZHQKRAFbNbC791fZQoaAZoCWgPQwhOX8/XbEmLQJSGlFKUaBVN6ANoFkdApEWdMh5gPXV9lChoBmgJaA9DCAg6WtWSRIdAlIaUUpRoFU3oA2gWR0CkSzMQd0aIdX2UKGgGaAloD0MII6DCESRAikCUhpRSlGgVTegDaBZHQKRQ3rLyMDR1fZQoaAZoCWgPQwiHGoUkc56LQJSGlFKUaBVN6ANoFkdApFZs5Qxes3V9lChoBmgJaA9DCILjMm7KHYpAlIaUUpRoFU3oA2gWR0CkW/+yiVSodX2UKGgGaAloD0MI4QfnUwf8i0CUhpRSlGgVTegDaBZHQKRhhNIK+i91fZQoaAZoCWgPQwjS4La2EHKHQJSGlFKUaBVN6ANoFkdApGcLG5tm+XV9lChoBmgJaA9DCEinrny2l4pAlIaUUpRoFU3oA2gWR0CkbJSXMQmNdX2UKGgGaAloD0MI0eY4t+nMjUCUhpRSlGgVTegDaBZHQKRyHtix3V11fZQoaAZoCWgPQwh6VWe1YDmPQJSGlFKUaBVN6ANoFkdApHekR+SbIHV9lChoBmgJaA9DCJGadjEtsYVAlIaUUpRoFU3oA2gWR0CkfTbn5i3HdX2UKGgGaAloD0MITp1HxZ9sjUCUhpRSlGgVTegDaBZHQKSCxJwKjSJ1fZQoaAZoCWgPQwgAOPbsOS6NQJSGlFKUaBVN6ANoFkdApIhZcVxjrnV9lChoBmgJaA9DCB2vQPQkMY9AlIaUUpRoFU3oA2gWR0CkjenWBjFydX2UKGgGaAloD0MIUAEwnqEyhUCUhpRSlGgVTegDaBZHQKSTfeVLSNR1fZQoaAZoCWgPQwhkWTDxJyiOQJSGlFKUaBVN6ANoFkdApJkW+AVfu3V9lChoBmgJaA9DCOHvF7NlUYxAlIaUUpRoFU3oA2gWR0CknqZ0KZ2IdX2UKGgGaAloD0MIFvw2xBh3iUCUhpRSlGgVTegDaBZHQKSkOouPFNt1fZQoaAZoCWgPQwjYZmMlhiOEQJSGlFKUaBVN6ANoFkdApKnFgF5fMXV9lChoBmgJaA9DCEt319kwXYNAlIaUUpRoFU3oA2gWR0Ckr1F9Sde6dX2UKGgGaAloD0MITgte9LU3j0CUhpRSlGgVTegDaBZHQKS054DcM3J1fZQoaAZoCWgPQwjKi0zALy6PQJSGlFKUaBVN6ANoFkdApLx/420iQnV9lChoBmgJaA9DCBn/PuNiropAlIaUUpRoFU3oA2gWR0CkwkewcHW0dX2UKGgGaAloD0MIR3L5DyndhkCUhpRSlGgVTegDaBZHQKTH+20iQkp1fZQoaAZoCWgPQwjKoxthsRqPQJSGlFKUaBVN6ANoFkdApM2hN7BwdnV9lChoBmgJaA9DCIGTbeCOOY9AlIaUUpRoFU3oA2gWR0Ck0zTefqX4dX2UKGgGaAloD0MId0zdlb03jUCUhpRSlGgVTegDaBZHQKTYvi7TUiJ1fZQoaAZoCWgPQwhP6svSToiKQJSGlFKUaBVN6ANoFkdApN5ETcqOLnV9lChoBmgJaA9DCB2PGagsAo1AlIaUUpRoFU3oA2gWR0Ck5CIw/PgOdX2UKGgGaAloD0MI5gMCnQk8j0CUhpRSlGgVTegDaBZHQKTqBU1hsqJ1fZQoaAZoCWgPQwgqHEEqheyKQJSGlFKUaBVN6ANoFkdApO+4A+6iCnV9lChoBmgJaA9DCKA1P/5yKI1AlIaUUpRoFU3oA2gWR0Ck9UGoR7JGdX2UKGgGaAloD0MIBYpYxHA5jkCUhpRSlGgVTegDaBZHQKT61o0Q9Rt1fZQoaAZoCWgPQwinXOFdDmmFQJSGlFKUaBVN6ANoFkdApQBkQVbiZXV9lChoBmgJaA9DCCBgrdoVMYpAlIaUUpRoFU3oA2gWR0ClBfmb9ZRsdX2UKGgGaAloD0MIK76h8Nmkh0CUhpRSlGgVTegDaBZHQKULkt6HCXR1fZQoaAZoCWgPQwh5zhYQWsSJQJSGlFKUaBVN6ANoFkdApREar/82rHV9lChoBmgJaA9DCP9aXrm+54tAlIaUUpRoFU3oA2gWR0ClFqBoM8YAdX2UKGgGaAloD0MISwSqf3ARjECUhpRSlGgVTegDaBZHQKUcKLYPGyZ1fZQoaAZoCWgPQwimgLT/geKJQJSGlFKUaBVN6ANoFkdApSHDvqkdm3V9lChoBmgJaA9DCC/3yVEgSYdAlIaUUpRoFU3oA2gWR0ClJ04sunMudX2UKGgGaAloD0MIUu4+x4e9hUCUhpRSlGgVTegDaBZHQKUs5Wy1NQF1fZQoaAZoCWgPQwiGqphKX4yKQJSGlFKUaBVN6ANoFkdApTJ5m03OwHV9lChoBmgJaA9DCPnaM0siuYJAlIaUUpRoFU3oA2gWR0ClOAQHAymAdX2UKGgGaAloD0MIUmNCzAUxjECUhpRSlGgVTegDaBZHQKU9jeQdS2p1fZQoaAZoCWgPQwhhNgGGpSmGQJSGlFKUaBVN6ANoFkdApUMSyt3fRHV9lChoBmgJaA9DCF3Cobe4E41AlIaUUpRoFU3oA2gWR0ClSmdbgTAWdX2UKGgGaAloD0MIfAxWnMq1jECUhpRSlGgVTegDaBZHQKVQN/hl18t1fZQoaAZoCWgPQwjFdYwrLpGGQJSGlFKUaBVN6ANoFkdApVXnB+F10XV9lChoBmgJaA9DCIfCZ+vA+41AlIaUUpRoFU3oA2gWR0ClW5FGPPszdX2UKGgGaAloD0MImWclrZhbiUCUhpRSlGgVTegDaBZHQKVhJ5AQg9x1fZQoaAZoCWgPQwiaIyu/bLyJQJSGlFKUaBVN6ANoFkdApWawAS39aXV9lChoBmgJaA9DCOXsndHWuItAlIaUUpRoFU3oA2gWR0ClbDVvddmhdX2UKGgGaAloD0MIUbzK2sZGh0CUhpRSlGgVTegDaBZHQKVxyYekpJB1fZQoaAZoCWgPQwhbsirCrUyDQJSGlFKUaBVN6ANoFkdApXddbiZOSHV9lChoBmgJaA9DCKVPq+hPRIZAlIaUUpRoFU3oA2gWR0ClfPWyLQ5WdX2UKGgGaAloD0MIC2E1lnCXhkCUhpRSlGgVTegDaBZHQKWCi6JZW7x1fZQoaAZoCWgPQwj/sRAdonWOQJSGlFKUaBVN6ANoFkdApYgQbQ1JlXV9lChoBmgJaA9DCLrYtFLoCI5AlIaUUpRoFU3oA2gWR0CljaOpS75EdX2UKGgGaAloD0MIrJFdaVljjECUhpRSlGgVTegDaBZHQKWTLzcynDR1fZQoaAZoCWgPQwjg9gSJrcyKQJSGlFKUaBVN6ANoFkdApZi2B8QZoHV9lChoBmgJaA9DCP8iaMxk24NAlIaUUpRoFU3oA2gWR0ClnjsAeaKDdX2UKGgGaAloD0MIURa+vtYRh0CUhpRSlGgVTegDaBZHQKWj0APNFBp1fZQoaAZoCWgPQwghIjXt4q2CQJSGlFKUaBVN6ANoFkdApalbc9GI9HV9lChoBmgJaA9DCMRafAqA541AlIaUUpRoFU3oA2gWR0ClruQOnVG1dX2UKGgGaAloD0MIm3Eaoqq1jECUhpRSlGgVTegDaBZHQKW0fDUmUnp1fZQoaAZoCWgPQwiEm4wqw+WKQJSGlFKUaBVN6ANoFkdApboUejmCAnV9lChoBmgJaA9DCF9cqtJWD4tAlIaUUpRoFU3oA2gWR0Clv6GYBvJjdX2UKGgGaAloD0MIhqxu9ZxmiUCUhpRSlGgVTegDaBZHQKXFOtPpIMB1fZQoaAZoCWgPQwjvHTUmZNqIQJSGlFKUaBVN6ANoFkdApcrC8OCoTHV9lChoBmgJaA9DCNAM4gObgI1AlIaUUpRoFU3oA2gWR0Cl0E0EHMUzdWUu"
87
  },
88
  "ep_success_buffer": {
89
  ":type:": "<class 'collections.deque'>",
@@ -91,7 +103,7 @@
91
  },
92
  "_n_updates": 1000000,
93
  "buffer_size": 1,
94
- "batch_size": 100,
95
  "learning_starts": 100,
96
  "tau": 0.005,
97
  "gamma": 0.99,
@@ -102,12 +114,12 @@
102
  ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
103
  "__module__": "stable_baselines3.common.buffers",
104
  "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
105
- "__init__": "<function ReplayBuffer.__init__ at 0x153e0b250>",
106
- "add": "<function ReplayBuffer.add at 0x153e0b2e0>",
107
- "sample": "<function ReplayBuffer.sample at 0x153e0b370>",
108
- "_get_samples": "<function ReplayBuffer._get_samples at 0x153e0b400>",
109
  "__abstractmethods__": "frozenset()",
110
- "_abc_impl": "<_abc._abc_data object at 0x153e03f40>"
111
  },
112
  "replay_buffer_kwargs": {},
113
  "train_freq": {
 
4
  ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnRkMy5wb2xpY2llc5SMCVREM1BvbGljeZSTlC4=",
5
  "__module__": "stable_baselines3.td3.policies",
6
  "__doc__": "\n Policy class (with both actor and critic) for TD3.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
7
+ "__init__": "<function TD3Policy.__init__ at 0x139898280>",
8
+ "_build": "<function TD3Policy._build at 0x139898310>",
9
+ "_get_constructor_parameters": "<function TD3Policy._get_constructor_parameters at 0x1398983a0>",
10
+ "make_actor": "<function TD3Policy.make_actor at 0x139898430>",
11
+ "make_critic": "<function TD3Policy.make_critic at 0x1398984c0>",
12
+ "forward": "<function TD3Policy.forward at 0x139898550>",
13
+ "_predict": "<function TD3Policy._predict at 0x1398985e0>",
14
+ "set_training_mode": "<function TD3Policy.set_training_mode at 0x139898670>",
15
  "__abstractmethods__": "frozenset()",
16
+ "_abc_impl": "<_abc._abc_data object at 0x139892d80>"
17
  },
18
  "verbose": 1,
19
  "policy_kwargs": {
 
31
  },
32
  "observation_space": {
33
  ":type:": "<class 'gym.spaces.box.Box'>",
34
+ ":serialized:": "gAWVMgwAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBYWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWFAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/5RoC0sFhZSMAUOUdJRSlIwEaGlnaJRoEyiWFAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAf5RoC0sFhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolgUAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBYWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYFAAAAAAAAAAAAAAAAlGgiSwWFlGgWdJRSlIwKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwSX19yYW5kb21zdGF0ZV9jdG9ylJOUjAdNVDE5OTM3lGgujBRfX2JpdF9nZW5lcmF0b3JfY3RvcpSTlIaUUpR9lCiMDWJpdF9nZW5lcmF0b3KUjAdNVDE5OTM3lIwFc3RhdGWUfZQojANrZXmUaBMolsAJAAAAAAAAAAAAgCJI3W7TaYNo2fkCQTqkGso9PgD+gpj29/M/d+fXv7mxGN3/7aYgZyvV0Ye9Mqg636TmZE5bw2bcCxNeR8TyCBDpnUCPLrx7pKMgwAia7+EDxmTe1NYhO87+D5+vZcW2uMYIJE+6AI/OH6W3CCHYBR11hSSk3DFQo4K+FU7SurMp04MDN6NiNxRwecmWCuT2Q+JWuRXfnmbwrzFpuTQcnNAIdKd++P+QBG1UB+Uduc/saNr7TqOCD+pzMlEeyYTEbDegZvdCaXLWDoXO5FnPoSmO3TtOWUbLuE/F7yk4DT7ZPXKQtaF5n2YfUr8lL67nyWiQUkGk76JLL5uWXFW/i96GnepHUQ1/3EBqSAfbej/Qvbzt4joABFVtCIVVfSSLFxwyzLQ+se3Yp+jaNpm+ikeEUvP2OGCbBDLAtFWwver8m0VDA71UCYGErR0oumNjhtoAOeNzd/1QZU4iaVptCrkqZvcsS8MGAWmN3NO3zQBvEBrHr2s9oWEg1uLUwsyKwp3Ej3HciQGxOQ5+biDZhB8VLLl5RyiwJ+9S/ouy40Z3vBEFhfLASbWQAo2+5lsHDduWiIw+ALN2ooo4bfAFCk9UDac3plWLrtp9le1WUnu3bXM+gCtX0D2tvPg+EnEnodd0g3YprVxiDrQ9rEAggJtpC0r/JUbFkYXweRPxsx4Oeil7IVthzxTx7wDWbCPUrwvtBuYrSDD264NaeNeW2plKz69oH0zjZJf3fuK2tmM4Qi6hlKtNQCDB4GjgtEJcFyfzsYGMpFktH6A8IaEXFj7DbVUGkPdGLod9aXyFUoyzz/LM2HvGeiAFJ74L6vSsn56LFRtPI8IZa1LZlDUamoT8PxQ+nO0rMzoSPydacC/X16q4F3KTKdxRV3YOUg+7hr8pPUXAY8fKVMOC3DcK4rvdXv2i1HhuzPdGKep18KpcYboGB9YdRUfD3xFJzTj/kdWKEtIkZKArroo4WQvXK9m2O3wcasi7QvfDlEaI1P22R10kBQmIZIJEEevbBu+vAJVoT/vuYGCLT4BO7lnqtfkJCsq97mQoenp99p42vFF/79dvNbnA6u041MH3dwoahQCYbQZ1I6fYDqNz7Ga5hscD1zr1pxTYbuP/YdFgun+BM+MayFxilRd1scPzxmUVFGHawNZ/ZFFQuEwu2RyhweiDVCwi55NMfvWVB0xxdJZ/W6lCw7uNp73sfINNREqc3tt7myYn4Zx7PBOGLk2XKMJdsnIG22qn8DcWtX7B+sycFIA1bRe1tGAn3ndOOheba4LnEHg4Z5QXwlI2ri70aSBPn69o756Rc06HVYmYuKKfNl2XUlknUPXc+JoFHRIWTucRnZVGbY4yWec2J1vX3K5Sz+8sXU1aR17I8HxiawgaJ1tgggxY38Pf8SVlwL98FVa3VqjYSG8CS1kdwGeP/w+4Ru4vNX2RlOgMoEnD/9WZAwHkmPdtngENSd826EkfJL8zh8wv+gGbBEHuw2H0w3UP70+IvLePRKaYIBXifNMa+5QtAlLBzO+fN46O/m6l/OCi7RlxJR7bqHr4KkMksYw76XCA68xzLIf8cqaI2+zw2A+xPkNDyXoRPW2abw9HSOVPQWnHkFjT7xUOhjXtc30ICmIgXeHBNwndFpBzNncjnLCVawy3tZWDjgUHdoiP4wDY9INwXMzMy6dU2rbHpLcUJowkcm7gm2TZNdSS1JeA7oOj4J8r1pvm0mOvJvY7L/u5FppT8mU2Q2mEBYXA3o5TXiBmWLkL3tDZjKWvRCEdjergoQY4l/JSv0mx37ZlARhQMs8QA2XmfCRgGZq2s6/luASo4ZCOt7IE/ZuxkrpNh68hkbmDyEYAoBU3pCLojBU8aLJDIj1TbojVL/9Eg3EQ2EOvkDLO+pNjHVsZmOWeCVx+ZqjO1oaDZZ4BRSXQzSlOGR4RMzTw39kYKUxR1lhvMQbcY8tNLSEREALhIwBEd4jWk57ZWEgrYb0Az1KqsbJ7jLmYXO6hCEwoEThdFaJsMCoIX3IKVRp6sE1CRkwii25d/euBM0cwu3QkUIx7kVUi+HsjCP3gQzYmrGL6rSxdIB0i1FqVD9ph0Q/4j3vp8BXsg0vHJzaUkOb+6Oz4ZHyPHYw3msSvjEjVUldb4s8sodV/C79foirUAiXvOjHM3aYDFABKbzZdeUnLL/mG5+wVX9ef93ssJUxK8ElWb17RVrY8HAWLErz1hOp1TQ8Ew/tcVINrcivojfmlrYgNSKgnYd5w4q4IVdcM0hRZJW1I6QUl8OdYaT/88gCfOpXJsv9Cc/6HYbl3HLFjpsBRo2I1TUZ1RQbMiQSXlrF9ff6B27FUwbG01cAac66rIu4H66pNt5MRvtHsgW8P71ULDDqFdZfNr3aUi2tNZ0CJ/vC8g15/2DBfitzcSs30blUDaXoKmDbTnbzvsc45rpv0vZf5IRcbtWe4DW3UB0bFUIPlI4FdinM+OHOs3Z2ICYrQX1IRt7+/JK2iAIpLRp34P0ZRUUuYTpvlI2vT3p0EA6395THuXhqvKtVcS21MfiktsCT4K3HanLLnJmqQ4vg0jUa6pPRNdJuAzkYMCZMrzoMKBhmeHBRqg9d7nc7rIhMWyFPRvXfcMsW5vJt9QQ6mkItDxKlJqoGfeGA0zrxoXGkScZvO/BcB/7Yt1/X2GIzuTV6rrImmPBsZFgSEoQE7ySUAW1SubvRTSTzB8yWOzHZDtROzA+gE/ZNVVuSibZbhLvvehU0nFZKlTM3NaZon+XQegGgpMKKvdnWb3aD9tqIKGLAHdqAPah5QViwLM/X2xchqdCJ6W3P9lAFryrCRmjG3hBC+oPknkpqDchoTTxCjyzbgD8dT9s79WnPzP/S+Ob7kGyulItdPn10JqPB7E3nn+OG32aKG+z0dS0JCau7DZe6lI51TdzB96209Vz0vKTLJTztSeWSdF/PJZNkAQ4gqZ+RIMOnBvSET8BtdXVktZyTinZiNSYTN5sdJqIOyppvKv3Kg/xXPlRbROCtcF0sKOonlLIxATLypV5FCkWTLXYwIpsuLxkkEW5d9F0gc1DdiLMNamrcZFWdddtGGiQYolqtZN7bSg2jUyJCqWc++kcz4/AR8FSG4zwIF95A1OIMCisZ/RJGdTs2qzAOrErX0loqR7DgszURLK8VgP4fsta5Ksm/cyBybB34Pz/Gqe/yGMRkDfrT9va1MuJyhxf/wvCjwnuXrLeNs0Jh4rwUM+gfzjZGDW+IvzG2iAzH6rZFL37dnJULnz/jYGglC3cV6ljb0eZ40N5rK0VmpTVh41CAU9RTR9sdlCFXu01EWL1tfHwIee8vasEX3lGgIjAJ1NJSJiIeUUpQoSwNoDE5OTkr/////Sv////9LAHSUYk1wAoWUaBZ0lFKUjANwb3OUTXACdYwJaGFzX2dhdXNzlEsAjAVnYXVzc5RHAAAAAAAAAAB1YnViLg==",
35
  "dtype": "float32",
36
  "_shape": [
37
  5
 
60
  "_total_timesteps": 1000000,
61
  "_num_timesteps_at_start": 0,
62
  "seed": 0,
63
+ "action_noise": {
64
+ ":type:": "<class 'stable_baselines3.common.noise.OrnsteinUhlenbeckActionNoise'>",
65
+ ":serialized:": "gAWVVQEAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5ub2lzZZSMHE9ybnN0ZWluVWhsZW5iZWNrQWN0aW9uTm9pc2WUk5QpgZR9lCiMBl90aGV0YZRHP8MzMzMzMzOMA19tdZSMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYIAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksBhZSMAUOUdJRSlIwGX3NpZ21hlGgJKJYIAAAAAAAAADMzMzMzM9M/lGgQSwGFlGgUdJRSlIwDX2R0lEc/hHrhR64Ue4wNaW5pdGlhbF9ub2lzZZROjApub2lzZV9wcmV2lGgJKJYIAAAAAAAAAAAAAAAAAAAAlGgQSwGFlGgUdJRSlHViLg==",
66
+ "_theta": 0.15,
67
+ "_mu": "[0.]",
68
+ "_sigma": "[0.3]",
69
+ "_dt": 0.01,
70
+ "initial_noise": null,
71
+ "noise_prev": "[0.]"
72
+ },
73
+ "start_time": 1673811020596785684,
74
+ "learning_rate": {
75
+ ":type:": "<class 'function'>",
76
+ ":serialized:": "gAWVCQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMay9ncGZzZHN3b3JrL3Byb2plY3RzL3JlY2gvdWxpL3VwZjgyc3AvZW52X2RtYy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgkMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxrL2dwZnNkc3dvcmsvcHJvamVjdHMvcmVjaC91bGkvdXBmODJzcC9lbnZfZG1jL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
77
+ },
78
+ "tensorboard_log": "runs/CartpoleDMC-v0__ddpg__3757117300__1673811016/CartpoleDMC-v0",
79
  "lr_schedule": {
80
  ":type:": "<class 'function'>",
81
+ ":serialized:": "gAWVCQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMay9ncGZzZHN3b3JrL3Byb2plY3RzL3JlY2gvdWxpL3VwZjgyc3AvZW52X2RtYy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgkMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxrL2dwZnNkc3dvcmsvcHJvamVjdHMvcmVjaC91bGkvdXBmODJzcC9lbnZfZG1jL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
82
  },
83
  "_last_obs": null,
84
  "_last_episode_starts": {
 
87
  },
88
  "_last_original_obs": {
89
  ":type:": "<class 'numpy.ndarray'>",
90
+ ":serialized:": "gAWViQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYUAAAAAAAAAF4seT/vRX4/JXntPbMYHb8I7ZU+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksBSwWGlIwBQ5R0lFKULg=="
91
  },
92
  "_episode_num": 1000,
93
  "use_sde": false,
 
95
  "_current_progress_remaining": 0.0,
96
  "ep_info_buffer": {
97
  ":type:": "<class 'collections.deque'>",
98
+ ":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIrKxtigc8jUCUhpRSlIwBbJRN6AOMAXSUR0DIWeA+yJKrdX2UKGgGaAloD0MIox03/M55jkCUhpRSlGgVTegDaBZHQMhhHExIre91fZQoaAZoCWgPQwgYl6q0hU+NQJSGlFKUaBVN6ANoFkdAyGiDqTKT0XV9lChoBmgJaA9DCDfjNEQVQ4tAlIaUUpRoFU3oA2gWR0DIb4AbsF+vdX2UKGgGaAloD0MIfR8OEoIOhkCUhpRSlGgVTegDaBZHQMh20Mr/bTN1fZQoaAZoCWgPQwg8bCIzV+KOQJSGlFKUaBVN6ANoFkdAyH48ow22onV9lChoBmgJaA9DCAjHLHvyoYdAlIaUUpRoFU3oA2gWR0DIhSVqcmShdX2UKGgGaAloD0MIVP1K5+PsjUCUhpRSlGgVTegDaBZHQMiMizz/ZNB1fZQoaAZoCWgPQwicTrLVJUWMQJSGlFKUaBVN6ANoFkdAyJNff+jubHV9lChoBmgJaA9DCJJ6T+V0uYRAlIaUUpRoFU3oA2gWR0DImd5uXNTtdX2UKGgGaAloD0MIinYVUh49h0CUhpRSlGgVTegDaBZHQMigtxIatLd1fZQoaAZoCWgPQwicNXhfFcaLQJSGlFKUaBVN6ANoFkdAyKd28/UvwnV9lChoBmgJaA9DCNIdxM70HYRAlIaUUpRoFU3oA2gWR0DIrgV8XvYwdX2UKGgGaAloD0MIhllo57TKekCUhpRSlGgVTegDaBZHQMi1dw0GeMB1fZQoaAZoCWgPQwiVu8/x8XKOQJSGlFKUaBVN6ANoFkdAyLzSz5XU6XV9lChoBmgJaA9DCEdzZOU34odAlIaUUpRoFU3oA2gWR0DIw/TDEWIodX2UKGgGaAloD0MIR1UTRD2/jECUhpRSlGgVTegDaBZHQMjLTiyhSLt1fZQoaAZoCWgPQwjpmV5iLKGDQJSGlFKUaBVN6ANoFkdAyNK3Nzr/sHV9lChoBmgJaA9DCBueXinLXYlAlIaUUpRoFU3oA2gWR0DI2b7Z8KG+dX2UKGgGaAloD0MIw552+IsHjUCUhpRSlGgVTegDaBZHQMjg8b2criF1fZQoaAZoCWgPQwgSUOEIstaGQJSGlFKUaBVN6ANoFkdAyOfHncL0BnV9lChoBmgJaA9DCBuEud3rfYxAlIaUUpRoFU3oA2gWR0DI7kc1TBIndX2UKGgGaAloD0MINEksKbeyiECUhpRSlGgVTegDaBZHQMj1IlbVz6t1fZQoaAZoCWgPQwhh4/p3nUCOQJSGlFKUaBVN6ANoFkdAyPvwV8kUsXV9lChoBmgJaA9DCHxinSpf04VAlIaUUpRoFU3oA2gWR0DJApc9U0emdX2UKGgGaAloD0MIP3PWp9zKjkCUhpRSlGgVTegDaBZHQMkPzjyOJch1fZQoaAZoCWgPQwipFDsaB9KOQJSGlFKUaBVN6ANoFkdAyRbp+GXXy3V9lChoBmgJaA9DCJPJqZ0hwIdAlIaUUpRoFU3oA2gWR0DJHkjdYW+HdX2UKGgGaAloD0MIx4Ds9W4wekCUhpRSlGgVTegDaBZHQMkluHmig011fZQoaAZoCWgPQwhsy4Cz9PKGQJSGlFKUaBVN6ANoFkdAySy+/47A+XV9lChoBmgJaA9DCD+O5sgKJo5AlIaUUpRoFU3oA2gWR0DJM/9j9XLedX2UKGgGaAloD0MI9WVpp0Yah0CUhpRSlGgVTegDaBZHQMk62w3YL9d1fZQoaAZoCWgPQwj4HFiOEBGMQJSGlFKUaBVN6ANoFkdAyUFxSXMQmXV9lChoBmgJaA9DCMdI9gj1YoNAlIaUUpRoFU3oA2gWR0DJSFAWxhUjdX2UKGgGaAloD0MIliNkIE87g0CUhpRSlGgVTegDaBZHQMlPPVlXiit1fZQoaAZoCWgPQwhHHogsEnCBQJSGlFKUaBVN6ANoFkdAyVX+CHRCyHV9lChoBmgJaA9DCAucbAPXEY5AlIaUUpRoFU3oA2gWR0DJXYU+kgwHdX2UKGgGaAloD0MIdH0fDpKai0CUhpRSlGgVTegDaBZHQMllEFCswL51fZQoaAZoCWgPQwjovwevHaaLQJSGlFKUaBVN6ANoFkdAyWxAOnVG1HV9lChoBmgJaA9DCGppboVwE4lAlIaUUpRoFU3oA2gWR0DJc8enO0LMdX2UKGgGaAloD0MI3gAz32H8jUCUhpRSlGgVTegDaBZHQMl7PzyauwJ1fZQoaAZoCWgPQwiTOCuiRjCDQJSGlFKUaBVN6ANoFkdAyYJrYTTOPnV9lChoBmgJaA9DCAJnKVmujolAlIaUUpRoFU3oA2gWR0DJiXncgyM2dX2UKGgGaAloD0MIRwTj4BLKjECUhpRSlGgVTegDaBZHQMmQa9joZAJ1fZQoaAZoCWgPQwjYRdEDv8KBQJSGlFKUaBVN6ANoFkdAyZcI7cwg1XV9lChoBmgJaA9DCJ8B9WaUr3pAlIaUUpRoFU3oA2gWR0DJnfLZtelbdX2UKGgGaAloD0MIEalpF5OjhUCUhpRSlGgVTegDaBZHQMmkkoP07Kd1fZQoaAZoCWgPQwjGM2jo32KNQJSGlFKUaBVN6ANoFkdAyavHxKg7HXV9lChoBmgJaA9DCJiJIqQOjYtAlIaUUpRoFU3oA2gWR0DJs0u6wt8NdX2UKGgGaAloD0MIYMrAAU3AgUCUhpRSlGgVTegDaBZHQMm6czjm0Vt1fZQoaAZoCWgPQwjJBWfwl7mFQJSGlFKUaBVN6ANoFkdAycfKiTMaCXV9lChoBmgJaA9DCEvK3efYw4pAlIaUUpRoFU3oA2gWR0DJz1ez0HyFdX2UKGgGaAloD0MIntFWJVERi0CUhpRSlGgVTegDaBZHQMnWkFlK9PF1fZQoaAZoCWgPQwj9hokGKQGHQJSGlFKUaBVN6ANoFkdAyd2JqrR0EHV9lChoBmgJaA9DCF+4c2FEWI5AlIaUUpRoFU3oA2gWR0DJ5BZY5ksjdX2UKGgGaAloD0MIhIO9iUGmikCUhpRSlGgVTegDaBZHQMnq+NpM6BB1fZQoaAZoCWgPQwha8KKvgI2KQJSGlFKUaBVN6ANoFkdAyfHdxlQMyHV9lChoBmgJaA9DCMmwijeSlopAlIaUUpRoFU3oA2gWR0DJ+Ckyad+YdX2UKGgGaAloD0MItTf4wiQrjECUhpRSlGgVTegDaBZHQMn/swaaTfR1fZQoaAZoCWgPQwjMe5xpovWKQJSGlFKUaBVN6ANoFkdAygdCTvAoHHV9lChoBmgJaA9DCHP3OT5agI5AlIaUUpRoFU3oA2gWR0DKDntJpWWAdX2UKGgGaAloD0MI8Z4Dy7Gxg0CUhpRSlGgVTegDaBZHQMoWDL6+FlF1fZQoaAZoCWgPQwiBzM6i1+yMQJSGlFKUaBVN6ANoFkdAyh2DUz9CNXV9lChoBmgJaA9DCMfw2M+iJ4hAlIaUUpRoFU3oA2gWR0DKJLRaLXMAdX2UKGgGaAloD0MIFxIwulxQikCUhpRSlGgVTegDaBZHQMor+n1e0HB1fZQoaAZoCWgPQwhvZYnO0oOEQJSGlFKUaBVN6ANoFkdAyjLqQf6oEXV9lChoBmgJaA9DCC7IluVLDopAlIaUUpRoFU3oA2gWR0DKOYVr433pdX2UKGgGaAloD0MIizVc5N5niUCUhpRSlGgVTegDaBZHQMpAcgEt/Wl1fZQoaAZoCWgPQwjxDYXPlmZ/QJSGlFKUaBVN6ANoFkdAykdljiGWU3V9lChoBmgJaA9DCKbydoRT5oJAlIaUUpRoFU3oA2gWR0DKTiC35N48dX2UKGgGaAloD0MIFf4MbzbMjECUhpRSlGgVTegDaBZHQMpVpRKg7HR1fZQoaAZoCWgPQwjj/iPTQe6LQJSGlFKUaBVN6ANoFkdAyl00YNy5qnV9lChoBmgJaA9DCMa/z7iw/YtAlIaUUpRoFU3oA2gWR0DKZF4nWrfcdX2UKGgGaAloD0MIxQPKplyigUCUhpRSlGgVTegDaBZHQMpr8MZP2wp1fZQoaAZoCWgPQwgx0/avTL6OQJSGlFKUaBVN6ANoFkdAynOEgnMMZ3V9lChoBmgJaA9DCFRweEFk7I1AlIaUUpRoFU3oA2gWR0DKgFMMCtA+dX2UKGgGaAloD0MIl6jeGpjcjkCUhpRSlGgVTegDaBZHQMqHSTJyQxN1fZQoaAZoCWgPQwjtEP+wJSaHQJSGlFKUaBVN6ANoFkdAyo3tK+SKWXV9lChoBmgJaA9DCAFNhA2vq45AlIaUUpRoFU3oA2gWR0DKlOLmGM4tdX2UKGgGaAloD0MIvVErTL8hjUCUhpRSlGgVTegDaBZHQMqb5IsiB5J1fZQoaAZoCWgPQwhlx0Yg3gWCQJSGlFKUaBVN6ANoFkdAyqLDYHPeHnV9lChoBmgJaA9DCKSOjqux7ItAlIaUUpRoFU3oA2gWR0DKqnExZdOZdX2UKGgGaAloD0MI6IU7F6Ymh0CUhpRSlGgVTegDaBZHQMqx8qNAC4l1fZQoaAZoCWgPQwj9SufDE0SLQJSGlFKUaBVN6ANoFkdAyrlB8VHnU3V9lChoBmgJaA9DCKUvhJxXnYlAlIaUUpRoFU3oA2gWR0DKwNgkgOjJdX2UKGgGaAloD0MIUP2DSCbih0CUhpRSlGgVTegDaBZHQMrIAFj/dZd1fZQoaAZoCWgPQwgB/FOqJDOHQJSGlFKUaBVN6ANoFkdAys+Ebn5i3HV9lChoBmgJaA9DCPfnoiHjM3tAlIaUUpRoFU3oA2gWR0DK1sdWS2YwdX2UKGgGaAloD0MIb7ckB8yjg0CUhpRSlGgVTegDaBZHQMreEmM4tHx1fZQoaAZoCWgPQwiXVdgMkJiKQJSGlFKUaBVN6ANoFkdAyuVwMnZ00XV9lChoBmgJaA9DCOTbuwY9oolAlIaUUpRoFU3oA2gWR0DK7GoFkhA4dX2UKGgGaAloD0MIdChDVcxbiECUhpRSlGgVTegDaBZHQMrwseJgssh1fZQoaAZoCWgPQwjJ/+Tv/ueKQJSGlFKUaBVN6ANoFkdAyvTmH31zyXV9lChoBmgJaA9DCF3Ed2LW4IpAlIaUUpRoFU3oA2gWR0DK+Rp6F/QTdX2UKGgGaAloD0MIEYsYdlgMiECUhpRSlGgVTegDaBZHQMr9TdJz1bt1fZQoaAZoCWgPQwiCOA8ncCOIQJSGlFKUaBVN6ANoFkdAywGCMpgCwXV9lChoBmgJaA9DCBajrrUXs4hAlIaUUpRoFU3oA2gWR0DLBbXf4yoGdX2UKGgGaAloD0MI+grSjIV7h0CUhpRSlGgVTegDaBZHQMsJ6PNFBpp1fZQoaAZoCWgPQwhm3T8WAjqJQJSGlFKUaBVN6ANoFkdAyw4cjfNzKnV9lChoBmgJaA9DCIeiQJ9ojYZAlIaUUpRoFU3oA2gWR0DLEk8zl90BdWUu"
99
  },
100
  "ep_success_buffer": {
101
  ":type:": "<class 'collections.deque'>",
 
103
  },
104
  "_n_updates": 1000000,
105
  "buffer_size": 1,
106
+ "batch_size": 64,
107
  "learning_starts": 100,
108
  "tau": 0.005,
109
  "gamma": 0.99,
 
114
  ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
115
  "__module__": "stable_baselines3.common.buffers",
116
  "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
117
+ "__init__": "<function ReplayBuffer.__init__ at 0x139896dd0>",
118
+ "add": "<function ReplayBuffer.add at 0x139896e60>",
119
+ "sample": "<function ReplayBuffer.sample at 0x139896ef0>",
120
+ "_get_samples": "<function ReplayBuffer._get_samples at 0x139896f80>",
121
  "__abstractmethods__": "frozenset()",
122
+ "_abc_impl": "<_abc._abc_data object at 0x139836280>"
123
  },
124
  "replay_buffer_kwargs": {},
125
  "train_freq": {
ddpg-CartpoleDMC-v0/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da847fad2037ddb02726800e4a0df41f4381cdeb2db097268415452192dbfc6e
3
  size 1492509
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2b4d0b8ccac39463f11616bef8492f3180debfd1e197a9a8023faf2072d6528
3
  size 1492509
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6e31e14f626aa13b39aa9599bbc2098dabbe353811f68cff712d31cbd29fca9
3
- size 126013
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:613f7d0e18c00bd0917ad26f69552b415640cd2300288ec5f3efab70698e7b45
3
+ size 156822
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 991.7419097999998, "std_reward": 0.45462611289097343, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-01-15T16:57:59.429907"}
 
1
+ {"mean_reward": 885.5004687999999, "std_reward": 4.93610187527313, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-01-16T08:50:36.963750"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e4938adfe4c1ee50bc2dc3f220e636d4cd5d641becf774bb40109a6b2bea90b
3
- size 32968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2ab4ce5419d6105f084e517a228f67bf79a341d2cc807c442d89f1739bd5c88
3
+ size 43170