sdpkjc committed on
Commit
4435bb6
1 Parent(s): 11badf2

pushing model

Browse files
This view is limited to 50 files because the commit contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +3 -3
  2. events.out.tfevents.1705723465.4090-171.2555519.0 → events.out.tfevents.1705726201.4090-171.2583911.0 +2 -2
  3. ppo_fix_continuous_action-10000.cleanrl_model +0 -0
  4. ppo_fix_continuous_action-100000.cleanrl_model +0 -0
  5. ppo_fix_continuous_action-105000.cleanrl_model +0 -0
  6. ppo_fix_continuous_action-110000.cleanrl_model +0 -0
  7. ppo_fix_continuous_action-115000.cleanrl_model +0 -0
  8. ppo_fix_continuous_action-120000.cleanrl_model +0 -0
  9. ppo_fix_continuous_action-125000.cleanrl_model +0 -0
  10. ppo_fix_continuous_action-130000.cleanrl_model +0 -0
  11. ppo_fix_continuous_action-135000.cleanrl_model +0 -0
  12. ppo_fix_continuous_action-140000.cleanrl_model +0 -0
  13. ppo_fix_continuous_action-145000.cleanrl_model +0 -0
  14. ppo_fix_continuous_action-15000.cleanrl_model +0 -0
  15. ppo_fix_continuous_action-150000.cleanrl_model +0 -0
  16. ppo_fix_continuous_action-155000.cleanrl_model +0 -0
  17. ppo_fix_continuous_action-160000.cleanrl_model +0 -0
  18. ppo_fix_continuous_action-165000.cleanrl_model +0 -0
  19. ppo_fix_continuous_action-170000.cleanrl_model +0 -0
  20. ppo_fix_continuous_action-175000.cleanrl_model +0 -0
  21. ppo_fix_continuous_action-180000.cleanrl_model +0 -0
  22. ppo_fix_continuous_action-185000.cleanrl_model +0 -0
  23. ppo_fix_continuous_action-190000.cleanrl_model +0 -0
  24. ppo_fix_continuous_action-195000.cleanrl_model +0 -0
  25. ppo_fix_continuous_action-20000.cleanrl_model +0 -0
  26. ppo_fix_continuous_action-200000.cleanrl_model +0 -0
  27. ppo_fix_continuous_action-205000.cleanrl_model +0 -0
  28. ppo_fix_continuous_action-210000.cleanrl_model +0 -0
  29. ppo_fix_continuous_action-215000.cleanrl_model +0 -0
  30. ppo_fix_continuous_action-220000.cleanrl_model +0 -0
  31. ppo_fix_continuous_action-225000.cleanrl_model +0 -0
  32. ppo_fix_continuous_action-230000.cleanrl_model +0 -0
  33. ppo_fix_continuous_action-235000.cleanrl_model +0 -0
  34. ppo_fix_continuous_action-240000.cleanrl_model +0 -0
  35. ppo_fix_continuous_action-245000.cleanrl_model +0 -0
  36. ppo_fix_continuous_action-25000.cleanrl_model +0 -0
  37. ppo_fix_continuous_action-250000.cleanrl_model +0 -0
  38. ppo_fix_continuous_action-255000.cleanrl_model +0 -0
  39. ppo_fix_continuous_action-260000.cleanrl_model +0 -0
  40. ppo_fix_continuous_action-265000.cleanrl_model +0 -0
  41. ppo_fix_continuous_action-270000.cleanrl_model +0 -0
  42. ppo_fix_continuous_action-275000.cleanrl_model +0 -0
  43. ppo_fix_continuous_action-280000.cleanrl_model +0 -0
  44. ppo_fix_continuous_action-285000.cleanrl_model +0 -0
  45. ppo_fix_continuous_action-290000.cleanrl_model +0 -0
  46. ppo_fix_continuous_action-295000.cleanrl_model +0 -0
  47. ppo_fix_continuous_action-30000.cleanrl_model +0 -0
  48. ppo_fix_continuous_action-300000.cleanrl_model +0 -0
  49. ppo_fix_continuous_action-305000.cleanrl_model +0 -0
  50. ppo_fix_continuous_action-310000.cleanrl_model +0 -0
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: Swimmer-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 77.44 +/- 2.78
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -46,7 +46,7 @@ curl -OL https://huggingface.co/sdpkjc/Swimmer-v4-ppo_fix_continuous_action-seed
46
  curl -OL https://huggingface.co/sdpkjc/Swimmer-v4-ppo_fix_continuous_action-seed5/raw/main/pyproject.toml
47
  curl -OL https://huggingface.co/sdpkjc/Swimmer-v4-ppo_fix_continuous_action-seed5/raw/main/poetry.lock
48
  poetry install --all-extras
49
- python ppo_fix_continuous_action.py --save-model --upload-model --hf-entity sdpkjc --env-id Swimmer-v4 --seed 5 --track --cuda False
50
  ```
51
 
52
  # Hyperparameters
@@ -56,7 +56,7 @@ python ppo_fix_continuous_action.py --save-model --upload-model --hf-entity sdpk
56
  'capture_video': False,
57
  'clip_coef': 0.2,
58
  'clip_vloss': True,
59
- 'cuda': False,
60
  'ent_coef': 0.0,
61
  'env_id': 'Swimmer-v4',
62
  'exp_name': 'ppo_fix_continuous_action',
 
16
  type: Swimmer-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 59.11 +/- 5.97
20
  name: mean_reward
21
  verified: false
22
  ---
 
46
  curl -OL https://huggingface.co/sdpkjc/Swimmer-v4-ppo_fix_continuous_action-seed5/raw/main/pyproject.toml
47
  curl -OL https://huggingface.co/sdpkjc/Swimmer-v4-ppo_fix_continuous_action-seed5/raw/main/poetry.lock
48
  poetry install --all-extras
49
+ python ppo_fix_continuous_action.py --save-model --upload-model --hf-entity sdpkjc --env-id Swimmer-v4 --seed 5 --track
50
  ```
51
 
52
  # Hyperparameters
 
56
  'capture_video': False,
57
  'clip_coef': 0.2,
58
  'clip_vloss': True,
59
+ 'cuda': True,
60
  'ent_coef': 0.0,
61
  'env_id': 'Swimmer-v4',
62
  'exp_name': 'ppo_fix_continuous_action',
events.out.tfevents.1705723465.4090-171.2555519.0 → events.out.tfevents.1705726201.4090-171.2583911.0 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4175d2c14a00c0477ce120627fbe7ac3352b5377e268a7db8dbcd5f71a912478
3
- size 376391
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:863312e3c4914d0205868fb0ead5641b55975aac7eea29ff159e8f87857b73a3
3
+ size 403050
ppo_fix_continuous_action-10000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-100000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-105000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-110000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-115000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-120000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-125000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-130000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-135000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-140000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-145000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-15000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-150000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-155000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-160000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-165000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-170000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-175000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-180000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-185000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-190000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-195000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-20000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-200000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-205000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-210000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-215000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-220000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-225000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-230000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-235000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-240000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-245000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-25000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-250000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-255000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-260000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-265000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-270000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-275000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-280000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-285000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-290000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-295000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-30000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-300000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-305000.cleanrl_model ADDED
Binary file (44.5 kB). View file
 
ppo_fix_continuous_action-310000.cleanrl_model ADDED
Binary file (44.5 kB). View file