lambdavi committed on
Commit
7cd68e2
1 Parent(s): e923406

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. README.md +25 -0
  2. hyperparameters.json +1 -0
  3. model.zip +3 -0
  4. replay.mp4 +0 -0
  5. results.json +1 -0
README.md ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - PandaReach-v3
4
+ - ddpg
5
+ - reinforcement-learning
6
+ - custom-implementation
7
+ model-index:
8
+ - name: ddpg-PandaReach-v3
9
+   results:
10
+   - task:
11
+       type: reinforcement-learning
12
+       name: reinforcement-learning
13
+     dataset:
14
+       name: PandaReach-v3
15
+       type: PandaReach-v3
16
+     metrics:
17
+     - type: mean_reward
18
+       value: -1.64 +/- 0.82
19
+       name: mean_reward
20
+       verified: false
21
+ ---
22
+
23
+ # **DDPG** Agent playing **PandaReach-v3**
24
+ This is a trained model of a **DDPG** agent playing **PandaReach-v3**.
25
+
hyperparameters.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"env_id": "PandaReach-v3", "max_steps": 50000, "n_training_episodes": 9624, "n_eval_episodes": 3000, "learning_rate": 0.001}
model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2494d8dedf6351c800d01a501fd95a86339bdfc4bd572c740d5c498707ead9a
3
+ size 4091189
replay.mp4 ADDED
Binary file (9.47 kB). View file
 
results.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"env_id": "PandaReach-v3", "mean_reward": -1.64, "n_evaluation_episodes": 3000, "eval_datetime": "2024-01-28T09:35:31.806232"}