Roberto committed on
Commit
5498eec
1 Parent(s): 99bf7d8

Upload . with huggingface_hub

Browse files
.gitattributes CHANGED
@@ -2,7 +2,6 @@
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
 
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
 
5
  *.ftz filter=lfs diff=lfs merge=lfs -text
6
  *.gz filter=lfs diff=lfs merge=lfs -text
7
  *.h5 filter=lfs diff=lfs merge=lfs -text
.summary/0/events.out.tfevents.1666554178.r12i0n7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33d6690167305d19adae5a1910c49cce96aab0dc3bf34b2374b061abe3368430
3
+ size 9192848
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
- value: 8.04 +/- 3.48
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
+ value: 19.19 +/- 4.01
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000466273_3819708416_reward_63.056.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f546634a38180cb4a57aec199213e3b845b90a5ebb8206ddaa081c2c9d4ba854
3
+ size 41231900
checkpoint_p0/checkpoint_000538763_4413546496.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45dae22eea622f39a8ea7e51fa52eed63489f4548785a8c2c80d9fc5b1bc676b
3
+ size 41231900
checkpoint_p0/checkpoint_000539850_4422451200.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73fcca08938df3021096188ffa087fe10baadc4365972130f8958a74df3e498f
3
+ size 41231900
config.json CHANGED
@@ -2,11 +2,11 @@
2
  "help": false,
3
  "algo": "APPO",
4
  "env": "doom_health_gathering_supreme",
5
- "experiment": "default_experiment",
6
- "train_dir": "/content/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
- "seed": null,
10
  "num_policies": 1,
11
  "async_rl": true,
12
  "serial_mode": false,
@@ -15,9 +15,9 @@
15
  "worker_num_splits": 2,
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
- "num_workers": 8,
19
- "num_envs_per_worker": 4,
20
- "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
23
  "rollout": 32,
@@ -42,17 +42,15 @@
42
  "adam_eps": 1e-06,
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
- "max_grad_norm": 4.0,
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
49
- "lr_adaptive_min": 1e-06,
50
- "lr_adaptive_max": 0.01,
51
  "obs_subtract_mean": 0.0,
52
  "obs_scale": 255.0,
53
  "normalize_input": true,
54
  "normalize_input_keys": null,
55
- "decorrelate_experience_max_seconds": 0,
56
  "decorrelate_envs_on_one_worker": true,
57
  "actor_worker_gpus": [],
58
  "set_workers_cpu_affinity": true,
@@ -63,10 +61,10 @@
63
  "flush_summaries_interval": 30,
64
  "stats_avg": 100,
65
  "summaries_use_frameskip": true,
66
- "heartbeat_interval": 20,
67
- "heartbeat_reporting_interval": 600,
68
- "train_for_env_steps": 4000000,
69
- "train_for_seconds": 10000000000,
70
  "save_every_sec": 120,
71
  "keep_checkpoints": 2,
72
  "load_checkpoint_kind": "latest",
@@ -85,10 +83,10 @@
85
  ],
86
  "use_rnn": true,
87
  "rnn_size": 512,
88
- "rnn_type": "gru",
89
  "rnn_num_layers": 1,
90
  "decoder_mlp_layers": [],
91
- "nonlinearity": "elu",
92
  "policy_initialization": "orthogonal",
93
  "policy_init_gain": 1.0,
94
  "actor_critic_share_weights": true,
@@ -97,7 +95,6 @@
97
  "initial_stddev": 1.0,
98
  "use_env_info_cache": false,
99
  "env_gpu_actions": false,
100
- "env_gpu_observations": true,
101
  "env_frameskip": 4,
102
  "env_framestack": 1,
103
  "pixel_format": "CHW",
@@ -130,13 +127,30 @@
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
- "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=4000000",
134
  "cli_args": {
 
135
  "env": "doom_health_gathering_supreme",
136
- "num_workers": 8,
137
- "num_envs_per_worker": 4,
138
- "train_for_env_steps": 4000000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
139
  },
140
- "git_hash": "unknown",
141
- "git_repo_name": "not a git repository"
142
  }
 
2
  "help": false,
3
  "algo": "APPO",
4
  "env": "doom_health_gathering_supreme",
5
+ "experiment": "vizdoom_doom_health_gathering_supreme_2222",
6
+ "train_dir": "/scratch/sample_factory/train_dir/vizdoom",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
+ "seed": 2222,
10
  "num_policies": 1,
11
  "async_rl": true,
12
  "serial_mode": false,
 
15
  "worker_num_splits": 2,
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
+ "num_workers": 20,
19
+ "num_envs_per_worker": 12,
20
+ "batch_size": 2048,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
23
  "rollout": 32,
 
42
  "adam_eps": 1e-06,
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
+ "max_grad_norm": 0.0,
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
 
 
49
  "obs_subtract_mean": 0.0,
50
  "obs_scale": 255.0,
51
  "normalize_input": true,
52
  "normalize_input_keys": null,
53
+ "decorrelate_experience_max_seconds": 1,
54
  "decorrelate_envs_on_one_worker": true,
55
  "actor_worker_gpus": [],
56
  "set_workers_cpu_affinity": true,
 
61
  "flush_summaries_interval": 30,
62
  "stats_avg": 100,
63
  "summaries_use_frameskip": true,
64
+ "heartbeat_interval": 10,
65
+ "heartbeat_reporting_interval": 300,
66
+ "train_for_env_steps": 10000000000,
67
+ "train_for_seconds": 3600000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
70
  "load_checkpoint_kind": "latest",
 
83
  ],
84
  "use_rnn": true,
85
  "rnn_size": 512,
86
+ "rnn_type": "lstm",
87
  "rnn_num_layers": 1,
88
  "decoder_mlp_layers": [],
89
+ "nonlinearity": "relu",
90
  "policy_initialization": "orthogonal",
91
  "policy_init_gain": 1.0,
92
  "actor_critic_share_weights": true,
 
95
  "initial_stddev": 1.0,
96
  "use_env_info_cache": false,
97
  "env_gpu_actions": false,
 
98
  "env_frameskip": 4,
99
  "env_framestack": 1,
100
  "pixel_format": "CHW",
 
127
  "wide_aspect_ratio": false,
128
  "eval_env_frameskip": 1,
129
  "fps": 35,
130
+ "command_line": "--train_for_seconds=3600000 --algo=APPO --gamma=0.99 --use_rnn=True --num_workers=20 --num_envs_per_worker=12 --num_epochs=1 --rollout=32 --recurrence=32 --batch_size=2048 --benchmark=False --max_grad_norm=0.0 --decorrelate_experience_max_seconds=1 --nonlinearity=relu --rnn_type=lstm --num_policies=1 --heartbeat_reporting_interval=300 --train_dir=/scratch/sample_factory/train_dir/vizdoom --seed=2222 --experiment=vizdoom_doom_health_gathering_supreme_2222 --env=doom_health_gathering_supreme",
131
  "cli_args": {
132
+ "algo": "APPO",
133
  "env": "doom_health_gathering_supreme",
134
+ "experiment": "vizdoom_doom_health_gathering_supreme_2222",
135
+ "train_dir": "/scratch/sample_factory/train_dir/vizdoom",
136
+ "seed": 2222,
137
+ "num_policies": 1,
138
+ "num_workers": 20,
139
+ "num_envs_per_worker": 12,
140
+ "batch_size": 2048,
141
+ "num_epochs": 1,
142
+ "rollout": 32,
143
+ "recurrence": 32,
144
+ "gamma": 0.99,
145
+ "max_grad_norm": 0.0,
146
+ "decorrelate_experience_max_seconds": 1,
147
+ "heartbeat_reporting_interval": 300,
148
+ "train_for_seconds": 3600000,
149
+ "benchmark": false,
150
+ "use_rnn": true,
151
+ "rnn_type": "lstm",
152
+ "nonlinearity": "relu"
153
  },
154
+ "git_hash": "9da68b57eecd73c3c884c1be2d938b46aa7a7f49",
155
+ "git_repo_name": "https://github.com/alex-petrenko/sample-factory.git"
156
  }
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3496433111ee787e9222d3bb86cbf34b226b3892fdcd07390684da95e6c0ee36
3
- size 15367561
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9391cd4e0bdbcff669e6aa2d253dd4d5d776c909fd135137c442a49bd146ef4
3
+ size 38370996