Upload folder using huggingface_hub
Browse files
- .summary/0/events.out.tfevents.1740689707.631c800cb024 +3 -0
- README.md +1 -1
- checkpoint_p0/best_000002712_22216704_reward_31.850.pth +3 -0
- checkpoint_p0/checkpoint_000003049_24977408.pth +3 -0
- checkpoint_p0/checkpoint_000003053_25010176.pth +3 -0
- config.json +13 -11
- replay.mp4 +2 -2
- sf_log.txt +0 -0
.summary/0/events.out.tfevents.1740689707.631c800cb024
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52a57a4c664a8fb0c37300c584ef8c592253d24ea4f3d2959097f68218f5b5c6
|
3 |
+
size 1897610
|
README.md
CHANGED
@@ -15,7 +15,7 @@ model-index:
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
-
value:
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
+
value: 12.55 +/- 7.27
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
checkpoint_p0/best_000002712_22216704_reward_31.850.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41117ae72490213e4f6612604bcbe03b177dea2a774fd55dcb8fd2d60c73296e
|
3 |
+
size 36830735
|
checkpoint_p0/checkpoint_000003049_24977408.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e95dcaba387481cb54ffe8417b8079085371e051834be524c51fe70558d0051c
|
3 |
+
size 36831233
|
checkpoint_p0/checkpoint_000003053_25010176.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e85475c587a308bec60a10191b17308cbb8f5d8f84dfe5a9483f8fac0160564
|
3 |
+
size 36831233
|
config.json
CHANGED
@@ -65,8 +65,8 @@
|
|
65 |
"summaries_use_frameskip": true,
|
66 |
"heartbeat_interval": 10,
|
67 |
"heartbeat_reporting_interval": 300,
|
68 |
-
"train_for_env_steps":
|
69 |
-
"train_for_seconds":
|
70 |
"save_every_sec": 120,
|
71 |
"keep_checkpoints": 2,
|
72 |
"load_checkpoint_kind": "latest",
|
@@ -84,12 +84,12 @@
|
|
84 |
512
|
85 |
],
|
86 |
"use_rnn": true,
|
87 |
-
"rnn_size":
|
88 |
-
"rnn_type": "
|
89 |
-
"rnn_num_layers":
|
90 |
"decoder_mlp_layers": [],
|
91 |
"nonlinearity": "elu",
|
92 |
-
"policy_initialization": "
|
93 |
"policy_init_gain": 1.0,
|
94 |
"actor_critic_share_weights": true,
|
95 |
"adaptive_stddev": true,
|
@@ -130,7 +130,7 @@
|
|
130 |
"wide_aspect_ratio": false,
|
131 |
"eval_env_frameskip": 1,
|
132 |
"fps": 35,
|
133 |
-
"command_line": "--env=doom_health_gathering_supreme --batch_size=2048 --num_workers=20 --num_envs_per_worker=12 --train_for_env_steps=
|
134 |
"cli_args": {
|
135 |
"env": "doom_health_gathering_supreme",
|
136 |
"num_workers": 20,
|
@@ -140,11 +140,13 @@
|
|
140 |
"decorrelate_experience_max_seconds": 1,
|
141 |
"heartbeat_interval": 10,
|
142 |
"heartbeat_reporting_interval": 300,
|
143 |
-
"train_for_env_steps":
|
144 |
-
"train_for_seconds":
|
145 |
"encoder_conv_architecture": "convnet_atari",
|
146 |
-
"rnn_size":
|
147 |
-
"rnn_type": "
|
|
|
|
|
148 |
},
|
149 |
"git_hash": "unknown",
|
150 |
"git_repo_name": "not a git repository"
|
|
|
65 |
"summaries_use_frameskip": true,
|
66 |
"heartbeat_interval": 10,
|
67 |
"heartbeat_reporting_interval": 300,
|
68 |
+
"train_for_env_steps": 25000000,
|
69 |
+
"train_for_seconds": 320000,
|
70 |
"save_every_sec": 120,
|
71 |
"keep_checkpoints": 2,
|
72 |
"load_checkpoint_kind": "latest",
|
|
|
84 |
512
|
85 |
],
|
86 |
"use_rnn": true,
|
87 |
+
"rnn_size": 256,
|
88 |
+
"rnn_type": "gru",
|
89 |
+
"rnn_num_layers": 2,
|
90 |
"decoder_mlp_layers": [],
|
91 |
"nonlinearity": "elu",
|
92 |
+
"policy_initialization": "xavier_uniform",
|
93 |
"policy_init_gain": 1.0,
|
94 |
"actor_critic_share_weights": true,
|
95 |
"adaptive_stddev": true,
|
|
|
130 |
"wide_aspect_ratio": false,
|
131 |
"eval_env_frameskip": 1,
|
132 |
"fps": 35,
|
133 |
+
"command_line": "--env=doom_health_gathering_supreme --batch_size=2048 --num_workers=20 --num_envs_per_worker=12 --train_for_env_steps=25000000 --gamma=0.99 --rnn_type=gru --rnn_num_layers=2 --rnn_size=256 --encoder_conv_architecture=convnet_atari --policy_initialization=xavier_uniform --decorrelate_experience_max_seconds=1 --heartbeat_interval=10 --heartbeat_reporting_interval=300 --train_for_seconds=320000",
|
134 |
"cli_args": {
|
135 |
"env": "doom_health_gathering_supreme",
|
136 |
"num_workers": 20,
|
|
|
140 |
"decorrelate_experience_max_seconds": 1,
|
141 |
"heartbeat_interval": 10,
|
142 |
"heartbeat_reporting_interval": 300,
|
143 |
+
"train_for_env_steps": 25000000,
|
144 |
+
"train_for_seconds": 320000,
|
145 |
"encoder_conv_architecture": "convnet_atari",
|
146 |
+
"rnn_size": 256,
|
147 |
+
"rnn_type": "gru",
|
148 |
+
"rnn_num_layers": 2,
|
149 |
+
"policy_initialization": "xavier_uniform"
|
150 |
},
|
151 |
"git_hash": "unknown",
|
152 |
"git_repo_name": "not a git repository"
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d488dc1e4f869e596687c2e517c07dde52da289092233d573494a31666914641
|
3 |
+
size 24752210
|
sf_log.txt
CHANGED
The diff for this file is too large to render.
See raw diff
|
|