francescosabbarese committed on
Commit
cc24025
·
verified ·
1 Parent(s): 45073f3

Upload folder using huggingface_hub

Browse files
.summary/0/events.out.tfevents.1740689707.631c800cb024 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52a57a4c664a8fb0c37300c584ef8c592253d24ea4f3d2959097f68218f5b5c6
3
+ size 1897610
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
- value: 10.25 +/- 4.97
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
+ value: 12.55 +/- 7.27
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000002712_22216704_reward_31.850.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41117ae72490213e4f6612604bcbe03b177dea2a774fd55dcb8fd2d60c73296e
3
+ size 36830735
checkpoint_p0/checkpoint_000003049_24977408.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e95dcaba387481cb54ffe8417b8079085371e051834be524c51fe70558d0051c
3
+ size 36831233
checkpoint_p0/checkpoint_000003053_25010176.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e85475c587a308bec60a10191b17308cbb8f5d8f84dfe5a9483f8fac0160564
3
+ size 36831233
config.json CHANGED
@@ -65,8 +65,8 @@
65
  "summaries_use_frameskip": true,
66
  "heartbeat_interval": 10,
67
  "heartbeat_reporting_interval": 300,
68
- "train_for_env_steps": 100000000,
69
- "train_for_seconds": 300000,
70
  "save_every_sec": 120,
71
  "keep_checkpoints": 2,
72
  "load_checkpoint_kind": "latest",
@@ -84,12 +84,12 @@
84
  512
85
  ],
86
  "use_rnn": true,
87
- "rnn_size": 512,
88
- "rnn_type": "lstm",
89
- "rnn_num_layers": 1,
90
  "decoder_mlp_layers": [],
91
  "nonlinearity": "elu",
92
- "policy_initialization": "orthogonal",
93
  "policy_init_gain": 1.0,
94
  "actor_critic_share_weights": true,
95
  "adaptive_stddev": true,
@@ -130,7 +130,7 @@
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
- "command_line": "--env=doom_health_gathering_supreme --batch_size=2048 --num_workers=20 --num_envs_per_worker=12 --train_for_env_steps=100000000 --gamma=0.99 --rnn_type=lstm --rnn_size=512 --encoder_conv_architecture=convnet_atari --decorrelate_experience_max_seconds=1 --heartbeat_interval=10 --heartbeat_reporting_interval=300 --train_for_seconds=300000",
134
  "cli_args": {
135
  "env": "doom_health_gathering_supreme",
136
  "num_workers": 20,
@@ -140,11 +140,13 @@
140
  "decorrelate_experience_max_seconds": 1,
141
  "heartbeat_interval": 10,
142
  "heartbeat_reporting_interval": 300,
143
- "train_for_env_steps": 100000000,
144
- "train_for_seconds": 300000,
145
  "encoder_conv_architecture": "convnet_atari",
146
- "rnn_size": 512,
147
- "rnn_type": "lstm"
 
 
148
  },
149
  "git_hash": "unknown",
150
  "git_repo_name": "not a git repository"
 
65
  "summaries_use_frameskip": true,
66
  "heartbeat_interval": 10,
67
  "heartbeat_reporting_interval": 300,
68
+ "train_for_env_steps": 25000000,
69
+ "train_for_seconds": 320000,
70
  "save_every_sec": 120,
71
  "keep_checkpoints": 2,
72
  "load_checkpoint_kind": "latest",
 
84
  512
85
  ],
86
  "use_rnn": true,
87
+ "rnn_size": 256,
88
+ "rnn_type": "gru",
89
+ "rnn_num_layers": 2,
90
  "decoder_mlp_layers": [],
91
  "nonlinearity": "elu",
92
+ "policy_initialization": "xavier_uniform",
93
  "policy_init_gain": 1.0,
94
  "actor_critic_share_weights": true,
95
  "adaptive_stddev": true,
 
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
+ "command_line": "--env=doom_health_gathering_supreme --batch_size=2048 --num_workers=20 --num_envs_per_worker=12 --train_for_env_steps=25000000 --gamma=0.99 --rnn_type=gru --rnn_num_layers=2 --rnn_size=256 --encoder_conv_architecture=convnet_atari --policy_initialization=xavier_uniform --decorrelate_experience_max_seconds=1 --heartbeat_interval=10 --heartbeat_reporting_interval=300 --train_for_seconds=320000",
134
  "cli_args": {
135
  "env": "doom_health_gathering_supreme",
136
  "num_workers": 20,
 
140
  "decorrelate_experience_max_seconds": 1,
141
  "heartbeat_interval": 10,
142
  "heartbeat_reporting_interval": 300,
143
+ "train_for_env_steps": 25000000,
144
+ "train_for_seconds": 320000,
145
  "encoder_conv_architecture": "convnet_atari",
146
+ "rnn_size": 256,
147
+ "rnn_type": "gru",
148
+ "rnn_num_layers": 2,
149
+ "policy_initialization": "xavier_uniform"
150
  },
151
  "git_hash": "unknown",
152
  "git_repo_name": "not a git repository"
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73cade1b7c741fe9141d3bd76455c7715107bb078fb7600366c1a829064f2bba
3
- size 8751111
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d488dc1e4f869e596687c2e517c07dde52da289092233d573494a31666914641
3
+ size 24752210
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff