jaymanvirk committed on
Commit
ada2a99
·
verified ·
1 Parent(s): efe1365

Upload folder using huggingface_hub

Browse files
.summary/0/events.out.tfevents.1715932120.1a9e46bdb9a9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:385ea0a981444fcf1fc9eabf3b18ad56daa215e30c27a5636ec49fff4f3472ab
3
+ size 804884
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
- value: 4.10 +/- 0.34
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
+ value: 10.44 +/- 2.99
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000001815_7434240_reward_32.035.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1a654d4670ed5bc012447486ae77c6e8f0b12ef9353e781bdc4306d57cc69ed
3
+ size 34929051
checkpoint_p0/checkpoint_000001721_7049216.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b86f69aea65de683db7a9e26e3f9fe366c81b085c5ed98011343774b615b3585
3
+ size 34929477
checkpoint_p0/checkpoint_000001955_8007680.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9f3b9ac82861d9578ed6be09f1e6d4107c21994108e4a97ac3954b50a9605be
3
- size 34929477
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:393792f1f85848c499dfa4906061e6cda02d5dbbf120619aa672d085ca33f732
3
+ size 34929541
config.json CHANGED
@@ -30,7 +30,7 @@
30
  "normalize_returns": true,
31
  "exploration_loss_coeff": 0.001,
32
  "value_loss_coeff": 0.5,
33
- "kl_loss_coeff": 0.0,
34
  "exploration_loss": "symmetric_kl",
35
  "gae_lambda": 0.95,
36
  "ppo_clip_ratio": 0.1,
@@ -130,12 +130,13 @@
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
- "command_line": "--env=doom_health_gathering_supreme --seed=0 --num_workers=8 --num_envs_per_worker=8 --train_for_env_steps=8000000",
134
  "cli_args": {
135
  "env": "doom_health_gathering_supreme",
136
  "seed": 0,
137
  "num_workers": 8,
138
  "num_envs_per_worker": 8,
 
139
  "train_for_env_steps": 8000000
140
  },
141
  "git_hash": "unknown",
 
30
  "normalize_returns": true,
31
  "exploration_loss_coeff": 0.001,
32
  "value_loss_coeff": 0.5,
33
+ "kl_loss_coeff": 0.3,
34
  "exploration_loss": "symmetric_kl",
35
  "gae_lambda": 0.95,
36
  "ppo_clip_ratio": 0.1,
 
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
+ "command_line": "--env=doom_health_gathering_supreme --seed=0 --kl_loss_coeff=0.3 --num_workers=8 --num_envs_per_worker=8 --train_for_env_steps=8000000",
134
  "cli_args": {
135
  "env": "doom_health_gathering_supreme",
136
  "seed": 0,
137
  "num_workers": 8,
138
  "num_envs_per_worker": 8,
139
+ "kl_loss_coeff": 0.3,
140
  "train_for_env_steps": 8000000
141
  },
142
  "git_hash": "unknown",
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46c349d29b75962ed92793897e7581a2a15087e62ed9a6ee4b9d6b8d9ba7d373
3
- size 5060169
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a726339a83db3e91dd82f291cb157ded2099bec799708959ac04cf2cab75f823
3
+ size 20190222
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff