alidenewade committed on
Commit
35d3de9
·
verified ·
1 Parent(s): 150c4f1

Upload folder using huggingface_hub

Browse files
Files changed (37) hide show
  1. .gitattributes +1 -0
  2. .summary/0/events.out.tfevents.1730974276.ali +3 -0
  3. .summary/0/events.out.tfevents.1730974590.ali +3 -0
  4. .summary/0/events.out.tfevents.1730974664.ali +3 -0
  5. .summary/0/events.out.tfevents.1730975190.ali +3 -0
  6. .summary/0/events.out.tfevents.1730975549.ali +3 -0
  7. .summary/0/events.out.tfevents.1730975770.ali +3 -0
  8. .summary/0/events.out.tfevents.1730975809.ali +3 -0
  9. .summary/0/events.out.tfevents.1730975829.ali +3 -0
  10. .summary/0/events.out.tfevents.1730976027.ali +3 -0
  11. .summary/0/events.out.tfevents.1730978122.ali +3 -0
  12. .summary/0/events.out.tfevents.1730978309.ali +3 -0
  13. .summary/0/events.out.tfevents.1730978593.ali +3 -0
  14. .summary/0/events.out.tfevents.1730978881.ali +3 -0
  15. .summary/0/events.out.tfevents.1730979552.ali +3 -0
  16. .summary/0/events.out.tfevents.1730979979.ali +3 -0
  17. .summary/0/events.out.tfevents.1730980579.ali +3 -0
  18. .summary/0/events.out.tfevents.1730981989.ali +3 -0
  19. .summary/0/events.out.tfevents.1730982413.ali +0 -0
  20. .summary/0/events.out.tfevents.1730982684.ali +0 -0
  21. .summary/0/events.out.tfevents.1730982741.ali +3 -0
  22. .summary/0/events.out.tfevents.1730982907.ali +3 -0
  23. .summary/0/events.out.tfevents.1730984134.ali +3 -0
  24. .summary/0/events.out.tfevents.1730984471.ali +3 -0
  25. .summary/0/events.out.tfevents.1730986539.ali +3 -0
  26. .summary/0/events.out.tfevents.1730987699.ali +3 -0
  27. .summary/0/events.out.tfevents.1731011984.ali +0 -0
  28. .summary/0/events.out.tfevents.1731012020.ali +0 -0
  29. .summary/0/events.out.tfevents.1731012499.ali +3 -0
  30. .summary/0/events.out.tfevents.1731014017.ali +3 -0
  31. README.md +56 -0
  32. checkpoint_p0/best_000050505_206868480_reward_4.944.pth +3 -0
  33. checkpoint_p0/checkpoint_000052490_214999040.pth +3 -0
  34. checkpoint_p0/checkpoint_000052658_215687168.pth +3 -0
  35. config.json +142 -0
  36. replay.mp4 +3 -0
  37. sf_log.txt +0 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ replay.mp4 filter=lfs diff=lfs merge=lfs -text
.summary/0/events.out.tfevents.1730974276.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4382105e3ef6707c735ccd1579bf41ee9a01be70ee168b41b43f860e63647233
3
+ size 40
.summary/0/events.out.tfevents.1730974590.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38d118f6935be2e9cd880c8220197067c14a9d329cea5ddd42ca64ffb6a56b0e
3
+ size 151
.summary/0/events.out.tfevents.1730974664.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5cb81d627e1ce00aae8317ff3ad12859a9bab6e263c59bd93d0c9cec3e97d00
3
+ size 276148
.summary/0/events.out.tfevents.1730975190.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:597bf3ddf19d2be914ca908e7e364cb0334d237699e96aa3fa637e976b8d2228
3
+ size 43666
.summary/0/events.out.tfevents.1730975549.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28f1f4dcde7139511501908f7aca479f96594689b35b4537c393f083bdf9dda9
3
+ size 60347
.summary/0/events.out.tfevents.1730975770.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04e3d83a01510c600e7789ca5840916784d69ef5dd961e67e88ed1361ace092d
3
+ size 40
.summary/0/events.out.tfevents.1730975809.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69466774033c58c11cb37326d494c1b7ca021571c086781221112a5d8100ffef
3
+ size 40
.summary/0/events.out.tfevents.1730975829.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05621f66b90cc3a8a5315e00fc608b69bc8981101048aceb1225776c8e8be71c
3
+ size 565
.summary/0/events.out.tfevents.1730976027.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31af7e16468267d3b690298905441fa94c76320d3c08b51b8dcc2605a016e688
3
+ size 40
.summary/0/events.out.tfevents.1730978122.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ab3136ad6f56c7e5e63be561dbe627e85c6017ee07f1e1f8699528c69081346
3
+ size 20617
.summary/0/events.out.tfevents.1730978309.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff634f8baab7584feee9878d5fb0256f54bb7323cebd618ed303916d59a0a4b3
3
+ size 90
.summary/0/events.out.tfevents.1730978593.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f08ed57889be4f7b015f785c19c0711d9f4721ec8d6922df06d0a2dd71f5bca5
3
+ size 141087
.summary/0/events.out.tfevents.1730978881.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10efcede3823ac261b583e403b212b3de7a25fecbce7b6404eae0dab5e47b4ed
3
+ size 56857
.summary/0/events.out.tfevents.1730979552.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd078efe6f013cdc7d671dd119f486ff7f169b28aba261a7c8e01577d7fa30e4
3
+ size 4915
.summary/0/events.out.tfevents.1730979979.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9439b155a01d1103172ccd2561e5959231c4f43de30dbb4489126329672767a3
3
+ size 2683
.summary/0/events.out.tfevents.1730980579.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d28c8ee2be2d5ec00d853944f6079d26aeb23fdcdf653535a1326cb1211cc83f
3
+ size 3251
.summary/0/events.out.tfevents.1730981989.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c6074b66c173883d8c0d34862aeccd2380761dafe4ee720058660a2aeaefa2f
3
+ size 3251
.summary/0/events.out.tfevents.1730982413.ali ADDED
File without changes
.summary/0/events.out.tfevents.1730982684.ali ADDED
File without changes
.summary/0/events.out.tfevents.1730982741.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:814f1a05c62696ae377c67fe385aa2b78f2e1f1bb048a26fdfd6d51ce9706129
3
+ size 40
.summary/0/events.out.tfevents.1730982907.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b77ed93e786f21de8587f4a2cf8852dbda3dbf10c6afaab58ea577ed51e36a71
3
+ size 418702
.summary/0/events.out.tfevents.1730984134.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63b94cdef6e415ddbb0526608b0aeec84bab1ed76f502a53dc2253bb836dc4ad
3
+ size 3066
.summary/0/events.out.tfevents.1730984471.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed1f2510c136f287f3925582d617719373e7e94b3e3f3728b2fe53983b303464
3
+ size 887900
.summary/0/events.out.tfevents.1730986539.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1e11b0059b918b90d03360ce897dbcfbe4919841fc122b58ade530701936f1f
3
+ size 3137
.summary/0/events.out.tfevents.1730987699.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87059ecbdc1670d0818d006cee4eb4c1c8f0c91d0d12d9116f813c80be81e325
3
+ size 375709
.summary/0/events.out.tfevents.1731011984.ali ADDED
File without changes
.summary/0/events.out.tfevents.1731012020.ali ADDED
File without changes
.summary/0/events.out.tfevents.1731012499.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9df453dfb3b9b49a5a14dd8296be889497ffc265dc538b6a69193e7b60f856be
3
+ size 3066
.summary/0/events.out.tfevents.1731014017.ali ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74000e5dac727c97b7fa7174a685eb3bbb538887f7ec2c0ef1685dcfc5653da5
3
+ size 7814291
README.md ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: sample-factory
3
+ tags:
4
+ - deep-reinforcement-learning
5
+ - reinforcement-learning
6
+ - sample-factory
7
+ model-index:
8
+ - name: APPO
9
+ results:
10
+ - task:
11
+ type: reinforcement-learning
12
+ name: reinforcement-learning
13
+ dataset:
14
+ name: doom_health_gathering_supreme
15
+ type: doom_health_gathering_supreme
16
+ metrics:
17
+ - type: mean_reward
18
+ value: 4.11 +/- 0.62
19
+ name: mean_reward
20
+ verified: false
21
+ ---
22
+
23
+ An **APPO** model trained on the **doom_health_gathering_supreme** environment.
24
+
25
+ This model was trained using Sample-Factory 2.0: https://github.com/alex-petrenko/sample-factory.
26
+ Documentation for how to use Sample-Factory can be found at https://www.samplefactory.dev/
27
+
28
+
29
+ ## Downloading the model
30
+
31
+ After installing Sample-Factory, download the model with:
32
+ ```
33
+ python -m sample_factory.huggingface.load_from_hub -r alidenewade/rl_course_vizdoom_health_gathering_supreme-alid
34
+ ```
35
+
36
+
37
+ ## Using the model
38
+
39
+ To run the model after download, use the `enjoy` script corresponding to this environment:
40
+ ```
41
+ python -m <path.to.enjoy.module> --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=rl_course_vizdoom_health_gathering_supreme-alid
42
+ ```
43
+
44
+
45
+ You can also upload models to the Hugging Face Hub using the same script with the `--push_to_hub` flag.
46
+ See https://www.samplefactory.dev/10-huggingface/huggingface/ for more details.
47
+
48
+ ## Training with this model
49
+
50
+ To continue training with this model, use the `train` script corresponding to this environment:
51
+ ```
52
+ python -m <path.to.train.module> --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=rl_course_vizdoom_health_gathering_supreme-alid --restart_behavior=resume --train_for_env_steps=10000000000
53
+ ```
54
+
55
+ Note: you may have to set `--train_for_env_steps` to a suitably high number, because the experiment resumes from the step count at which it previously concluded.
56
+
checkpoint_p0/best_000050505_206868480_reward_4.944.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:623329ecdb15960b9faa8deab2fdeb826e8abc897bdd6e010d871633abc14ca4
3
+ size 34929243
checkpoint_p0/checkpoint_000052490_214999040.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd9883e09c4d3e0564e621dfa733222a972ef9a1b85d5c98d87e2882267d1fad
3
+ size 34929669
checkpoint_p0/checkpoint_000052658_215687168.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f49ba940f2daa8637c534abc25808a59b815464b05d0415515ac063d49604f5
3
+ size 34929669
config.json ADDED
@@ -0,0 +1,142 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "help": false,
3
+ "algo": "APPO",
4
+ "env": "doom_health_gathering_supreme",
5
+ "experiment": "default_experiment",
6
+ "train_dir": "/root/hfRL/ml/LunarLander-v2/train_dir",
7
+ "restart_behavior": "resume",
8
+ "device": "gpu",
9
+ "seed": null,
10
+ "num_policies": 1,
11
+ "async_rl": true,
12
+ "serial_mode": false,
13
+ "batched_sampling": false,
14
+ "num_batches_to_accumulate": 2,
15
+ "worker_num_splits": 2,
16
+ "policy_workers_per_policy": 1,
17
+ "max_policy_lag": 1000,
18
+ "num_workers": 8,
19
+ "num_envs_per_worker": 4,
20
+ "batch_size": 1024,
21
+ "num_batches_per_epoch": 1,
22
+ "num_epochs": 1,
23
+ "rollout": 32,
24
+ "recurrence": 32,
25
+ "shuffle_minibatches": false,
26
+ "gamma": 0.99,
27
+ "reward_scale": 1.0,
28
+ "reward_clip": 1000.0,
29
+ "value_bootstrap": false,
30
+ "normalize_returns": true,
31
+ "exploration_loss_coeff": 0.001,
32
+ "value_loss_coeff": 0.5,
33
+ "kl_loss_coeff": 0.0,
34
+ "exploration_loss": "symmetric_kl",
35
+ "gae_lambda": 0.95,
36
+ "ppo_clip_ratio": 0.1,
37
+ "ppo_clip_value": 0.2,
38
+ "with_vtrace": false,
39
+ "vtrace_rho": 1.0,
40
+ "vtrace_c": 1.0,
41
+ "optimizer": "adam",
42
+ "adam_eps": 1e-06,
43
+ "adam_beta1": 0.9,
44
+ "adam_beta2": 0.999,
45
+ "max_grad_norm": 4.0,
46
+ "learning_rate": 0.0003,
47
+ "lr_schedule": "constant",
48
+ "lr_schedule_kl_threshold": 0.008,
49
+ "lr_adaptive_min": 1e-06,
50
+ "lr_adaptive_max": 0.01,
51
+ "obs_subtract_mean": 0.0,
52
+ "obs_scale": 255.0,
53
+ "normalize_input": true,
54
+ "normalize_input_keys": null,
55
+ "decorrelate_experience_max_seconds": 0,
56
+ "decorrelate_envs_on_one_worker": true,
57
+ "actor_worker_gpus": [],
58
+ "set_workers_cpu_affinity": true,
59
+ "force_envs_single_thread": false,
60
+ "default_niceness": 0,
61
+ "log_to_file": true,
62
+ "experiment_summaries_interval": 10,
63
+ "flush_summaries_interval": 30,
64
+ "stats_avg": 100,
65
+ "summaries_use_frameskip": true,
66
+ "heartbeat_interval": 20,
67
+ "heartbeat_reporting_interval": 600,
68
+ "train_for_env_steps": 1000000000,
69
+ "train_for_seconds": 10000000000,
70
+ "save_every_sec": 120,
71
+ "keep_checkpoints": 2,
72
+ "load_checkpoint_kind": "latest",
73
+ "save_milestones_sec": -1,
74
+ "save_best_every_sec": 5,
75
+ "save_best_metric": "reward",
76
+ "save_best_after": 100000,
77
+ "benchmark": false,
78
+ "encoder_mlp_layers": [
79
+ 512,
80
+ 512
81
+ ],
82
+ "encoder_conv_architecture": "convnet_simple",
83
+ "encoder_conv_mlp_layers": [
84
+ 512
85
+ ],
86
+ "use_rnn": true,
87
+ "rnn_size": 512,
88
+ "rnn_type": "gru",
89
+ "rnn_num_layers": 1,
90
+ "decoder_mlp_layers": [],
91
+ "nonlinearity": "elu",
92
+ "policy_initialization": "orthogonal",
93
+ "policy_init_gain": 1.0,
94
+ "actor_critic_share_weights": true,
95
+ "adaptive_stddev": true,
96
+ "continuous_tanh_scale": 0.0,
97
+ "initial_stddev": 1.0,
98
+ "use_env_info_cache": false,
99
+ "env_gpu_actions": false,
100
+ "env_gpu_observations": true,
101
+ "env_frameskip": 4,
102
+ "env_framestack": 1,
103
+ "pixel_format": "CHW",
104
+ "use_record_episode_statistics": false,
105
+ "with_wandb": false,
106
+ "wandb_user": null,
107
+ "wandb_project": "sample_factory",
108
+ "wandb_group": null,
109
+ "wandb_job_type": "SF",
110
+ "wandb_tags": [],
111
+ "with_pbt": false,
112
+ "pbt_mix_policies_in_one_env": true,
113
+ "pbt_period_env_steps": 5000000,
114
+ "pbt_start_mutation": 20000000,
115
+ "pbt_replace_fraction": 0.3,
116
+ "pbt_mutation_rate": 0.15,
117
+ "pbt_replace_reward_gap": 0.1,
118
+ "pbt_replace_reward_gap_absolute": 1e-06,
119
+ "pbt_optimize_gamma": false,
120
+ "pbt_target_objective": "true_objective",
121
+ "pbt_perturb_min": 1.1,
122
+ "pbt_perturb_max": 1.5,
123
+ "num_agents": -1,
124
+ "num_humans": 0,
125
+ "num_bots": -1,
126
+ "start_bot_difficulty": null,
127
+ "timelimit": null,
128
+ "res_w": 128,
129
+ "res_h": 72,
130
+ "wide_aspect_ratio": false,
131
+ "eval_env_frameskip": 1,
132
+ "fps": 35,
133
+ "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=4000000",
134
+ "cli_args": {
135
+ "env": "doom_health_gathering_supreme",
136
+ "num_workers": 8,
137
+ "num_envs_per_worker": 4,
138
+ "train_for_env_steps": 4000000
139
+ },
140
+ "git_hash": "unknown",
141
+ "git_repo_name": "not a git repository"
142
+ }
replay.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef772052cb02b4cbc305fa9b5a87a7f155a919d2d3d71db999a9133eaffd10d5
3
+ size 63660637
sf_log.txt ADDED
The diff for this file is too large to render. See raw diff