colinrgodsey committed on Jul 25, 2024

Commit

e020ca5

verified ·

1 Parent(s): 8544a15

Push agent to the Hub

Files changed (18) hide show

README.md CHANGED Viewed

@@ -1,6 +1,6 @@
 ---
 tags:
-- doom_health_gathering_supreme
 - ppo
 - deep-reinforcement-learning
 - reinforcement-learning
@@ -13,32 +13,33 @@ model-index:
       type: reinforcement-learning
       name: reinforcement-learning
     dataset:
-      name: doom_health_gathering_supreme
-      type: doom_health_gathering_supreme
     metrics:
     - type: mean_reward
-      value: 23.32 +/- 12.86
       name: mean_reward
       verified: false
 ---
-  # PPO Agent Playing doom_health_gathering_supreme
-  This is a trained model of a PPO agent playing doom_health_gathering_supreme.
   # Hyperparameters
   ```python
-  {'env_id': 'doom_health_gathering_supreme'
-'learning_rate': 0.001
 'gamma': 0.99
 'gae_lambda': 0.95
 'clip_coef': 0.2
-'total_timesteps': 1000000
-'ent_coef': 0.001
 'vf_coef': 0.5
 'max_grad_norm': 4.0
 'epsilon': 0
-'num_minibatches': 2
 'update_epochs': 1}
   ```

 ---
 tags:
+- HealthGatheringSupreme-v1
 - ppo
 - deep-reinforcement-learning
 - reinforcement-learning
       type: reinforcement-learning
       name: reinforcement-learning
     dataset:
+      name: HealthGatheringSupreme-v1
+      type: HealthGatheringSupreme-v1
     metrics:
     - type: mean_reward
+      value: 23.42 +/- 20.23
       name: mean_reward
       verified: false
 ---
+  # PPO Agent Playing HealthGatheringSupreme-v1
+  This is a trained model of a PPO agent playing HealthGatheringSupreme-v1.
   # Hyperparameters
   ```python
+  {'env_id': 'HealthGatheringSupreme-v1'
+'learning_rate': 0.0005
+'learning_rate_min': 1e-06
 'gamma': 0.99
 'gae_lambda': 0.95
 'clip_coef': 0.2
+'total_timesteps': 2000000
+'ent_coef': 0.05
 'vf_coef': 0.5
 'max_grad_norm': 4.0
 'epsilon': 0
+'num_minibatches': 4
 'update_epochs': 1}
   ```

logs/events.out.tfevents.1721869554.tf-notebook-0.8669.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6947fbbf2fff5fed1c0e049c1a6c69ea6720ba1a4ed7b01fe025d0fc61864a2a
+size 5555

logs/events.out.tfevents.1721869582.tf-notebook-0.8669.2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:704bd63940b8708968784f9423a173cc46aafe172f6eed3ef20d40d2cb7f4fff
+size 263043

logs/events.out.tfevents.1721870482.tf-notebook-0.8669.3 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b9248687fc0867b83fc4edf497c02d8f8541c504eea38338f2530abc775ae69
+size 88

logs/events.out.tfevents.1721870495.tf-notebook-0.10474.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:2ba644caa7a3a79265839058cd7bbb1a21dc08ca4f66b8f861b3aa41ad1fe1df
+size 88

logs/events.out.tfevents.1721870528.tf-notebook-0.10474.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:86cb3cbad2ae86756572dd6a5ab1af46f565751b14510ced7c1e0fa8b2a5727c
+size 88

logs/events.out.tfevents.1721870553.tf-notebook-0.10474.2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:7a4f8252a59cf1bc6dbc44aaad64de896962c2532002f6ea40d0e691ae8e3d0d
+size 88

logs/events.out.tfevents.1721870563.tf-notebook-0.10830.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0dd7e66684e4eb33956cc55dad18f0cfccc10d6f5ba2c84fff9a4ad43b26b894
+size 88

logs/events.out.tfevents.1721870604.tf-notebook-0.10989.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:00812c9c3b7b250243f82f95379c56074a7c06344133a950aef20a9769a58b6c
+size 88

logs/events.out.tfevents.1721870771.tf-notebook-0.11148.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:bccd4023cb6b778bde58abd7957e2813477ae8e89bb834468942efeb3d7a5fd5
+size 8280

logs/events.out.tfevents.1721870852.tf-notebook-0.11323.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:adec6207f5b7601cc34663cd81a67970db0c813c7bab52fe477b30a7d00acb60
+size 492195

logs/events.out.tfevents.1721872526.tf-notebook-0.11499.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:926b0a2823d32f53977ab71f81b06c4a462808f7a05f958dccadf3fe43853252
+size 8280

logs/events.out.tfevents.1721872613.tf-notebook-0.11896.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:096341e46438d876a38a4d3925927d07fb5bb78f2d0f7fc59f2e05f70aea7c23
+size 24664

logs/events.out.tfevents.1721872749.tf-notebook-0.12294.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c50c813ab17f7374742923890098bbb2638152a2800ac9ee1d8016cb39e1390c
+size 88

logs/events.out.tfevents.1721872878.tf-notebook-0.12294.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:110886d5926cde26685bb5291066ec5c7a2ecd593edac5c18854a70c0266f3e3
+size 601227

model.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1ac57c7a562674be7b647e77c7397eeb4049ab42bbfb65ecd8c400e8a57a6af8
-size 16208178

 version https://git-lfs.github.com/spec/v1
+oid sha256:f4f422fd65107d4b849ee465442c8d2cd7e559f763626598965f355384a94db3
+size 16091362

replay.mp4 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:096d2848cacb8d6b3fea66adf12b653f332423a7d8c7dbf1d353da4c1493bbf0
-size 10432852

 version https://git-lfs.github.com/spec/v1
+oid sha256:dd8e6ba71ad9ef373f72deb5744cdd952f78c1cb3a173ca8f05a518e49b50a9e
+size 7298703

results.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"env_id": "doom_health_gathering_supreme", "mean_reward": 23.317407608032227, "std_reward": 12.858668327331543, "n_evaluation_episodes": 10, "eval_datetime": "2024-07-25T01:02:59.758995"}


1	+ {"env_id": "HealthGatheringSupreme-v1", "mean_reward": 23.419818878173828, "std_reward": 20.225461959838867, "n_evaluation_episodes": 10, "eval_datetime": "2024-07-25T02:42:47.105650"}