kalbuld committed on
Commit
df8b92f
·
verified ·
1 Parent(s): bdd769b

Upload PPO SpaceInvaders-v5 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: ALE/SpaceInvaders-v5
17
  metrics:
18
  - type: mean_reward
19
- value: 167.50 +/- 77.89
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: ALE/SpaceInvaders-v5
17
  metrics:
18
  - type: mean_reward
19
+ value: 313.00 +/- 134.61
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
The diff for this file is too large to render. See raw diff
 
ppo-SpaceInvaders-v5.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:173970460477fb5f445f004ce180c6a7e965a6d943c2fdf17f68d0b1ba8d1eaf
3
- size 156045551
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b63c0bd3767e876ddc27c383e95a631e86e7e6e0596b8018821c8ddc195a61f2
3
+ size 155642641
ppo-SpaceInvaders-v5/data CHANGED
The diff for this file is too large to render. See raw diff
 
ppo-SpaceInvaders-v5/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b768c06648359f99db718e363e47644e0fa4d8c9161ac3ebf22f22e596ae6939
3
  size 103300394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c3ba4f33e9739c7051e55169271a9bd0ac3d90d7cb8780bd8aae1c06988890c
3
  size 103300394
ppo-SpaceInvaders-v5/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fc59b20655619f55f1276d69f56868067e575a1976411fec7d3447bd26c066a
3
  size 51649778
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8925fd4cbf6730e1ac9e2b6cc9289b663e18912bbe7034ddc031776d34f735ef
3
  size 51649778
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 167.5, "std_reward": 77.88613483798, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-10-06T04:13:26.935025"}
 
1
+ {"mean_reward": 313.0, "std_reward": 134.6142637315972, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-10-06T05:23:30.467482"}