quilaquedi committed on
Commit
134f691
·
1 Parent(s): a802bb3

Upload baseline PPO LunarLander-v2 trained agent

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. lunarlander-v2_ppo_v0.zip +1 -1
  3. results.json +1 -1
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 247.79 +/- 12.29
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 258.98 +/- 18.52
20
  name: mean_reward
21
  verified: false
22
  ---
lunarlander-v2_ppo_v0.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d78c8324a6321daf310e5a512b5084ed4c8c69c4b03d2a3b144c54abd95e6e52
3
  size 145917
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab81624293858438b755b36b0f3c4ca5bc9349674bf068a7b1839215beefd9b
3
  size 145917
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 247.79293876379307, "std_reward": 12.291194859734047, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-15T14:13:00.010466"}
 
1
+ {"mean_reward": 258.98265062935377, "std_reward": 18.51602437736822, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-15T14:14:48.100705"}