MadFritz commited on
Commit
b86ce06
·
1 Parent(s): 6962f22

Upload ars BipedalWalker-v3 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: BipedalWalker-v3
17
  metrics:
18
  - type: mean_reward
19
- value: -16.42 +/- 2.52
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: BipedalWalker-v3
17
  metrics:
18
  - type: mean_reward
19
+ value: -1.58 +/- 1.26
20
  name: mean_reward
21
  verified: false
22
  ---
ars-BipedalWalker-v3.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1d4693b7a51e2349cf0b817923292a24d3de338187196155d8f8a8b30d11de2
3
- size 14910
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fbcb710f4d22be3e1f98d771629542f1b4eff66171c9d1226ca5b28666b3518
3
+ size 22535
ars-BipedalWalker-v3/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVMAAAAAAAAACMGHNiM19jb250cmliLmFycy5wb2xpY2llc5SMD0FSU0xpbmVhclBvbGljeZSTlC4=",
5
  "__module__": "sb3_contrib.ars.policies",
6
  "__doc__": "\n Linear policy network for ARS.\n\n :param observation_space: The observation space of the environment\n :param action_space: The action space of the environment\n :param with_bias: With or without bias on the output\n :param squash_output: For continuous actions, whether the output is squashed\n or not using a ``tanh()`` function. If not squashed with tanh the output will instead be clipped.\n ",
7
- "__init__": "<function ARSLinearPolicy.__init__ at 0x7d86d77088b0>",
8
  "__abstractmethods__": "frozenset()",
9
- "_abc_impl": "<_abc._abc_data object at 0x7d86d76f8d80>"
10
  },
11
  "verbose": 5,
12
  "policy_kwargs": {},
13
- "num_timesteps": 5017333,
14
  "_total_timesteps": 5000000.0,
15
  "_num_timesteps_at_start": 0,
16
  "seed": null,
17
  "action_noise": null,
18
- "start_time": 1704124216615583280,
19
  "learning_rate": 0.02,
20
- "tensorboard_log": "runs/BipedalWalker-v3__ars-BipedalWalker-v3__1__1704124216",
21
  "_last_obs": {
22
  ":type:": "<class 'numpy.ndarray'>",
23
  ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAPly5jdoA9Wzj3QBN7O7J7mPK3A6RtYqt5iu1TvhzrQ3c7HnO/ncqTll0yq3usHUO8Ki8TZzsec7rCmEO4JqhTv8Rok72RCQOwxdmjvQFak7iYm9O/dH2Ttzsec7c7HnO5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsYhpSMAUOUdJRSlC4="
@@ -33,71 +33,519 @@
33
  "_episode_num": 0,
34
  "use_sde": false,
35
  "sde_sample_freq": -1,
36
- "_current_progress_remaining": 0.001653400000000027,
37
  "_stats_window_size": 100,
38
  "ep_info_buffer": [
39
  {
40
- "r": -22.732791,
41
  "l": 1600
42
  },
43
  {
44
- "r": -26.241545,
45
  "l": 1600
46
  },
47
  {
48
- "r": -21.244826,
49
  "l": 1600
50
  },
51
  {
52
- "r": -18.363228,
53
  "l": 1600
54
  },
55
  {
56
- "r": -21.464579,
57
  "l": 1600
58
  },
59
  {
60
- "r": -19.700786,
61
  "l": 1600
62
  },
63
  {
64
- "r": -20.990937,
65
  "l": 1600
66
  },
67
  {
68
- "r": -20.206168,
69
  "l": 1600
70
  },
71
  {
72
- "r": -13.470986,
73
  "l": 1600
74
  },
75
  {
76
- "r": -22.199595,
77
  "l": 1600
78
  },
79
  {
80
- "r": -16.295752,
81
  "l": 1600
82
  },
83
  {
84
- "r": -18.869419,
85
  "l": 1600
86
  },
87
  {
88
- "r": -24.387612,
89
  "l": 1600
90
  },
91
  {
92
- "r": -21.286163,
93
  "l": 1600
94
  },
95
  {
96
- "r": -30.705473,
97
  "l": 1600
98
  },
99
  {
100
- "r": -19.318436,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
101
  "l": 1600
102
  }
103
  ],
@@ -105,10 +553,10 @@
105
  ":type:": "<class 'collections.deque'>",
106
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
107
  },
108
- "_n_updates": 204,
109
  "observation_space": {
110
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
111
- ":serialized:": "gAWVRgQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBAolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgUSxiFlGgYdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoECiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaApLGIWUaBh0lFKUjARoaWdolGgQKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksYhZRoGHSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==",
112
  "dtype": "float32",
113
  "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]",
114
  "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]",
@@ -123,7 +571,7 @@
123
  },
124
  "action_space": {
125
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
126
- ":serialized:": "gAWVoQEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgHjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgQKJYEAAAAAAAAAAEBAQGUaBRLBIWUaBh0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgQKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaApLBIWUaBh0lFKUjARoaWdolGgQKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaApLBIWUaBh0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=",
127
  "dtype": "float32",
128
  "bounded_below": "[ True True True True]",
129
  "bounded_above": "[ True True True True]",
@@ -137,25 +585,25 @@
137
  "_np_random": null
138
  },
139
  "n_envs": 1,
140
- "n_delta": 8,
141
- "pop_size": 16,
142
  "delta_std_schedule": {
143
  ":type:": "<class 'function'>",
144
- ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz+pmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
145
  },
146
  "n_eval_episodes": 1,
147
- "n_top": 8,
148
  "alive_bonus_offset": 0,
149
  "zero_policy": true,
150
  "weights": {
151
  ":type:": "<class 'torch.Tensor'>",
152
- ":serialized:": "gAWVAgMAAAAAAACMDHRvcmNoLl91dGlsc5SMEl9yZWJ1aWxkX3RlbnNvcl92MpSTlCiMDXRvcmNoLnN0b3JhZ2WUjBBfbG9hZF9mcm9tX2J5dGVzlJOUQnsCAACAAooKbPycRvkgaqhQGS6AAk3pAy6AAn1xAChYEAAAAHByb3RvY29sX3ZlcnNpb25xAU3pA1gNAAAAbGl0dGxlX2VuZGlhbnECiFgKAAAAdHlwZV9zaXplc3EDfXEEKFgFAAAAc2hvcnRxBUsCWAMAAABpbnRxBksEWAQAAABsb25ncQdLBHV1LoACKFgHAAAAc3RvcmFnZXEAY3RvcmNoCkZsb2F0U3RvcmFnZQpxAVgOAAAAOTk2NjU2MDUyNTg2MjRxAlgDAAAAY3B1cQNLYE50cQRRLoACXXEAWA4AAAA5OTY2NTYwNTI1ODYyNHEBYS5gAAAAAAAAAAQaDj6YWpU9OgUCPfIel7wf7EK+rywhPqHHS7zskpW8vvVnPHS9Gjz+vwW7YrKNPlU0bL5ijmK99taAPJd0C75QJBi+fNQWPk/lF76PxZm+pwxivRBW8L3KLfM9nsbTvEBvCT3qwQA+SIPbvbnE/L2K2tI9riQRPjnpc75oRbY8OtJtPfZC07168M69c7+avhjJh71WD1A9jLSGPEOYWT5k0Bs7rusTvrbPML5iUhK9HDPIvpYIZjzKrmi9DS70PJ+O5D2wXHU+EGR2vArA8zx6cwi+l5rMvcBGZr1yOpk8BEDHPJOjVr3OZ7K9BjGgPVm8l76+F8w8/unPva5pTz4sFAS+zjD8PW64zT3TU6095ZuSvWPxgD5it6q8I3noPXavn76amxe+dWiDPtBB4D2SSFi+jyytvY2BsDwtYjy9iAfTPIqUCD7DzWW9E4OlPV8byb7AzZS9yZU3vd4kNL7Zx8k8u2suPbo/s74aiZ+9mFmQvkZztL3eaT09+j0avpSFlFKUSwBLYIWUSwGFlImMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpR0lFKULg=="
153
  },
154
  "processes": null,
155
  "old_count": 0,
156
  "lr_schedule": {
157
  ":type:": "<class 'function'>",
158
- ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz+UeuFHrhR7hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
159
  },
160
  "n_params": 96
161
  }
 
4
  ":serialized:": "gAWVMAAAAAAAAACMGHNiM19jb250cmliLmFycy5wb2xpY2llc5SMD0FSU0xpbmVhclBvbGljeZSTlC4=",
5
  "__module__": "sb3_contrib.ars.policies",
6
  "__doc__": "\n Linear policy network for ARS.\n\n :param observation_space: The observation space of the environment\n :param action_space: The action space of the environment\n :param with_bias: With or without bias on the output\n :param squash_output: For continuous actions, whether the output is squashed\n or not using a ``tanh()`` function. If not squashed with tanh the output will instead be clipped.\n ",
7
+ "__init__": "<function ARSLinearPolicy.__init__ at 0x000002A5AD53E440>",
8
  "__abstractmethods__": "frozenset()",
9
+ "_abc_impl": "<_abc._abc_data object at 0x000002A5AD545280>"
10
  },
11
  "verbose": 5,
12
  "policy_kwargs": {},
13
+ "num_timesteps": 5029198,
14
  "_total_timesteps": 5000000.0,
15
  "_num_timesteps_at_start": 0,
16
  "seed": null,
17
  "action_noise": null,
18
+ "start_time": 1704129075173670900,
19
  "learning_rate": 0.02,
20
+ "tensorboard_log": "runs/BipedalWalker-v3__ars-BipedalWalker-v3__1__1704129075",
21
  "_last_obs": {
22
  ":type:": "<class 'numpy.ndarray'>",
23
  ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAPly5jdoA9Wzj3QBN7O7J7mPK3A6RtYqt5iu1TvhzrQ3c7HnO/ncqTll0yq3usHUO8Ki8TZzsec7rCmEO4JqhTv8Rok72RCQOwxdmjvQFak7iYm9O/dH2Ttzsec7c7HnO5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsYhpSMAUOUdJRSlC4="
 
33
  "_episode_num": 0,
34
  "use_sde": false,
35
  "sde_sample_freq": -1,
36
+ "_current_progress_remaining": 0.03482660000000004,
37
  "_stats_window_size": 100,
38
  "ep_info_buffer": [
39
  {
40
+ "r": -0.858298,
41
  "l": 1600
42
  },
43
  {
44
+ "r": -2.976511,
45
  "l": 1600
46
  },
47
  {
48
+ "r": -2.287396,
49
  "l": 1600
50
  },
51
  {
52
+ "r": -0.170771,
53
  "l": 1600
54
  },
55
  {
56
+ "r": -3.177175,
57
  "l": 1600
58
  },
59
  {
60
+ "r": -1.321648,
61
  "l": 1600
62
  },
63
  {
64
+ "r": -0.810533,
65
  "l": 1600
66
  },
67
  {
68
+ "r": 1.043323,
69
  "l": 1600
70
  },
71
  {
72
+ "r": -4.461499,
73
  "l": 1600
74
  },
75
  {
76
+ "r": -0.691904,
77
  "l": 1600
78
  },
79
  {
80
+ "r": -0.388016,
81
  "l": 1600
82
  },
83
  {
84
+ "r": -6.926794,
85
  "l": 1600
86
  },
87
  {
88
+ "r": 0.965219,
89
  "l": 1600
90
  },
91
  {
92
+ "r": -1.449291,
93
  "l": 1600
94
  },
95
  {
96
+ "r": -1.782632,
97
  "l": 1600
98
  },
99
  {
100
+ "r": -18.089477,
101
+ "l": 1600
102
+ },
103
+ {
104
+ "r": -0.337723,
105
+ "l": 1600
106
+ },
107
+ {
108
+ "r": -2.969601,
109
+ "l": 1600
110
+ },
111
+ {
112
+ "r": -6.312056,
113
+ "l": 1600
114
+ },
115
+ {
116
+ "r": -4.653198,
117
+ "l": 1600
118
+ },
119
+ {
120
+ "r": -15.871131,
121
+ "l": 1600
122
+ },
123
+ {
124
+ "r": -2.104873,
125
+ "l": 1600
126
+ },
127
+ {
128
+ "r": -0.62008,
129
+ "l": 1600
130
+ },
131
+ {
132
+ "r": -22.682619,
133
+ "l": 1600
134
+ },
135
+ {
136
+ "r": -1.070423,
137
+ "l": 1600
138
+ },
139
+ {
140
+ "r": -0.868259,
141
+ "l": 1600
142
+ },
143
+ {
144
+ "r": -0.100044,
145
+ "l": 1600
146
+ },
147
+ {
148
+ "r": 1.388992,
149
+ "l": 1600
150
+ },
151
+ {
152
+ "r": -0.606481,
153
+ "l": 1600
154
+ },
155
+ {
156
+ "r": 0.13454,
157
+ "l": 1600
158
+ },
159
+ {
160
+ "r": 0.403181,
161
+ "l": 1600
162
+ },
163
+ {
164
+ "r": -6.21947,
165
+ "l": 1600
166
+ },
167
+ {
168
+ "r": -2.612893,
169
+ "l": 1600
170
+ },
171
+ {
172
+ "r": -0.490002,
173
+ "l": 1600
174
+ },
175
+ {
176
+ "r": 0.762088,
177
+ "l": 1600
178
+ },
179
+ {
180
+ "r": -8.212339,
181
+ "l": 1600
182
+ },
183
+ {
184
+ "r": -0.509528,
185
+ "l": 1600
186
+ },
187
+ {
188
+ "r": -6.702586,
189
+ "l": 1600
190
+ },
191
+ {
192
+ "r": -1.102252,
193
+ "l": 1600
194
+ },
195
+ {
196
+ "r": -0.542297,
197
+ "l": 1600
198
+ },
199
+ {
200
+ "r": -2.554229,
201
+ "l": 1600
202
+ },
203
+ {
204
+ "r": 0.288999,
205
+ "l": 1600
206
+ },
207
+ {
208
+ "r": -4.404716,
209
+ "l": 1600
210
+ },
211
+ {
212
+ "r": -1.628192,
213
+ "l": 1600
214
+ },
215
+ {
216
+ "r": -2.45756,
217
+ "l": 1600
218
+ },
219
+ {
220
+ "r": -4.696834,
221
+ "l": 1600
222
+ },
223
+ {
224
+ "r": -1.310907,
225
+ "l": 1600
226
+ },
227
+ {
228
+ "r": -18.882727,
229
+ "l": 1600
230
+ },
231
+ {
232
+ "r": -0.008551,
233
+ "l": 1600
234
+ },
235
+ {
236
+ "r": -123.061934,
237
+ "l": 131
238
+ },
239
+ {
240
+ "r": -1.392482,
241
+ "l": 1600
242
+ },
243
+ {
244
+ "r": -3.201651,
245
+ "l": 1600
246
+ },
247
+ {
248
+ "r": -4.626365,
249
+ "l": 1600
250
+ },
251
+ {
252
+ "r": -1.444375,
253
+ "l": 1600
254
+ },
255
+ {
256
+ "r": -0.352113,
257
+ "l": 1600
258
+ },
259
+ {
260
+ "r": -6.791308,
261
+ "l": 1600
262
+ },
263
+ {
264
+ "r": 0.680932,
265
+ "l": 1600
266
+ },
267
+ {
268
+ "r": 0.12628,
269
+ "l": 1600
270
+ },
271
+ {
272
+ "r": 0.355526,
273
+ "l": 1600
274
+ },
275
+ {
276
+ "r": 0.023249,
277
+ "l": 1600
278
+ },
279
+ {
280
+ "r": -1.837855,
281
+ "l": 1600
282
+ },
283
+ {
284
+ "r": -5.85537,
285
+ "l": 1600
286
+ },
287
+ {
288
+ "r": -14.421578,
289
+ "l": 1600
290
+ },
291
+ {
292
+ "r": -9.505591,
293
+ "l": 1600
294
+ },
295
+ {
296
+ "r": -9.183801,
297
+ "l": 1600
298
+ },
299
+ {
300
+ "r": -3.50715,
301
+ "l": 1600
302
+ },
303
+ {
304
+ "r": -0.847926,
305
+ "l": 1600
306
+ },
307
+ {
308
+ "r": -6.17393,
309
+ "l": 1600
310
+ },
311
+ {
312
+ "r": 1.062936,
313
+ "l": 1600
314
+ },
315
+ {
316
+ "r": -3.119987,
317
+ "l": 1600
318
+ },
319
+ {
320
+ "r": 0.006336,
321
+ "l": 1600
322
+ },
323
+ {
324
+ "r": -1.609798,
325
+ "l": 1600
326
+ },
327
+ {
328
+ "r": 0.511362,
329
+ "l": 1600
330
+ },
331
+ {
332
+ "r": -4.413853,
333
+ "l": 1600
334
+ },
335
+ {
336
+ "r": -0.91934,
337
+ "l": 1600
338
+ },
339
+ {
340
+ "r": -1.349594,
341
+ "l": 1600
342
+ },
343
+ {
344
+ "r": -0.870499,
345
+ "l": 1600
346
+ },
347
+ {
348
+ "r": -2.914988,
349
+ "l": 1600
350
+ },
351
+ {
352
+ "r": -4.91091,
353
+ "l": 1600
354
+ },
355
+ {
356
+ "r": -0.44238,
357
+ "l": 1600
358
+ },
359
+ {
360
+ "r": -27.981295,
361
+ "l": 1600
362
+ },
363
+ {
364
+ "r": 0.837673,
365
+ "l": 1600
366
+ },
367
+ {
368
+ "r": -0.325922,
369
+ "l": 1600
370
+ },
371
+ {
372
+ "r": 0.13985,
373
+ "l": 1600
374
+ },
375
+ {
376
+ "r": -4.315192,
377
+ "l": 1600
378
+ },
379
+ {
380
+ "r": -1.924887,
381
+ "l": 1600
382
+ },
383
+ {
384
+ "r": 0.74766,
385
+ "l": 1600
386
+ },
387
+ {
388
+ "r": -6.121636,
389
+ "l": 1600
390
+ },
391
+ {
392
+ "r": -5.363428,
393
+ "l": 1600
394
+ },
395
+ {
396
+ "r": 0.112126,
397
+ "l": 1600
398
+ },
399
+ {
400
+ "r": -0.011771,
401
+ "l": 1600
402
+ },
403
+ {
404
+ "r": -14.908066,
405
+ "l": 1600
406
+ },
407
+ {
408
+ "r": -9.280963,
409
+ "l": 1600
410
+ },
411
+ {
412
+ "r": -18.198948,
413
+ "l": 1600
414
+ },
415
+ {
416
+ "r": -7.720118,
417
+ "l": 1600
418
+ },
419
+ {
420
+ "r": -1.214567,
421
+ "l": 1600
422
+ },
423
+ {
424
+ "r": -30.454671,
425
+ "l": 1600
426
+ },
427
+ {
428
+ "r": -2.444359,
429
+ "l": 1600
430
+ },
431
+ {
432
+ "r": 0.096511,
433
+ "l": 1600
434
+ },
435
+ {
436
+ "r": -2.322823,
437
+ "l": 1600
438
+ },
439
+ {
440
+ "r": -3.36024,
441
+ "l": 1600
442
+ },
443
+ {
444
+ "r": -3.646635,
445
+ "l": 1600
446
+ },
447
+ {
448
+ "r": -3.357776,
449
+ "l": 1600
450
+ },
451
+ {
452
+ "r": -5.709417,
453
+ "l": 1600
454
+ },
455
+ {
456
+ "r": -2.717113,
457
+ "l": 1600
458
+ },
459
+ {
460
+ "r": -0.683711,
461
+ "l": 1600
462
+ },
463
+ {
464
+ "r": -2.402417,
465
+ "l": 1600
466
+ },
467
+ {
468
+ "r": -8.698189,
469
+ "l": 1600
470
+ },
471
+ {
472
+ "r": -4.708897,
473
+ "l": 1600
474
+ },
475
+ {
476
+ "r": -0.448583,
477
+ "l": 1600
478
+ },
479
+ {
480
+ "r": 0.919555,
481
+ "l": 1600
482
+ },
483
+ {
484
+ "r": -1.297185,
485
+ "l": 1600
486
+ },
487
+ {
488
+ "r": -4.644188,
489
+ "l": 1600
490
+ },
491
+ {
492
+ "r": -8.156213,
493
+ "l": 1600
494
+ },
495
+ {
496
+ "r": -5.759099,
497
+ "l": 1600
498
+ },
499
+ {
500
+ "r": -4.713412,
501
+ "l": 1600
502
+ },
503
+ {
504
+ "r": -3.76554,
505
+ "l": 1600
506
+ },
507
+ {
508
+ "r": -1.336931,
509
+ "l": 1600
510
+ },
511
+ {
512
+ "r": -4.596379,
513
+ "l": 1600
514
+ },
515
+ {
516
+ "r": -15.05301,
517
+ "l": 1600
518
+ },
519
+ {
520
+ "r": -1.604169,
521
+ "l": 1600
522
+ },
523
+ {
524
+ "r": -5.271523,
525
+ "l": 1600
526
+ },
527
+ {
528
+ "r": -0.984733,
529
+ "l": 1600
530
+ },
531
+ {
532
+ "r": -8.165095,
533
+ "l": 1600
534
+ },
535
+ {
536
+ "r": -9.881804,
537
+ "l": 1600
538
+ },
539
+ {
540
+ "r": -1.063293,
541
+ "l": 1600
542
+ },
543
+ {
544
+ "r": 0.720656,
545
+ "l": 1600
546
+ },
547
+ {
548
+ "r": -2.147401,
549
  "l": 1600
550
  }
551
  ],
 
553
  ":type:": "<class 'collections.deque'>",
554
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
555
  },
556
+ "_n_updates": 30,
557
  "observation_space": {
558
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
559
+ ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==",
560
  "dtype": "float32",
561
  "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]",
562
  "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]",
 
571
  },
572
  "action_space": {
573
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
574
+ ":serialized:": "gAWVpwEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=",
575
  "dtype": "float32",
576
  "bounded_below": "[ True True True True]",
577
  "bounded_above": "[ True True True True]",
 
585
  "_np_random": null
586
  },
587
  "n_envs": 1,
588
+ "n_delta": 64,
589
+ "pop_size": 128,
590
  "delta_std_schedule": {
591
  ":type:": "<class 'function'>",
592
+ ":serialized:": "gAWVaAIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMU2M6XFVzZXJzXHByaWNvXC5jb25kYVxlbnZzXEFUTk5cbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLg0MCBAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgMdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB59lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9+uFHrhR64hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
593
  },
594
  "n_eval_episodes": 1,
595
+ "n_top": 32,
596
  "alive_bonus_offset": 0,
597
  "zero_policy": true,
598
  "weights": {
599
  ":type:": "<class 'torch.Tensor'>",
600
+ ":serialized:": "gAWVAAMAAAAAAACMDHRvcmNoLl91dGlsc5SMEl9yZWJ1aWxkX3RlbnNvcl92MpSTlCiMDXRvcmNoLnN0b3JhZ2WUjBBfbG9hZF9mcm9tX2J5dGVzlJOUQnkCAACAAooKbPycRvkgaqhQGS6AAk3pAy6AAn1xAChYEAAAAHByb3RvY29sX3ZlcnNpb25xAU3pA1gNAAAAbGl0dGxlX2VuZGlhbnECiFgKAAAAdHlwZV9zaXplc3EDfXEEKFgFAAAAc2hvcnRxBUsCWAMAAABpbnRxBksEWAQAAABsb25ncQdLBHV1LoACKFgHAAAAc3RvcmFnZXEAY3RvcmNoCkZsb2F0U3RvcmFnZQpxAVgNAAAAMjkxMDU0MzczMzIzMnECWAMAAABjcHVxA0tgTnRxBFEugAJdcQBYDQAAADI5MTA1NDM3MzMyMzJxAWEuYAAAAAAAAABs7mU9nppBvNjTlTp00xm80CoWvT9ExTyyi0i9LqOWvOzZyzwkZAu9qo0pvRgdKL3eeMi8Lk8RvZ1kjTwYJrm8e2QIO60meT3Dh/w8A+3fvPqfBbwpL0k9HZD3OuR7lrxX6+Q8cmzUPKlFH73WXni8ACmnOssWDb2xDES8170dvRgen7lNzzi8r9oLPfEKjDxPXW08aifPu0jGO73BQ+i8yQ4BuxMBcrzoc2i8eQsNPRsDWLx5NCG87nuWPPGc4rz1Lzu8xLddPSgpzzs7X7M7gmBvvVzjJjvFT8S7OLWmvNPESTw00Rc8//SivKqqFz1yLAI9iHFDPWQ1rDxk66+8QB8zvPtKGj3l3V29MAbQvNrudLzJC1e9mI0oPUseAj0TxOk7ln+XPI5o07wCsaM8+PCLPDTBozw0QDI8oB+ovLcst7skdTA8xBAPvWA3yjsMVz+9UrVKvDNPrjvi2aM7Qsk0vVJb7zym4iW9OhpXPNVCvDwhunu7cEWhuj7bC72UhZRSlEsAS2CFlEsBhZSJjAtjb2xsZWN0aW9uc5SMC09yZGVyZWREaWN0lJOUKVKUdJRSlC4="
601
  },
602
  "processes": null,
603
  "old_count": 0,
604
  "lr_schedule": {
605
  ":type:": "<class 'function'>",
606
+ ":serialized:": "gAWVaAIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMU2M6XFVzZXJzXHByaWNvXC5jb25kYVxlbnZzXEFUTk5cbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLg0MCBAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgMdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB59lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz+UeuFHrhR7hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
607
  },
608
  "n_params": 96
609
  }
ars-BipedalWalker-v3/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d7a5cde8c3c85f14a6fc0598369f4ce74bc75fc7d8b8d9bd8ec08048adc065b
3
  size 1756
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:536cf4786f354654abb431796ecc69e665c968f06f19e5bd2cc760c4ab022f6b
3
  size 1756
ars-BipedalWalker-v3/pytorch_variables.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c35cea3b2e60fb5e7e162d3592df775cd400e575a31c72f359fb9e654ab00c5
3
  size 864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb4dde0c1ad63b7740276006a06cc491b21b407ea6c889928c223ec77ddad79f
3
  size 864
ars-BipedalWalker-v3/system_info.txt CHANGED
@@ -1,9 +1,9 @@
1
- - OS: Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023
2
  - Python: 3.10.12
3
  - Stable-Baselines3: 2.2.1
4
- - PyTorch: 2.1.0+cu121
5
  - GPU Enabled: False
6
- - Numpy: 1.23.5
7
- - Cloudpickle: 2.2.1
8
  - Gymnasium: 0.28.1
9
- - OpenAI Gym: 0.25.2
 
1
+ - OS: Windows-10-10.0.22621-SP0 10.0.22621
2
  - Python: 3.10.12
3
  - Stable-Baselines3: 2.2.1
4
+ - PyTorch: 2.1.0
5
  - GPU Enabled: False
6
+ - Numpy: 1.26.0
7
+ - Cloudpickle: 3.0.0
8
  - Gymnasium: 0.28.1
9
+ - OpenAI Gym: 0.21.0
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVMAAAAAAAAACMGHNiM19jb250cmliLmFycy5wb2xpY2llc5SMD0FSU0xpbmVhclBvbGljeZSTlC4=", "__module__": "sb3_contrib.ars.policies", "__doc__": "\n Linear policy network for ARS.\n\n :param observation_space: The observation space of the environment\n :param action_space: The action space of the environment\n :param with_bias: With or without bias on the output\n :param squash_output: For continuous actions, whether the output is squashed\n or not using a ``tanh()`` function. If not squashed with tanh the output will instead be clipped.\n ", "__init__": "<function ARSLinearPolicy.__init__ at 0x7d86d77088b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7d86d76f8d80>"}, "verbose": 5, "policy_kwargs": {}, "num_timesteps": 5017333, "_total_timesteps": 5000000.0, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1704124216615583280, "learning_rate": 0.02, "tensorboard_log": "runs/BipedalWalker-v3__ars-BipedalWalker-v3__1__1704124216", "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAPly5jdoA9Wzj3QBN7O7J7mPK3A6RtYqt5iu1TvhzrQ3c7HnO/ncqTll0yq3usHUO8Ki8TZzsec7rCmEO4JqhTv8Rok72RCQOwxdmjvQFak7iYm9O/dH2Ttzsec7c7HnO5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsYhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdAAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYBAAAAAAAAAAGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwGFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAJsONDvsbia3UUtKOkoSg7y6cbw91nqFupg4XD9TRQ07AACAP+HJBD2WeIW65ZFaPwDMPDoAAIA/YLLhPolC5D6bP+w+U6b6Pva6CD/jOho/yIo1P27MYj8AAIA/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsYhpSMAUOUdJRSlC4="}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.001653400000000027, "_stats_window_size": 100, "ep_info_buffer": [{"r": -22.732791, "l": 1600}, {"r": -26.241545, "l": 1600}, {"r": -21.244826, "l": 1600}, {"r": -18.363228, "l": 1600}, {"r": -21.464579, "l": 1600}, {"r": -19.700786, "l": 1600}, {"r": -20.990937, "l": 1600}, {"r": -20.206168, "l": 1600}, {"r": -13.470986, "l": 1600}, {"r": -22.199595, "l": 1600}, {"r": -16.295752, "l": 1600}, {"r": -18.869419, "l": 1600}, {"r": -24.387612, "l": 1600}, {"r": -21.286163, "l": 1600}, {"r": -30.705473, "l": 1600}, {"r": -19.318436, "l": 1600}], "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 204, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVRgQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBAolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgUSxiFlGgYdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoECiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaApLGIWUaBh0lFKUjARoaWdolGgQKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksYhZRoGHSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "_shape": [24], "low": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "low_repr": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high_repr": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVoQEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgHjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgQKJYEAAAAAAAAAAEBAQGUaBRLBIWUaBh0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgQKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaApLBIWUaBh0lFKUjARoaWdolGgQKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaApLBIWUaBh0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True]", "bounded_above": "[ True True True True]", "_shape": [4], "low": "[-1. -1. -1. -1.]", "high": "[1. 1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 1, "n_delta": 8, "pop_size": 16, "delta_std_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz+pmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "n_eval_episodes": 1, "n_top": 8, "alive_bonus_offset": 0, "zero_policy": true, "weights": {":type:": "<class 'torch.Tensor'>", ":serialized:": "gAWVAgMAAAAAAACMDHRvcmNoLl91dGlsc5SMEl9yZWJ1aWxkX3RlbnNvcl92MpSTlCiMDXRvcmNoLnN0b3JhZ2WUjBBfbG9hZF9mcm9tX2J5dGVzlJOUQnsCAACAAooKbPycRvkgaqhQGS6AAk3pAy6AAn1xAChYEAAAAHByb3RvY29sX3ZlcnNpb25xAU3pA1gNAAAAbGl0dGxlX2VuZGlhbnECiFgKAAAAdHlwZV9zaXplc3EDfXEEKFgFAAAAc2hvcnRxBUsCWAMAAABpbnRxBksEWAQAAABsb25ncQdLBHV1LoACKFgHAAAAc3RvcmFnZXEAY3RvcmNoCkZsb2F0U3RvcmFnZQpxAVgOAAAAOTk2NjU2MDUyNTg2MjRxAlgDAAAAY3B1cQNLYE50cQRRLoACXXEAWA4AAAA5OTY2NTYwNTI1ODYyNHEBYS5gAAAAAAAAAAQaDj6YWpU9OgUCPfIel7wf7EK+rywhPqHHS7zskpW8vvVnPHS9Gjz+vwW7YrKNPlU0bL5ijmK99taAPJd0C75QJBi+fNQWPk/lF76PxZm+pwxivRBW8L3KLfM9nsbTvEBvCT3qwQA+SIPbvbnE/L2K2tI9riQRPjnpc75oRbY8OtJtPfZC07168M69c7+avhjJh71WD1A9jLSGPEOYWT5k0Bs7rusTvrbPML5iUhK9HDPIvpYIZjzKrmi9DS70PJ+O5D2wXHU+EGR2vArA8zx6cwi+l5rMvcBGZr1yOpk8BEDHPJOjVr3OZ7K9BjGgPVm8l76+F8w8/unPva5pTz4sFAS+zjD8PW64zT3TU6095ZuSvWPxgD5it6q8I3noPXavn76amxe+dWiDPtBB4D2SSFi+jyytvY2BsDwtYjy9iAfTPIqUCD7DzWW9E4OlPV8byb7AzZS9yZU3vd4kNL7Zx8k8u2suPbo/s74aiZ+9mFmQvkZztL3eaT09+j0avpSFlFKUSwBLYIWUSwGFlImMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpR0lFKULg=="}, "processes": null, "old_count": 0, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuDQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz+UeuFHrhR7hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "n_params": 96, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.2.1", "PyTorch": "2.1.0+cu121", "GPU Enabled": "False", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVMAAAAAAAAACMGHNiM19jb250cmliLmFycy5wb2xpY2llc5SMD0FSU0xpbmVhclBvbGljeZSTlC4=", "__module__": "sb3_contrib.ars.policies", "__doc__": "\n Linear policy network for ARS.\n\n :param observation_space: The observation space of the environment\n :param action_space: The action space of the environment\n :param with_bias: With or without bias on the output\n :param squash_output: For continuous actions, whether the output is squashed\n or not using a ``tanh()`` function. If not squashed with tanh the output will instead be clipped.\n ", "__init__": "<function ARSLinearPolicy.__init__ at 0x000002A5AD53E440>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x000002A5AD545280>"}, "verbose": 5, "policy_kwargs": {}, "num_timesteps": 5029198, "_total_timesteps": 5000000.0, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1704129075173670900, "learning_rate": 0.02, "tensorboard_log": "runs/BipedalWalker-v3__ars-BipedalWalker-v3__1__1704129075", "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAPly5jdoA9Wzj3QBN7O7J7mPK3A6RtYqt5iu1TvhzrQ3c7HnO/ncqTll0yq3usHUO8Ki8TZzsec7rCmEO4JqhTv8Rok72RCQOwxdmjvQFak7iYm9O/dH2Ttzsec7c7HnO5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsYhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdAAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYBAAAAAAAAAAGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwGFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAJsONDvsbia3UUtKOkoSg7y6cbw91nqFupg4XD9TRQ07AACAP+HJBD2WeIW65ZFaPwDMPDoAAIA/YLLhPolC5D6bP+w+U6b6Pva6CD/jOho/yIo1P27MYj8AAIA/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsYhpSMAUOUdJRSlC4="}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.03482660000000004, "_stats_window_size": 100, "ep_info_buffer": [{"r": -0.858298, "l": 1600}, {"r": -2.976511, "l": 1600}, {"r": -2.287396, "l": 1600}, {"r": -0.170771, "l": 1600}, {"r": -3.177175, "l": 1600}, {"r": -1.321648, "l": 1600}, {"r": -0.810533, "l": 1600}, {"r": 1.043323, "l": 1600}, {"r": -4.461499, "l": 1600}, {"r": -0.691904, "l": 1600}, {"r": -0.388016, "l": 1600}, {"r": -6.926794, "l": 1600}, {"r": 0.965219, "l": 1600}, {"r": -1.449291, "l": 1600}, {"r": -1.782632, "l": 1600}, {"r": -18.089477, "l": 1600}, {"r": -0.337723, "l": 1600}, {"r": -2.969601, "l": 1600}, {"r": -6.312056, "l": 1600}, {"r": -4.653198, "l": 1600}, {"r": -15.871131, "l": 1600}, {"r": -2.104873, "l": 1600}, {"r": -0.62008, "l": 1600}, {"r": -22.682619, "l": 1600}, {"r": -1.070423, "l": 1600}, {"r": -0.868259, "l": 1600}, {"r": -0.100044, "l": 1600}, {"r": 1.388992, "l": 1600}, {"r": -0.606481, "l": 1600}, {"r": 0.13454, "l": 1600}, {"r": 0.403181, "l": 1600}, {"r": -6.21947, "l": 1600}, {"r": -2.612893, "l": 1600}, {"r": -0.490002, "l": 1600}, {"r": 0.762088, "l": 1600}, {"r": -8.212339, "l": 1600}, {"r": -0.509528, "l": 1600}, {"r": -6.702586, "l": 1600}, {"r": -1.102252, "l": 1600}, {"r": -0.542297, "l": 1600}, {"r": -2.554229, "l": 1600}, {"r": 0.288999, "l": 1600}, {"r": -4.404716, "l": 1600}, {"r": -1.628192, "l": 1600}, {"r": -2.45756, "l": 1600}, {"r": -4.696834, "l": 1600}, {"r": -1.310907, "l": 1600}, {"r": -18.882727, "l": 1600}, {"r": -0.008551, "l": 1600}, {"r": -123.061934, "l": 131}, {"r": -1.392482, "l": 1600}, {"r": -3.201651, "l": 1600}, {"r": -4.626365, "l": 1600}, {"r": -1.444375, "l": 1600}, {"r": -0.352113, "l": 1600}, {"r": -6.791308, "l": 1600}, {"r": 0.680932, "l": 1600}, {"r": 0.12628, "l": 1600}, {"r": 0.355526, "l": 1600}, {"r": 0.023249, "l": 1600}, {"r": -1.837855, "l": 1600}, {"r": -5.85537, "l": 1600}, {"r": -14.421578, "l": 1600}, {"r": -9.505591, "l": 1600}, {"r": -9.183801, "l": 1600}, {"r": -3.50715, "l": 1600}, {"r": -0.847926, "l": 1600}, {"r": -6.17393, "l": 1600}, {"r": 1.062936, "l": 1600}, {"r": -3.119987, "l": 1600}, {"r": 0.006336, "l": 1600}, {"r": -1.609798, "l": 1600}, {"r": 0.511362, "l": 1600}, {"r": -4.413853, "l": 1600}, {"r": -0.91934, "l": 1600}, {"r": -1.349594, "l": 1600}, {"r": -0.870499, "l": 1600}, {"r": -2.914988, "l": 1600}, {"r": -4.91091, "l": 1600}, {"r": -0.44238, "l": 1600}, {"r": -27.981295, "l": 1600}, {"r": 0.837673, "l": 1600}, {"r": -0.325922, "l": 1600}, {"r": 0.13985, "l": 1600}, {"r": -4.315192, "l": 1600}, {"r": -1.924887, "l": 1600}, {"r": 0.74766, "l": 1600}, {"r": -6.121636, "l": 1600}, {"r": -5.363428, "l": 1600}, {"r": 0.112126, "l": 1600}, {"r": -0.011771, "l": 1600}, {"r": -14.908066, "l": 1600}, {"r": -9.280963, "l": 1600}, {"r": -18.198948, "l": 1600}, {"r": -7.720118, "l": 1600}, {"r": -1.214567, "l": 1600}, {"r": -30.454671, "l": 1600}, {"r": -2.444359, "l": 1600}, {"r": 0.096511, "l": 1600}, {"r": -2.322823, "l": 1600}, {"r": -3.36024, "l": 1600}, {"r": -3.646635, "l": 1600}, {"r": -3.357776, "l": 1600}, {"r": -5.709417, "l": 1600}, {"r": -2.717113, "l": 1600}, {"r": -0.683711, "l": 1600}, {"r": -2.402417, "l": 1600}, {"r": -8.698189, "l": 1600}, {"r": -4.708897, "l": 1600}, {"r": -0.448583, "l": 1600}, {"r": 0.919555, "l": 1600}, {"r": -1.297185, "l": 1600}, {"r": -4.644188, "l": 1600}, {"r": -8.156213, "l": 1600}, {"r": -5.759099, "l": 1600}, {"r": -4.713412, "l": 1600}, {"r": -3.76554, "l": 1600}, {"r": -1.336931, "l": 1600}, {"r": -4.596379, "l": 1600}, {"r": -15.05301, "l": 1600}, {"r": -1.604169, "l": 1600}, {"r": -5.271523, "l": 1600}, {"r": -0.984733, "l": 1600}, {"r": -8.165095, "l": 1600}, {"r": -9.881804, "l": 1600}, {"r": -1.063293, "l": 1600}, {"r": 0.720656, "l": 1600}, {"r": -2.147401, "l": 1600}], "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 30, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "_shape": [24], "low": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "low_repr": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high_repr": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVpwEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True]", "bounded_above": "[ True True True True]", "_shape": [4], "low": "[-1. -1. -1. -1.]", "high": "[1. 1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 1, "n_delta": 64, "pop_size": 128, "delta_std_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVaAIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMU2M6XFVzZXJzXHByaWNvXC5jb25kYVxlbnZzXEFUTk5cbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLg0MCBAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgMdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB59lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9+uFHrhR64hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "n_eval_episodes": 1, "n_top": 32, "alive_bonus_offset": 0, "zero_policy": true, "weights": {":type:": "<class 'torch.Tensor'>", ":serialized:": "gAWVAAMAAAAAAACMDHRvcmNoLl91dGlsc5SMEl9yZWJ1aWxkX3RlbnNvcl92MpSTlCiMDXRvcmNoLnN0b3JhZ2WUjBBfbG9hZF9mcm9tX2J5dGVzlJOUQnkCAACAAooKbPycRvkgaqhQGS6AAk3pAy6AAn1xAChYEAAAAHByb3RvY29sX3ZlcnNpb25xAU3pA1gNAAAAbGl0dGxlX2VuZGlhbnECiFgKAAAAdHlwZV9zaXplc3EDfXEEKFgFAAAAc2hvcnRxBUsCWAMAAABpbnRxBksEWAQAAABsb25ncQdLBHV1LoACKFgHAAAAc3RvcmFnZXEAY3RvcmNoCkZsb2F0U3RvcmFnZQpxAVgNAAAAMjkxMDU0MzczMzIzMnECWAMAAABjcHVxA0tgTnRxBFEugAJdcQBYDQAAADI5MTA1NDM3MzMyMzJxAWEuYAAAAAAAAABs7mU9nppBvNjTlTp00xm80CoWvT9ExTyyi0i9LqOWvOzZyzwkZAu9qo0pvRgdKL3eeMi8Lk8RvZ1kjTwYJrm8e2QIO60meT3Dh/w8A+3fvPqfBbwpL0k9HZD3OuR7lrxX6+Q8cmzUPKlFH73WXni8ACmnOssWDb2xDES8170dvRgen7lNzzi8r9oLPfEKjDxPXW08aifPu0jGO73BQ+i8yQ4BuxMBcrzoc2i8eQsNPRsDWLx5NCG87nuWPPGc4rz1Lzu8xLddPSgpzzs7X7M7gmBvvVzjJjvFT8S7OLWmvNPESTw00Rc8//SivKqqFz1yLAI9iHFDPWQ1rDxk66+8QB8zvPtKGj3l3V29MAbQvNrudLzJC1e9mI0oPUseAj0TxOk7ln+XPI5o07wCsaM8+PCLPDTBozw0QDI8oB+ovLcst7skdTA8xBAPvWA3yjsMVz+9UrVKvDNPrjvi2aM7Qsk0vVJb7zym4iW9OhpXPNVCvDwhunu7cEWhuj7bC72UhZRSlEsAS2CFlEsBhZSJjAtjb2xsZWN0aW9uc5SMC09yZGVyZWREaWN0lJOUKVKUdJRSlC4="}, "processes": null, "old_count": 0, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVaAIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMU2M6XFVzZXJzXHByaWNvXC5jb25kYVxlbnZzXEFUTk5cbGliXHNpdGUtcGFja2FnZXNcc3RhYmxlX2Jhc2VsaW5lczNcY29tbW9uXHV0aWxzLnB5lIwEZnVuY5RLg0MCBAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flGgMdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB59lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz+UeuFHrhR7hZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "n_params": 96, "system_info": {"OS": "Windows-10-10.0.22621-SP0 10.0.22621", "Python": "3.10.12", "Stable-Baselines3": "2.2.1", "PyTorch": "2.1.0", "GPU Enabled": "False", "Numpy": "1.26.0", "Cloudpickle": "3.0.0", "Gymnasium": "0.28.1", "OpenAI Gym": "0.21.0"}}
logs/ARS_1/events.out.tfevents.1704129075.Thunder.26964.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ab4d296dc68944ee9d5ca1966d1d60c10f3dc8f7de8963abf6c35743db93a21
3
+ size 11990
logs/events.out.tfevents.1704129075.Thunder.26964.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c327a94facd4fa2b4d44521bc5146804c810dd16c7d330f462a83133eee3cc5
3
+ size 442
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -16.4242839, "std_reward": 2.5229827956590767, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-01-01T16:56:59.156856"}
 
1
+ {"mean_reward": -1.5756027, "std_reward": 1.2588001104043525, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-01-01T20:04:57.487335"}
vec_normalize.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e579a8c9b1bdf935fda91493ac1d7640426df8e94a8321d8eff91bb7fa1c41bb
3
  size 2665
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83a032c2f731760c92da8e27ba6221738fa716632f9b560bd24b7d0efb3babb8
3
  size 2665