pushing model
Browse files- .gitattributes +4 -0
- README.md +4 -4
- events.out.tfevents.1700810722.4090-171.1712170.0 → events.out.tfevents.1702935427.4090-171.242716.0 +2 -2
- ppo_fix_continuous_action.cleanrl_model +0 -0
- ppo_fix_continuous_action.py +1 -1
- replay.mp4 +0 -0
- videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1700810722-eval/rl-video-episode-1.mp4 +0 -0
- videos/{HalfCheetah-v4__ppo_fix_continuous_action__2__1700810722-eval → HalfCheetah-v4__ppo_fix_continuous_action__2__1702935419-eval}/rl-video-episode-0.mp4 +2 -2
- videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1702935419-eval/rl-video-episode-1.mp4 +3 -0
- videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1702935419-eval/rl-video-episode-8.mp4 +3 -0
.gitattributes
CHANGED
|
@@ -34,3 +34,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1700810722-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1700810722-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1702935419-eval/rl-video-episode-8.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1702935419-eval/rl-video-episode-1.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1702935419-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
replay.mp4 filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
|
@@ -16,7 +16,7 @@ model-index:
|
|
| 16 |
type: HalfCheetah-v4
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
-
value:
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
@@ -46,7 +46,7 @@ curl -OL https://huggingface.co/sdpkjc/HalfCheetah-v4-ppo_fix_continuous_action-
|
|
| 46 |
curl -OL https://huggingface.co/sdpkjc/HalfCheetah-v4-ppo_fix_continuous_action-seed2/raw/main/pyproject.toml
|
| 47 |
curl -OL https://huggingface.co/sdpkjc/HalfCheetah-v4-ppo_fix_continuous_action-seed2/raw/main/poetry.lock
|
| 48 |
poetry install --all-extras
|
| 49 |
-
python ppo_fix_continuous_action.py --save-model --hf-entity sdpkjc --
|
| 50 |
```
|
| 51 |
|
| 52 |
# Hyperparameters
|
|
@@ -74,8 +74,8 @@ python ppo_fix_continuous_action.py --save-model --hf-entity sdpkjc --seed 2 --t
|
|
| 74 |
'seed': 2,
|
| 75 |
'target_kl': None,
|
| 76 |
'torch_deterministic': True,
|
| 77 |
-
'total_timesteps':
|
| 78 |
-
'track':
|
| 79 |
'update_epochs': 10,
|
| 80 |
'upload_model': True,
|
| 81 |
'vf_coef': 0.5,
|
|
|
|
| 16 |
type: HalfCheetah-v4
|
| 17 |
metrics:
|
| 18 |
- type: mean_reward
|
| 19 |
+
value: 1638.41 +/- 53.59
|
| 20 |
name: mean_reward
|
| 21 |
verified: false
|
| 22 |
---
|
|
|
|
| 46 |
curl -OL https://huggingface.co/sdpkjc/HalfCheetah-v4-ppo_fix_continuous_action-seed2/raw/main/pyproject.toml
|
| 47 |
curl -OL https://huggingface.co/sdpkjc/HalfCheetah-v4-ppo_fix_continuous_action-seed2/raw/main/poetry.lock
|
| 48 |
poetry install --all-extras
|
| 49 |
+
python ppo_fix_continuous_action.py --save-model --upload-model --hf-entity sdpkjc --env-id HalfCheetah-v4 --seed 2 --track
|
| 50 |
```
|
| 51 |
|
| 52 |
# Hyperparameters
|
|
|
|
| 74 |
'seed': 2,
|
| 75 |
'target_kl': None,
|
| 76 |
'torch_deterministic': True,
|
| 77 |
+
'total_timesteps': 1000000,
|
| 78 |
+
'track': True,
|
| 79 |
'update_epochs': 10,
|
| 80 |
'upload_model': True,
|
| 81 |
'vf_coef': 0.5,
|
events.out.tfevents.1700810722.4090-171.1712170.0 → events.out.tfevents.1702935427.4090-171.242716.0
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95b0415c5b036980a987167a7055f8806f89b5c561741e8b8fde7298899f115d
|
| 3 |
+
size 376394
|
ppo_fix_continuous_action.cleanrl_model
CHANGED
|
Binary files a/ppo_fix_continuous_action.cleanrl_model and b/ppo_fix_continuous_action.cleanrl_model differ
|
|
|
ppo_fix_continuous_action.py
CHANGED
|
@@ -553,7 +553,7 @@ if __name__ == "__main__":
|
|
| 553 |
model_path,
|
| 554 |
make_eval_env,
|
| 555 |
args.env_id,
|
| 556 |
-
eval_episodes=
|
| 557 |
run_name=f"{run_name}-eval",
|
| 558 |
Model=Agent,
|
| 559 |
device=device,
|
|
|
|
| 553 |
model_path,
|
| 554 |
make_eval_env,
|
| 555 |
args.env_id,
|
| 556 |
+
eval_episodes=10,
|
| 557 |
run_name=f"{run_name}-eval",
|
| 558 |
Model=Agent,
|
| 559 |
device=device,
|
replay.mp4
CHANGED
|
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
|
videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1700810722-eval/rl-video-episode-1.mp4
DELETED
|
Binary file (6.54 kB)
|
|
|
videos/{HalfCheetah-v4__ppo_fix_continuous_action__2__1700810722-eval → HalfCheetah-v4__ppo_fix_continuous_action__2__1702935419-eval}/rl-video-episode-0.mp4
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08ff8568028087117e82b4a7c6141746d34506374f6f612b2f3101cd3ddd20c9
|
| 3 |
+
size 2037579
|
videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1702935419-eval/rl-video-episode-1.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8be8fe5f9debe2828337c6cb72360d2f61252726db87bcc26c14fd70b18e0ae
|
| 3 |
+
size 2086772
|
videos/HalfCheetah-v4__ppo_fix_continuous_action__2__1702935419-eval/rl-video-episode-8.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e43e954d9cc8290cc6d76be2c7797a0f66b9fb9f5ecd8581bcbd4fb35faf4170
|
| 3 |
+
size 2157054
|