first push
Browse files- Pyramids-1000068.onnx +3 -0
- Pyramids-1000068.pt +3 -0
- Pyramids-499974.onnx +3 -0
- Pyramids-499974.pt +3 -0
- Pyramids-999940.onnx +3 -0
- Pyramids-999940.pt +3 -0
- README.md +35 -0
- checkpoint.pt +3 -0
- config.json +1 -0
- configuration.yaml +10 -0
- events.out.tfevents.1739820732.1a30e00be6d1.373.0 +3 -0
Pyramids-1000068.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea1df536782253ab3a1add50927a82f81c0861283b30cf24ecb1de8f8cab16bd
|
3 |
+
size 1420238
|
Pyramids-1000068.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29dab52f6e56f12a18fe387a5c440f16e66a21dcb34bf0799fb6db61172333bf
|
3 |
+
size 8656252
|
Pyramids-499974.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed083c5cefd5dae32b76633bac18b630d25d6e3c426f12588f0d71c65a62cc88
|
3 |
+
size 1420238
|
Pyramids-499974.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b5060afb169b3f5a55696e6da25d4b617f8649e1f2328fbfd158845a67304da
|
3 |
+
size 8656173
|
Pyramids-999940.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea1df536782253ab3a1add50927a82f81c0861283b30cf24ecb1de8f8cab16bd
|
3 |
+
size 1420238
|
Pyramids-999940.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2703770c3f00e676cc605e3b977c38bdc179f0327183ff7edd5fb0257822be4
|
3 |
+
size 8656173
|
README.md
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: ml-agents
|
3 |
+
tags:
|
4 |
+
- PyramidsRND
|
5 |
+
- deep-reinforcement-learning
|
6 |
+
- reinforcement-learning
|
7 |
+
- ML-Agents-PyramidsRND
|
8 |
+
---
|
9 |
+
|
10 |
+
# **ppo** Agent playing **PyramidsRND**
|
11 |
+
This is a trained model of a **ppo** agent playing **PyramidsRND**
|
12 |
+
using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
|
13 |
+
|
14 |
+
## Usage (with ML-Agents)
|
15 |
+
The Documentation: https://unity-technologies.github.io/ml-agents/ML-Agents-Toolkit-Documentation/
|
16 |
+
|
17 |
+
We wrote complete tutorials that teach you how to train your first agent using ML-Agents and publish it to the Hub:
|
18 |
+
- A *short tutorial* where you teach Huggy the Dog 🐶 to fetch the stick and then play with him directly in your
|
19 |
+
browser: https://huggingface.co/learn/deep-rl-course/unitbonus1/introduction
|
20 |
+
- A *longer tutorial* to understand how ML-Agents works:
|
21 |
+
https://huggingface.co/learn/deep-rl-course/unit5/introduction
|
22 |
+
|
23 |
+
### Resume the training
|
24 |
+
```bash
|
25 |
+
mlagents-learn <your_configuration_file_path.yaml> --run-id=<run_id> --resume
|
26 |
+
```
|
27 |
+
|
28 |
+
### Watch your Agent play
|
29 |
+
You can watch your agent **playing directly in your browser**:
|
30 |
+
|
31 |
+
1. If the environment is part of ML-Agents official environments, go to https://huggingface.co/unity
|
32 |
+
2. Step 1: Find your model_id: AE1999/RND-Pyramids
|
33 |
+
3. Step 2: Select your `*.nn` / `*.onnx` file
|
34 |
+
4. Click on Watch the agent play 👀
|
35 |
+
|
checkpoint.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c25789e09687ea625f832829fcd92f086c0d75e4348025f4c0b0e32fbb78c0b8
|
3 |
+
size 8655778
|
config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"behaviors": {"PyramidsRND": {"batch_size": 128, "buffer_size": 4096, "gamma": 0.99, "hidden_units": 256, "learning_rate": 0.0003, "max_steps": 1000000, "num_layers": 2, "trainer_type": "ppo"}}}
|
configuration.yaml
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
behaviors:
|
2 |
+
PyramidsRND:
|
3 |
+
batch_size: 128
|
4 |
+
buffer_size: 4096
|
5 |
+
gamma: 0.99
|
6 |
+
hidden_units: 256
|
7 |
+
learning_rate: 0.0003
|
8 |
+
max_steps: 1000000
|
9 |
+
num_layers: 2
|
10 |
+
trainer_type: ppo
|
events.out.tfevents.1739820732.1a30e00be6d1.373.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:772a39dbf76cf1e8267bda82e8763633ed1304de7eb31bf75f8c6f2ce75e2aec
|
3 |
+
size 323470
|