Upload folder using huggingface_hub
Browse files
- .hydra/config.yaml +160 -0
- .hydra/hydra.yaml +160 -0
- .hydra/overrides.yaml +3 -0
- checkpoints/005000/pretrained_model/README.md +12 -0
- checkpoints/005000/pretrained_model/config.json +55 -0
- checkpoints/005000/pretrained_model/config.yaml +248 -0
- checkpoints/005000/pretrained_model/model.safetensors +3 -0
- checkpoints/005000/training_state.pth +3 -0
- default.log +0 -0
- wandb/debug-internal.log +16 -0
- wandb/debug.log +25 -0
- wandb/run-20241206_222830-bwwpk9vl/files/config.yaml +194 -0
- wandb/run-20241206_222830-bwwpk9vl/files/output.log +46 -0
- wandb/run-20241206_222830-bwwpk9vl/files/requirements.txt +129 -0
- wandb/run-20241206_222830-bwwpk9vl/files/wandb-metadata.json +48 -0
- wandb/run-20241206_222830-bwwpk9vl/files/wandb-summary.json +1 -0
- wandb/run-20241206_222830-bwwpk9vl/logs/debug-core.log +15 -0
- wandb/run-20241206_222830-bwwpk9vl/logs/debug-internal.log +16 -0
- wandb/run-20241206_222830-bwwpk9vl/logs/debug.log +24 -0
- wandb/run-20241206_222830-bwwpk9vl/run-bwwpk9vl.wandb +0 -0
- wandb/run-20241207_010636-bwwpk9vl/files/config.yaml +296 -0
- wandb/run-20241207_010636-bwwpk9vl/files/output.log +28 -0
- wandb/run-20241207_010636-bwwpk9vl/files/requirements.txt +129 -0
- wandb/run-20241207_010636-bwwpk9vl/files/wandb-metadata.json +52 -0
- wandb/run-20241207_010636-bwwpk9vl/files/wandb-summary.json +1 -0
- wandb/run-20241207_010636-bwwpk9vl/logs/debug-core.log +14 -0
- wandb/run-20241207_010636-bwwpk9vl/logs/debug-internal.log +16 -0
- wandb/run-20241207_010636-bwwpk9vl/logs/debug.log +25 -0
- wandb/run-20241207_010636-bwwpk9vl/run-bwwpk9vl.wandb +0 -0
- wandb/run-20241207_010741-bwwpk9vl/files/config.yaml +296 -0
- wandb/run-20241207_010741-bwwpk9vl/files/output.log +28 -0
- wandb/run-20241207_010741-bwwpk9vl/files/requirements.txt +129 -0
- wandb/run-20241207_010741-bwwpk9vl/files/wandb-metadata.json +49 -0
- wandb/run-20241207_010741-bwwpk9vl/files/wandb-summary.json +1 -0
- wandb/run-20241207_010741-bwwpk9vl/logs/debug-core.log +14 -0
- wandb/run-20241207_010741-bwwpk9vl/logs/debug-internal.log +16 -0
- wandb/run-20241207_010741-bwwpk9vl/logs/debug.log +25 -0
- wandb/run-20241207_010741-bwwpk9vl/run-bwwpk9vl.wandb +0 -0
.hydra/config.yaml
ADDED
@@ -0,0 +1,160 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
resume: true
|
2 |
+
device: cuda
|
3 |
+
use_amp: false
|
4 |
+
seed: 100000
|
5 |
+
dataset_repo_id: HumanoidTeam/aloha_real_test
|
6 |
+
video_backend: pyav
|
7 |
+
training:
|
8 |
+
offline_steps: 5010
|
9 |
+
num_workers: 8
|
10 |
+
batch_size: 64
|
11 |
+
eval_freq: 25000
|
12 |
+
log_freq: 200
|
13 |
+
save_checkpoint: true
|
14 |
+
save_freq: 25000
|
15 |
+
online_steps: 0
|
16 |
+
online_rollout_n_episodes: 1
|
17 |
+
online_rollout_batch_size: 1
|
18 |
+
online_steps_between_rollouts: 1
|
19 |
+
online_sampling_ratio: 0.5
|
20 |
+
online_env_seed: null
|
21 |
+
online_buffer_capacity: null
|
22 |
+
online_buffer_seed_size: 0
|
23 |
+
do_online_rollout_async: false
|
24 |
+
image_transforms:
|
25 |
+
enable: false
|
26 |
+
max_num_transforms: 3
|
27 |
+
random_order: false
|
28 |
+
brightness:
|
29 |
+
weight: 1
|
30 |
+
min_max:
|
31 |
+
- 0.8
|
32 |
+
- 1.2
|
33 |
+
contrast:
|
34 |
+
weight: 1
|
35 |
+
min_max:
|
36 |
+
- 0.8
|
37 |
+
- 1.2
|
38 |
+
saturation:
|
39 |
+
weight: 1
|
40 |
+
min_max:
|
41 |
+
- 0.5
|
42 |
+
- 1.5
|
43 |
+
hue:
|
44 |
+
weight: 1
|
45 |
+
min_max:
|
46 |
+
- -0.05
|
47 |
+
- 0.05
|
48 |
+
sharpness:
|
49 |
+
weight: 1
|
50 |
+
min_max:
|
51 |
+
- 0.8
|
52 |
+
- 1.2
|
53 |
+
grad_clip_norm: 10
|
54 |
+
lr: 0.0001
|
55 |
+
lr_scheduler: cosine
|
56 |
+
lr_warmup_steps: 500
|
57 |
+
adam_betas:
|
58 |
+
- 0.95
|
59 |
+
- 0.999
|
60 |
+
adam_eps: 1.0e-08
|
61 |
+
adam_weight_decay: 1.0e-06
|
62 |
+
delta_timestamps:
|
63 |
+
observation.image: '[i / ${fps} for i in range(1 - ${policy.n_obs_steps}, 1)]'
|
64 |
+
observation.state: '[i / ${fps} for i in range(1 - ${policy.n_obs_steps}, 1)]'
|
65 |
+
action: '[i / ${fps} for i in range(1 - ${policy.n_obs_steps}, 1 - ${policy.n_obs_steps}
|
66 |
+
+ ${policy.horizon})]'
|
67 |
+
drop_n_last_frames: 7
|
68 |
+
eval:
|
69 |
+
n_episodes: 50
|
70 |
+
batch_size: 50
|
71 |
+
use_async_envs: false
|
72 |
+
wandb:
|
73 |
+
enable: true
|
74 |
+
disable_artifact: false
|
75 |
+
project: lerobot_real_aloha
|
76 |
+
notes: ws-lerobot-hackathon
|
77 |
+
fps: 10
|
78 |
+
env:
|
79 |
+
name: pusht
|
80 |
+
task: PushT-v0
|
81 |
+
image_size: 96
|
82 |
+
state_dim: 2
|
83 |
+
action_dim: 2
|
84 |
+
fps: ${fps}
|
85 |
+
episode_length: 300
|
86 |
+
gym:
|
87 |
+
obs_type: pixels_agent_pos
|
88 |
+
render_mode: rgb_array
|
89 |
+
visualization_width: 384
|
90 |
+
visualization_height: 384
|
91 |
+
override_dataset_stats:
|
92 |
+
observation.image:
|
93 |
+
mean:
|
94 |
+
- - - 0.5
|
95 |
+
- - - 0.5
|
96 |
+
- - - 0.5
|
97 |
+
std:
|
98 |
+
- - - 0.5
|
99 |
+
- - - 0.5
|
100 |
+
- - - 0.5
|
101 |
+
observation.state:
|
102 |
+
min:
|
103 |
+
- 13.456424
|
104 |
+
- 32.938293
|
105 |
+
max:
|
106 |
+
- 496.14618
|
107 |
+
- 510.9579
|
108 |
+
action:
|
109 |
+
min:
|
110 |
+
- 12.0
|
111 |
+
- 25.0
|
112 |
+
max:
|
113 |
+
- 511.0
|
114 |
+
- 511.0
|
115 |
+
policy:
|
116 |
+
name: diffusion
|
117 |
+
n_obs_steps: 2
|
118 |
+
horizon: 16
|
119 |
+
n_action_steps: 8
|
120 |
+
input_shapes:
|
121 |
+
observation.image:
|
122 |
+
- 3
|
123 |
+
- 96
|
124 |
+
- 96
|
125 |
+
observation.state:
|
126 |
+
- ${env.state_dim}
|
127 |
+
output_shapes:
|
128 |
+
action:
|
129 |
+
- ${env.action_dim}
|
130 |
+
input_normalization_modes:
|
131 |
+
observation.image: mean_std
|
132 |
+
observation.state: min_max
|
133 |
+
output_normalization_modes:
|
134 |
+
action: min_max
|
135 |
+
vision_backbone: resnet18
|
136 |
+
crop_shape:
|
137 |
+
- 84
|
138 |
+
- 84
|
139 |
+
crop_is_random: true
|
140 |
+
pretrained_backbone_weights: null
|
141 |
+
use_group_norm: true
|
142 |
+
spatial_softmax_num_keypoints: 32
|
143 |
+
down_dims:
|
144 |
+
- 512
|
145 |
+
- 1024
|
146 |
+
- 2048
|
147 |
+
kernel_size: 5
|
148 |
+
n_groups: 8
|
149 |
+
diffusion_step_embed_dim: 128
|
150 |
+
use_film_scale_modulation: true
|
151 |
+
noise_scheduler_type: DDPM
|
152 |
+
num_train_timesteps: 100
|
153 |
+
beta_schedule: squaredcos_cap_v2
|
154 |
+
beta_start: 0.0001
|
155 |
+
beta_end: 0.02
|
156 |
+
prediction_type: epsilon
|
157 |
+
clip_sample: true
|
158 |
+
clip_sample_range: 1.0
|
159 |
+
num_inference_steps: null
|
160 |
+
do_mask_loss_for_padding: false
|
.hydra/hydra.yaml
ADDED
@@ -0,0 +1,160 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
hydra:
|
2 |
+
run:
|
3 |
+
dir: outputs/train/2024-12-06/22-28-29_real_world_act_default
|
4 |
+
sweep:
|
5 |
+
dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
|
6 |
+
subdir: ${hydra.job.num}
|
7 |
+
launcher:
|
8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
9 |
+
sweeper:
|
10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
11 |
+
max_batch_size: null
|
12 |
+
params: null
|
13 |
+
help:
|
14 |
+
app_name: ${hydra.job.name}
|
15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
16 |
+
|
17 |
+
'
|
18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
19 |
+
|
20 |
+
Use --hydra-help to view Hydra specific help
|
21 |
+
|
22 |
+
'
|
23 |
+
template: '${hydra.help.header}
|
24 |
+
|
25 |
+
== Configuration groups ==
|
26 |
+
|
27 |
+
Compose your configuration from those groups (group=option)
|
28 |
+
|
29 |
+
|
30 |
+
$APP_CONFIG_GROUPS
|
31 |
+
|
32 |
+
|
33 |
+
== Config ==
|
34 |
+
|
35 |
+
Override anything in the config (foo.bar=value)
|
36 |
+
|
37 |
+
|
38 |
+
$CONFIG
|
39 |
+
|
40 |
+
|
41 |
+
${hydra.help.footer}
|
42 |
+
|
43 |
+
'
|
44 |
+
hydra_help:
|
45 |
+
template: 'Hydra (${hydra.runtime.version})
|
46 |
+
|
47 |
+
See https://hydra.cc for more info.
|
48 |
+
|
49 |
+
|
50 |
+
== Flags ==
|
51 |
+
|
52 |
+
$FLAGS_HELP
|
53 |
+
|
54 |
+
|
55 |
+
== Configuration groups ==
|
56 |
+
|
57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
58 |
+
to command line)
|
59 |
+
|
60 |
+
|
61 |
+
$HYDRA_CONFIG_GROUPS
|
62 |
+
|
63 |
+
|
64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
65 |
+
|
66 |
+
'
|
67 |
+
hydra_help: ???
|
68 |
+
hydra_logging:
|
69 |
+
version: 1
|
70 |
+
formatters:
|
71 |
+
simple:
|
72 |
+
format: '[%(asctime)s][HYDRA] %(message)s'
|
73 |
+
handlers:
|
74 |
+
console:
|
75 |
+
class: logging.StreamHandler
|
76 |
+
formatter: simple
|
77 |
+
stream: ext://sys.stdout
|
78 |
+
root:
|
79 |
+
level: INFO
|
80 |
+
handlers:
|
81 |
+
- console
|
82 |
+
loggers:
|
83 |
+
logging_example:
|
84 |
+
level: DEBUG
|
85 |
+
disable_existing_loggers: false
|
86 |
+
job_logging:
|
87 |
+
version: 1
|
88 |
+
formatters:
|
89 |
+
simple:
|
90 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
91 |
+
handlers:
|
92 |
+
console:
|
93 |
+
class: logging.StreamHandler
|
94 |
+
formatter: simple
|
95 |
+
stream: ext://sys.stdout
|
96 |
+
file:
|
97 |
+
class: logging.FileHandler
|
98 |
+
formatter: simple
|
99 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
100 |
+
root:
|
101 |
+
level: INFO
|
102 |
+
handlers:
|
103 |
+
- console
|
104 |
+
- file
|
105 |
+
disable_existing_loggers: false
|
106 |
+
env: {}
|
107 |
+
mode: RUN
|
108 |
+
searchpath: []
|
109 |
+
callbacks: {}
|
110 |
+
output_subdir: .hydra
|
111 |
+
overrides:
|
112 |
+
hydra:
|
113 |
+
- hydra.run.dir=outputs/train/2024-12-06/22-28-29_real_world_act_default
|
114 |
+
- hydra.mode=RUN
|
115 |
+
task:
|
116 |
+
- resume=true
|
117 |
+
- dataset_repo_id=HumanoidTeam/aloha_real_test
|
118 |
+
- training.offline_steps=5010
|
119 |
+
job:
|
120 |
+
name: default
|
121 |
+
chdir: null
|
122 |
+
override_dirname: dataset_repo_id=HumanoidTeam/aloha_real_test,resume=true,training.offline_steps=5010
|
123 |
+
id: ???
|
124 |
+
num: ???
|
125 |
+
config_name: default
|
126 |
+
env_set: {}
|
127 |
+
env_copy: []
|
128 |
+
config:
|
129 |
+
override_dirname:
|
130 |
+
kv_sep: '='
|
131 |
+
item_sep: ','
|
132 |
+
exclude_keys: []
|
133 |
+
runtime:
|
134 |
+
version: 1.3.2
|
135 |
+
version_base: '1.2'
|
136 |
+
cwd: /home/ubuntu/lerobot-hackathon
|
137 |
+
config_sources:
|
138 |
+
- path: hydra.conf
|
139 |
+
schema: pkg
|
140 |
+
provider: hydra
|
141 |
+
- path: /home/ubuntu/lerobot-hackathon/lerobot/configs
|
142 |
+
schema: file
|
143 |
+
provider: main
|
144 |
+
- path: ''
|
145 |
+
schema: structured
|
146 |
+
provider: schema
|
147 |
+
output_dir: /home/ubuntu/lerobot-hackathon/outputs/train/2024-12-06/22-28-29_real_world_act_default
|
148 |
+
choices:
|
149 |
+
policy: diffusion
|
150 |
+
env: pusht
|
151 |
+
hydra/env: default
|
152 |
+
hydra/callbacks: null
|
153 |
+
hydra/job_logging: default
|
154 |
+
hydra/hydra_logging: default
|
155 |
+
hydra/hydra_help: default
|
156 |
+
hydra/help: default
|
157 |
+
hydra/sweeper: basic
|
158 |
+
hydra/launcher: basic
|
159 |
+
hydra/output: default
|
160 |
+
verbose: false
|
.hydra/overrides.yaml
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
- resume=true
|
2 |
+
- dataset_repo_id=HumanoidTeam/aloha_real_test
|
3 |
+
- training.offline_steps=5010
|
checkpoints/005000/pretrained_model/README.md
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: lerobot
|
3 |
+
tags:
|
4 |
+
- act
|
5 |
+
- model_hub_mixin
|
6 |
+
- pytorch_model_hub_mixin
|
7 |
+
- robotics
|
8 |
+
---
|
9 |
+
|
10 |
+
This model has been pushed to the Hub using the [PytorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
|
11 |
+
- Library: https://github.com/huggingface/lerobot
|
12 |
+
- Docs: [More Information Needed]
|
checkpoints/005000/pretrained_model/config.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"chunk_size": 100,
|
3 |
+
"dim_feedforward": 3200,
|
4 |
+
"dim_model": 512,
|
5 |
+
"dropout": 0.1,
|
6 |
+
"feedforward_activation": "relu",
|
7 |
+
"input_normalization_modes": {
|
8 |
+
"observation.images.cam_high": "mean_std",
|
9 |
+
"observation.images.cam_left_wrist": "mean_std",
|
10 |
+
"observation.images.cam_right_wrist": "mean_std",
|
11 |
+
"observation.state": "mean_std"
|
12 |
+
},
|
13 |
+
"input_shapes": {
|
14 |
+
"observation.images.cam_high": [
|
15 |
+
3,
|
16 |
+
480,
|
17 |
+
640
|
18 |
+
],
|
19 |
+
"observation.images.cam_left_wrist": [
|
20 |
+
3,
|
21 |
+
480,
|
22 |
+
640
|
23 |
+
],
|
24 |
+
"observation.images.cam_right_wrist": [
|
25 |
+
3,
|
26 |
+
480,
|
27 |
+
640
|
28 |
+
],
|
29 |
+
"observation.state": [
|
30 |
+
14
|
31 |
+
]
|
32 |
+
},
|
33 |
+
"kl_weight": 10.0,
|
34 |
+
"latent_dim": 32,
|
35 |
+
"n_action_steps": 100,
|
36 |
+
"n_decoder_layers": 1,
|
37 |
+
"n_encoder_layers": 4,
|
38 |
+
"n_heads": 8,
|
39 |
+
"n_obs_steps": 1,
|
40 |
+
"n_vae_encoder_layers": 4,
|
41 |
+
"output_normalization_modes": {
|
42 |
+
"action": "mean_std"
|
43 |
+
},
|
44 |
+
"output_shapes": {
|
45 |
+
"action": [
|
46 |
+
14
|
47 |
+
]
|
48 |
+
},
|
49 |
+
"pre_norm": false,
|
50 |
+
"pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
|
51 |
+
"replace_final_stride_with_dilation": false,
|
52 |
+
"temporal_ensemble_coeff": null,
|
53 |
+
"use_vae": true,
|
54 |
+
"vision_backbone": "resnet18"
|
55 |
+
}
|
checkpoints/005000/pretrained_model/config.yaml
ADDED
@@ -0,0 +1,248 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
resume: false
|
2 |
+
device: cuda
|
3 |
+
use_amp: false
|
4 |
+
seed: 1000
|
5 |
+
dataset_repo_id: ccop/aloha_stationary_replay_test_v2
|
6 |
+
video_backend: pyav
|
7 |
+
training:
|
8 |
+
offline_steps: 5000
|
9 |
+
num_workers: 8
|
10 |
+
batch_size: 8
|
11 |
+
eval_freq: -1
|
12 |
+
log_freq: 200
|
13 |
+
save_checkpoint: true
|
14 |
+
save_freq: 10000
|
15 |
+
online_steps: 0
|
16 |
+
online_rollout_n_episodes: 1
|
17 |
+
online_rollout_batch_size: 1
|
18 |
+
online_steps_between_rollouts: 1
|
19 |
+
online_sampling_ratio: 0.5
|
20 |
+
online_env_seed: null
|
21 |
+
online_buffer_capacity: null
|
22 |
+
online_buffer_seed_size: 0
|
23 |
+
do_online_rollout_async: false
|
24 |
+
image_transforms:
|
25 |
+
enable: false
|
26 |
+
max_num_transforms: 3
|
27 |
+
random_order: false
|
28 |
+
brightness:
|
29 |
+
weight: 1
|
30 |
+
min_max:
|
31 |
+
- 0.8
|
32 |
+
- 1.2
|
33 |
+
contrast:
|
34 |
+
weight: 1
|
35 |
+
min_max:
|
36 |
+
- 0.8
|
37 |
+
- 1.2
|
38 |
+
saturation:
|
39 |
+
weight: 1
|
40 |
+
min_max:
|
41 |
+
- 0.5
|
42 |
+
- 1.5
|
43 |
+
hue:
|
44 |
+
weight: 1
|
45 |
+
min_max:
|
46 |
+
- -0.05
|
47 |
+
- 0.05
|
48 |
+
sharpness:
|
49 |
+
weight: 1
|
50 |
+
min_max:
|
51 |
+
- 0.8
|
52 |
+
- 1.2
|
53 |
+
lr: 1.0e-05
|
54 |
+
lr_backbone: 1.0e-05
|
55 |
+
weight_decay: 0.0001
|
56 |
+
grad_clip_norm: 10
|
57 |
+
delta_timestamps:
|
58 |
+
action:
|
59 |
+
- 0.0
|
60 |
+
- 0.03333333333333333
|
61 |
+
- 0.06666666666666667
|
62 |
+
- 0.1
|
63 |
+
- 0.13333333333333333
|
64 |
+
- 0.16666666666666666
|
65 |
+
- 0.2
|
66 |
+
- 0.23333333333333334
|
67 |
+
- 0.26666666666666666
|
68 |
+
- 0.3
|
69 |
+
- 0.3333333333333333
|
70 |
+
- 0.36666666666666664
|
71 |
+
- 0.4
|
72 |
+
- 0.43333333333333335
|
73 |
+
- 0.4666666666666667
|
74 |
+
- 0.5
|
75 |
+
- 0.5333333333333333
|
76 |
+
- 0.5666666666666667
|
77 |
+
- 0.6
|
78 |
+
- 0.6333333333333333
|
79 |
+
- 0.6666666666666666
|
80 |
+
- 0.7
|
81 |
+
- 0.7333333333333333
|
82 |
+
- 0.7666666666666667
|
83 |
+
- 0.8
|
84 |
+
- 0.8333333333333334
|
85 |
+
- 0.8666666666666667
|
86 |
+
- 0.9
|
87 |
+
- 0.9333333333333333
|
88 |
+
- 0.9666666666666667
|
89 |
+
- 1.0
|
90 |
+
- 1.0333333333333334
|
91 |
+
- 1.0666666666666667
|
92 |
+
- 1.1
|
93 |
+
- 1.1333333333333333
|
94 |
+
- 1.1666666666666667
|
95 |
+
- 1.2
|
96 |
+
- 1.2333333333333334
|
97 |
+
- 1.2666666666666666
|
98 |
+
- 1.3
|
99 |
+
- 1.3333333333333333
|
100 |
+
- 1.3666666666666667
|
101 |
+
- 1.4
|
102 |
+
- 1.4333333333333333
|
103 |
+
- 1.4666666666666666
|
104 |
+
- 1.5
|
105 |
+
- 1.5333333333333334
|
106 |
+
- 1.5666666666666667
|
107 |
+
- 1.6
|
108 |
+
- 1.6333333333333333
|
109 |
+
- 1.6666666666666667
|
110 |
+
- 1.7
|
111 |
+
- 1.7333333333333334
|
112 |
+
- 1.7666666666666666
|
113 |
+
- 1.8
|
114 |
+
- 1.8333333333333333
|
115 |
+
- 1.8666666666666667
|
116 |
+
- 1.9
|
117 |
+
- 1.9333333333333333
|
118 |
+
- 1.9666666666666666
|
119 |
+
- 2.0
|
120 |
+
- 2.033333333333333
|
121 |
+
- 2.066666666666667
|
122 |
+
- 2.1
|
123 |
+
- 2.1333333333333333
|
124 |
+
- 2.1666666666666665
|
125 |
+
- 2.2
|
126 |
+
- 2.2333333333333334
|
127 |
+
- 2.2666666666666666
|
128 |
+
- 2.3
|
129 |
+
- 2.3333333333333335
|
130 |
+
- 2.3666666666666667
|
131 |
+
- 2.4
|
132 |
+
- 2.433333333333333
|
133 |
+
- 2.466666666666667
|
134 |
+
- 2.5
|
135 |
+
- 2.533333333333333
|
136 |
+
- 2.566666666666667
|
137 |
+
- 2.6
|
138 |
+
- 2.6333333333333333
|
139 |
+
- 2.6666666666666665
|
140 |
+
- 2.7
|
141 |
+
- 2.7333333333333334
|
142 |
+
- 2.7666666666666666
|
143 |
+
- 2.8
|
144 |
+
- 2.8333333333333335
|
145 |
+
- 2.8666666666666667
|
146 |
+
- 2.9
|
147 |
+
- 2.933333333333333
|
148 |
+
- 2.966666666666667
|
149 |
+
- 3.0
|
150 |
+
- 3.033333333333333
|
151 |
+
- 3.066666666666667
|
152 |
+
- 3.1
|
153 |
+
- 3.1333333333333333
|
154 |
+
- 3.1666666666666665
|
155 |
+
- 3.2
|
156 |
+
- 3.2333333333333334
|
157 |
+
- 3.2666666666666666
|
158 |
+
- 3.3
|
159 |
+
eval:
|
160 |
+
n_episodes: 50
|
161 |
+
batch_size: 50
|
162 |
+
use_async_envs: false
|
163 |
+
wandb:
|
164 |
+
enable: true
|
165 |
+
disable_artifact: false
|
166 |
+
project: lerobot_real_aloha
|
167 |
+
notes: ws-lerobot-hackathon
|
168 |
+
fps: 30
|
169 |
+
env:
|
170 |
+
name: real_world
|
171 |
+
task: null
|
172 |
+
state_dim: 14
|
173 |
+
action_dim: 14
|
174 |
+
fps: ${fps}
|
175 |
+
override_dataset_stats:
|
176 |
+
observation.images.cam_right_wrist:
|
177 |
+
mean:
|
178 |
+
- - - 0.485
|
179 |
+
- - - 0.456
|
180 |
+
- - - 0.406
|
181 |
+
std:
|
182 |
+
- - - 0.229
|
183 |
+
- - - 0.224
|
184 |
+
- - - 0.225
|
185 |
+
observation.images.cam_left_wrist:
|
186 |
+
mean:
|
187 |
+
- - - 0.485
|
188 |
+
- - - 0.456
|
189 |
+
- - - 0.406
|
190 |
+
std:
|
191 |
+
- - - 0.229
|
192 |
+
- - - 0.224
|
193 |
+
- - - 0.225
|
194 |
+
observation.images.cam_high:
|
195 |
+
mean:
|
196 |
+
- - - 0.485
|
197 |
+
- - - 0.456
|
198 |
+
- - - 0.406
|
199 |
+
std:
|
200 |
+
- - - 0.229
|
201 |
+
- - - 0.224
|
202 |
+
- - - 0.225
|
203 |
+
policy:
|
204 |
+
name: act
|
205 |
+
n_obs_steps: 1
|
206 |
+
chunk_size: 100
|
207 |
+
n_action_steps: 100
|
208 |
+
input_shapes:
|
209 |
+
observation.images.cam_right_wrist:
|
210 |
+
- 3
|
211 |
+
- 480
|
212 |
+
- 640
|
213 |
+
observation.images.cam_left_wrist:
|
214 |
+
- 3
|
215 |
+
- 480
|
216 |
+
- 640
|
217 |
+
observation.images.cam_high:
|
218 |
+
- 3
|
219 |
+
- 480
|
220 |
+
- 640
|
221 |
+
observation.state:
|
222 |
+
- ${env.state_dim}
|
223 |
+
output_shapes:
|
224 |
+
action:
|
225 |
+
- ${env.action_dim}
|
226 |
+
input_normalization_modes:
|
227 |
+
observation.images.cam_right_wrist: mean_std
|
228 |
+
observation.images.cam_left_wrist: mean_std
|
229 |
+
observation.images.cam_high: mean_std
|
230 |
+
observation.state: mean_std
|
231 |
+
output_normalization_modes:
|
232 |
+
action: mean_std
|
233 |
+
vision_backbone: resnet18
|
234 |
+
pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
|
235 |
+
replace_final_stride_with_dilation: false
|
236 |
+
pre_norm: false
|
237 |
+
dim_model: 512
|
238 |
+
n_heads: 8
|
239 |
+
dim_feedforward: 3200
|
240 |
+
feedforward_activation: relu
|
241 |
+
n_encoder_layers: 4
|
242 |
+
n_decoder_layers: 1
|
243 |
+
use_vae: true
|
244 |
+
latent_dim: 32
|
245 |
+
n_vae_encoder_layers: 4
|
246 |
+
temporal_ensemble_momentum: null
|
247 |
+
dropout: 0.1
|
248 |
+
kl_weight: 10.0
|
checkpoints/005000/pretrained_model/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eba28285320bc2ddcda5e0ce0be693634a20ec638d10cf364694649bfc184964
|
3 |
+
size 206767160
|
checkpoints/005000/training_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af943082a3d9b919922d7de964e9f2bdc429b3d800234ea46f97ccedce9b309c
|
3 |
+
size 413053071
|
default.log
ADDED
File without changes
|
wandb/debug-internal.log
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"time":"2024-12-07T01:07:41.167467035Z","level":"INFO","msg":"using version","core version":"0.19.0"}
|
2 |
+
{"time":"2024-12-07T01:07:41.167480199Z","level":"INFO","msg":"created symlink","path":"outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug-core.log"}
|
3 |
+
{"time":"2024-12-07T01:07:41.270189094Z","level":"INFO","msg":"created new stream","id":"bwwpk9vl"}
|
4 |
+
{"time":"2024-12-07T01:07:41.270216139Z","level":"INFO","msg":"stream: started","id":"bwwpk9vl"}
|
5 |
+
{"time":"2024-12-07T01:07:41.270250461Z","level":"INFO","msg":"writer: Do: started","stream_id":"bwwpk9vl"}
|
6 |
+
{"time":"2024-12-07T01:07:41.270250342Z","level":"INFO","msg":"sender: started","stream_id":"bwwpk9vl"}
|
7 |
+
{"time":"2024-12-07T01:07:41.270317361Z","level":"INFO","msg":"handler: started","stream_id":"bwwpk9vl"}
|
8 |
+
{"time":"2024-12-07T01:07:41.601065068Z","level":"INFO","msg":"Starting system monitor"}
|
9 |
+
{"time":"2024-12-07T01:07:46.320070438Z","level":"INFO","msg":"stream: closing","id":"bwwpk9vl"}
|
10 |
+
{"time":"2024-12-07T01:07:46.320109578Z","level":"INFO","msg":"Stopping system monitor"}
|
11 |
+
{"time":"2024-12-07T01:07:46.320581424Z","level":"INFO","msg":"Stopped system monitor"}
|
12 |
+
{"time":"2024-12-07T01:07:46.890807441Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
13 |
+
{"time":"2024-12-07T01:07:47.027194656Z","level":"INFO","msg":"handler: closed","stream_id":"bwwpk9vl"}
|
14 |
+
{"time":"2024-12-07T01:07:47.027227034Z","level":"INFO","msg":"sender: closed","stream_id":"bwwpk9vl"}
|
15 |
+
{"time":"2024-12-07T01:07:47.027228216Z","level":"INFO","msg":"writer: Close: closed","stream_id":"bwwpk9vl"}
|
16 |
+
{"time":"2024-12-07T01:07:47.027338658Z","level":"INFO","msg":"stream: closed","id":"bwwpk9vl"}
|
wandb/debug.log
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Current SDK version is 0.19.0
|
2 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Configure stats pid to 3507456
|
3 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/.config/wandb/settings
|
4 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/lerobot-hackathon/wandb/settings
|
5 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from environment variables
|
6 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] wandb: Using wandb-core as the SDK backend. Please refer to https://wandb.me/wandb-core for more information.
|
7 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:_log_setup():528] Logging user logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug.log
|
8 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:_log_setup():529] Logging internal logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug-internal.log
|
9 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():639] calling init triggers
|
10 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():645] wandb.init called with sweep_config: {}
|
11 |
+
config: {'resume': True, 'device': 'cuda', 'use_amp': False, 'seed': 1000, 'dataset_repo_id': 'ccop/aloha_stationary_replay_test_v2', 'video_backend': 'pyav', 'training': {'offline_steps': 5000, 'num_workers': 8, 'batch_size': 8, 'eval_freq': -1, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 10000, 'online_steps': 0, 'online_rollout_n_episodes': 1, 'online_rollout_batch_size': 1, 'online_steps_between_rollouts': 1, 'online_sampling_ratio': 0.5, 'online_env_seed': None, 'online_buffer_capacity': None, 'online_buffer_seed_size': 0, 'do_online_rollout_async': False, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'brightness': {'weight': 1, 'min_max': [0.8, 1.2]}, 'contrast': {'weight': 1, 'min_max': [0.8, 1.2]}, 'saturation': {'weight': 1, 'min_max': [0.5, 1.5]}, 'hue': {'weight': 1, 'min_max': [-0.05, 0.05]}, 'sharpness': {'weight': 1, 'min_max': [0.8, 1.2]}}, 'lr': 1e-05, 'lr_backbone': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10, 'delta_timestamps': {'action': [0.0, 0.03333333333333333, 0.06666666666666667, 0.1, 0.13333333333333333, 0.16666666666666666, 0.2, 0.23333333333333334, 0.26666666666666666, 0.3, 0.3333333333333333, 0.36666666666666664, 0.4, 0.43333333333333335, 0.4666666666666667, 0.5, 0.5333333333333333, 0.5666666666666667, 0.6, 0.6333333333333333, 0.6666666666666666, 0.7, 0.7333333333333333, 0.7666666666666667, 0.8, 0.8333333333333334, 0.8666666666666667, 0.9, 0.9333333333333333, 0.9666666666666667, 1.0, 1.0333333333333334, 1.0666666666666667, 1.1, 1.1333333333333333, 1.1666666666666667, 1.2, 1.2333333333333334, 1.2666666666666666, 1.3, 1.3333333333333333, 1.3666666666666667, 1.4, 1.4333333333333333, 1.4666666666666666, 1.5, 1.5333333333333334, 1.5666666666666667, 1.6, 1.6333333333333333, 1.6666666666666667, 1.7, 1.7333333333333334, 1.7666666666666666, 1.8, 1.8333333333333333, 1.8666666666666667, 1.9, 1.9333333333333333, 1.9666666666666666, 2.0, 2.033333333333333, 2.066666666666667, 2.1, 
2.1333333333333333, 2.1666666666666665, 2.2, 2.2333333333333334, 2.2666666666666666, 2.3, 2.3333333333333335, 2.3666666666666667, 2.4, 2.433333333333333, 2.466666666666667, 2.5, 2.533333333333333, 2.566666666666667, 2.6, 2.6333333333333333, 2.6666666666666665, 2.7, 2.7333333333333334, 2.7666666666666666, 2.8, 2.8333333333333335, 2.8666666666666667, 2.9, 2.933333333333333, 2.966666666666667, 3.0, 3.033333333333333, 3.066666666666667, 3.1, 3.1333333333333333, 3.1666666666666665, 3.2, 3.2333333333333334, 3.2666666666666666, 3.3]}}, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot_real_aloha', 'notes': 'ws-lerobot-hackathon'}, 'fps': 30, 'env': {'name': 'real_world', 'task': None, 'state_dim': 14, 'action_dim': 14, 'fps': 30}, 'override_dataset_stats': {'observation.images.cam_right_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_left_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_high': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}}, 'policy': {'name': 'act', 'n_obs_steps': 1, 'chunk_size': 100, 'n_action_steps': 100, 'input_shapes': {'observation.images.cam_right_wrist': [3, 480, 640], 'observation.images.cam_left_wrist': [3, 480, 640], 'observation.images.cam_high': [3, 480, 640], 'observation.state': [14]}, 'output_shapes': {'action': [14]}, 'input_normalization_modes': {'observation.images.cam_right_wrist': 'mean_std', 'observation.images.cam_left_wrist': 'mean_std', 'observation.images.cam_high': 'mean_std', 'observation.state': 'mean_std'}, 'output_normalization_modes': {'action': 'mean_std'}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 
'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_momentum': None, 'dropout': 0.1, 'kl_weight': 10.0}}
|
12 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():688] starting backend
|
13 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():692] sending inform_init request
|
14 |
+
2024-12-07 01:07:41,165 INFO MainThread:3507456 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
|
15 |
+
2024-12-07 01:07:41,166 INFO MainThread:3507456 [wandb_init.py:init():705] backend started and connected
|
16 |
+
2024-12-07 01:07:41,168 INFO MainThread:3507456 [wandb_init.py:init():798] updated telemetry
|
17 |
+
2024-12-07 01:07:41,174 INFO MainThread:3507456 [wandb_init.py:init():830] communicating run to backend with 90.0 second timeout
|
18 |
+
2024-12-07 01:07:41,592 INFO MainThread:3507456 [wandb_init.py:init():875] run resumed
|
19 |
+
2024-12-07 01:07:41,597 INFO MainThread:3507456 [wandb_init.py:init():882] starting run threads in backend
|
20 |
+
2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_console_start():2443] atexit reg
|
21 |
+
2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2293] redirect: wrap_raw
|
22 |
+
2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2358] Wrapping output streams.
|
23 |
+
2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2383] Redirects installed.
|
24 |
+
2024-12-07 01:07:41,713 INFO MainThread:3507456 [wandb_init.py:init():925] run started, returning control to user process
|
25 |
+
2024-12-07 01:07:46,320 WARNING MsgRouterThr:3507456 [router.py:message_loop():75] message_loop has been closed
|
wandb/run-20241206_222830-bwwpk9vl/files/config.yaml
ADDED
@@ -0,0 +1,194 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_wandb:
|
2 |
+
value:
|
3 |
+
cli_version: 0.19.0
|
4 |
+
m: []
|
5 |
+
python_version: 3.10.12
|
6 |
+
t:
|
7 |
+
"1":
|
8 |
+
- 1
|
9 |
+
- 41
|
10 |
+
- 49
|
11 |
+
- 50
|
12 |
+
- 51
|
13 |
+
- 55
|
14 |
+
"2":
|
15 |
+
- 1
|
16 |
+
- 41
|
17 |
+
- 49
|
18 |
+
- 50
|
19 |
+
- 51
|
20 |
+
- 55
|
21 |
+
"3":
|
22 |
+
- 13
|
23 |
+
- 15
|
24 |
+
- 16
|
25 |
+
- 23
|
26 |
+
- 55
|
27 |
+
- 61
|
28 |
+
"4": 3.10.12
|
29 |
+
"5": 0.19.0
|
30 |
+
"8":
|
31 |
+
- 5
|
32 |
+
"12": 0.19.0
|
33 |
+
"13": linux-x86_64
|
34 |
+
dataset_repo_id:
|
35 |
+
value: ccop/aloha_stationary_replay_test_v2
|
36 |
+
device:
|
37 |
+
value: cuda
|
38 |
+
env:
|
39 |
+
value:
|
40 |
+
action_dim: 14
|
41 |
+
fps: 30
|
42 |
+
name: real_world
|
43 |
+
state_dim: 14
|
44 |
+
task: null
|
45 |
+
eval:
|
46 |
+
value:
|
47 |
+
batch_size: 50
|
48 |
+
n_episodes: 50
|
49 |
+
use_async_envs: false
|
50 |
+
fps:
|
51 |
+
value: 30
|
52 |
+
override_dataset_stats:
|
53 |
+
value:
|
54 |
+
observation.images.cam_high:
|
55 |
+
mean:
|
56 |
+
- - - 0.485
|
57 |
+
- - - 0.456
|
58 |
+
- - - 0.406
|
59 |
+
std:
|
60 |
+
- - - 0.229
|
61 |
+
- - - 0.224
|
62 |
+
- - - 0.225
|
63 |
+
observation.images.cam_left_wrist:
|
64 |
+
mean:
|
65 |
+
- - - 0.485
|
66 |
+
- - - 0.456
|
67 |
+
- - - 0.406
|
68 |
+
std:
|
69 |
+
- - - 0.229
|
70 |
+
- - - 0.224
|
71 |
+
- - - 0.225
|
72 |
+
observation.images.cam_right_wrist:
|
73 |
+
mean:
|
74 |
+
- - - 0.485
|
75 |
+
- - - 0.456
|
76 |
+
- - - 0.406
|
77 |
+
std:
|
78 |
+
- - - 0.229
|
79 |
+
- - - 0.224
|
80 |
+
- - - 0.225
|
81 |
+
policy:
|
82 |
+
value:
|
83 |
+
chunk_size: 100
|
84 |
+
dim_feedforward: 3200
|
85 |
+
dim_model: 512
|
86 |
+
dropout: 0.1
|
87 |
+
feedforward_activation: relu
|
88 |
+
input_normalization_modes:
|
89 |
+
observation.images.cam_high: mean_std
|
90 |
+
observation.images.cam_left_wrist: mean_std
|
91 |
+
observation.images.cam_right_wrist: mean_std
|
92 |
+
observation.state: mean_std
|
93 |
+
input_shapes:
|
94 |
+
observation.images.cam_high:
|
95 |
+
- 3
|
96 |
+
- 480
|
97 |
+
- 640
|
98 |
+
observation.images.cam_left_wrist:
|
99 |
+
- 3
|
100 |
+
- 480
|
101 |
+
- 640
|
102 |
+
observation.images.cam_right_wrist:
|
103 |
+
- 3
|
104 |
+
- 480
|
105 |
+
- 640
|
106 |
+
observation.state:
|
107 |
+
- 14
|
108 |
+
kl_weight: 10
|
109 |
+
latent_dim: 32
|
110 |
+
n_action_steps: 100
|
111 |
+
n_decoder_layers: 1
|
112 |
+
n_encoder_layers: 4
|
113 |
+
n_heads: 8
|
114 |
+
n_obs_steps: 1
|
115 |
+
n_vae_encoder_layers: 4
|
116 |
+
name: act
|
117 |
+
output_normalization_modes:
|
118 |
+
action: mean_std
|
119 |
+
output_shapes:
|
120 |
+
action:
|
121 |
+
- 14
|
122 |
+
pre_norm: false
|
123 |
+
pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
|
124 |
+
replace_final_stride_with_dilation: false
|
125 |
+
temporal_ensemble_momentum: null
|
126 |
+
use_vae: true
|
127 |
+
vision_backbone: resnet18
|
128 |
+
resume:
|
129 |
+
value: false
|
130 |
+
seed:
|
131 |
+
value: 1000
|
132 |
+
training:
|
133 |
+
value:
|
134 |
+
batch_size: 8
|
135 |
+
delta_timestamps:
|
136 |
+
action: '[i / 30 for i in range(100)]'
|
137 |
+
do_online_rollout_async: false
|
138 |
+
eval_freq: -1
|
139 |
+
grad_clip_norm: 10
|
140 |
+
image_transforms:
|
141 |
+
brightness:
|
142 |
+
min_max:
|
143 |
+
- 0.8
|
144 |
+
- 1.2
|
145 |
+
weight: 1
|
146 |
+
contrast:
|
147 |
+
min_max:
|
148 |
+
- 0.8
|
149 |
+
- 1.2
|
150 |
+
weight: 1
|
151 |
+
enable: false
|
152 |
+
hue:
|
153 |
+
min_max:
|
154 |
+
- -0.05
|
155 |
+
- 0.05
|
156 |
+
weight: 1
|
157 |
+
max_num_transforms: 3
|
158 |
+
random_order: false
|
159 |
+
saturation:
|
160 |
+
min_max:
|
161 |
+
- 0.5
|
162 |
+
- 1.5
|
163 |
+
weight: 1
|
164 |
+
sharpness:
|
165 |
+
min_max:
|
166 |
+
- 0.8
|
167 |
+
- 1.2
|
168 |
+
weight: 1
|
169 |
+
log_freq: 200
|
170 |
+
lr: 1e-05
|
171 |
+
lr_backbone: 1e-05
|
172 |
+
num_workers: 8
|
173 |
+
offline_steps: 5000
|
174 |
+
online_buffer_capacity: null
|
175 |
+
online_buffer_seed_size: 0
|
176 |
+
online_env_seed: null
|
177 |
+
online_rollout_batch_size: 1
|
178 |
+
online_rollout_n_episodes: 1
|
179 |
+
online_sampling_ratio: 0.5
|
180 |
+
online_steps: 0
|
181 |
+
online_steps_between_rollouts: 1
|
182 |
+
save_checkpoint: true
|
183 |
+
save_freq: 10000
|
184 |
+
weight_decay: 0.0001
|
185 |
+
use_amp:
|
186 |
+
value: false
|
187 |
+
video_backend:
|
188 |
+
value: pyav
|
189 |
+
wandb:
|
190 |
+
value:
|
191 |
+
disable_artifact: false
|
192 |
+
enable: true
|
193 |
+
notes: ws-lerobot-hackathon
|
194 |
+
project: lerobot_real_aloha
|
wandb/run-20241206_222830-bwwpk9vl/files/output.log
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[1m[34mLogs will be synced with wandb.[0m
|
2 |
+
INFO 2024-12-06 22:28:30 n/logger.py:132 Track this run --> [1m[33mhttps://wandb.ai/zaringleb/lerobot_real_aloha/runs/bwwpk9vl[0m
|
3 |
+
INFO 2024-12-06 22:28:30 ts/train.py:312 make_dataset
|
4 |
+
WARNING 2024-12-06 22:28:30 s/factory.py:68 There might be a mismatch between your training dataset (dataset_repo_id='ccop/aloha_stationary_replay_test_v2') and your environment (cfg.env.name='real_world').
|
5 |
+
Fetching 9 files: 100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 9/9 [00:00<00:00, 39945.75it/s]
|
6 |
+
INFO 2024-12-06 22:28:32 ts/train.py:328 make_policy
|
7 |
+
WARNING 2024-12-06 22:28:32 s/factory.py:28 Hydra config is missing arguments: {'temporal_ensemble_coeff'}
|
8 |
+
/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py:338: FutureWarning: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.
|
9 |
+
grad_scaler = GradScaler(enabled=cfg.use_amp)
|
10 |
+
INFO 2024-12-06 22:28:33 on/logger.py:39 [1m[33mOutput dir:[0m outputs/train/2024-12-06/22-28-29_real_world_act_default
|
11 |
+
INFO 2024-12-06 22:28:33 ts/train.py:349 cfg.env.task=None
|
12 |
+
INFO 2024-12-06 22:28:33 ts/train.py:350 cfg.training.offline_steps=5000 (5K)
|
13 |
+
INFO 2024-12-06 22:28:33 ts/train.py:351 cfg.training.online_steps=0
|
14 |
+
INFO 2024-12-06 22:28:33 ts/train.py:352 offline_dataset.num_samples=800 (800)
|
15 |
+
INFO 2024-12-06 22:28:33 ts/train.py:353 offline_dataset.num_episodes=1
|
16 |
+
INFO 2024-12-06 22:28:33 ts/train.py:354 num_learnable_params=51613582 (52M)
|
17 |
+
INFO 2024-12-06 22:28:33 ts/train.py:355 num_total_params=51613684 (52M)
|
18 |
+
INFO 2024-12-06 22:28:33 ts/train.py:421 Start offline training on a fixed dataset
|
19 |
+
INFO 2024-12-06 22:28:44 ts/train.py:192 step:0 smpl:8 ep:0 epch:0.01 loss:85.424 grdn:1036.794 lr:1.0e-05 updt_s:7.126 data_s:3.108
|
20 |
+
INFO 2024-12-06 22:32:21 ts/train.py:192 step:200 smpl:2K ep:2 epch:2.01 loss:3.562 grdn:97.104 lr:1.0e-05 updt_s:1.076 data_s:2.453
|
21 |
+
INFO 2024-12-06 22:36:00 ts/train.py:192 step:400 smpl:3K ep:4 epch:4.01 loss:2.455 grdn:86.458 lr:1.0e-05 updt_s:1.094 data_s:2.019
|
22 |
+
INFO 2024-12-06 22:39:40 ts/train.py:192 step:600 smpl:5K ep:6 epch:6.01 loss:2.300 grdn:76.224 lr:1.0e-05 updt_s:1.088 data_s:2.352
|
23 |
+
INFO 2024-12-06 22:43:19 ts/train.py:192 step:800 smpl:6K ep:8 epch:8.01 loss:1.897 grdn:66.798 lr:1.0e-05 updt_s:1.108 data_s:2.149
|
24 |
+
INFO 2024-12-06 22:46:58 ts/train.py:192 step:1K smpl:8K ep:10 epch:10.01 loss:1.727 grdn:65.505 lr:1.0e-05 updt_s:1.100 data_s:1.999
|
25 |
+
INFO 2024-12-06 22:50:37 ts/train.py:192 step:1K smpl:10K ep:12 epch:12.01 loss:1.474 grdn:56.429 lr:1.0e-05 updt_s:1.091 data_s:2.366
|
26 |
+
INFO 2024-12-06 22:54:16 ts/train.py:192 step:1K smpl:11K ep:14 epch:14.01 loss:1.324 grdn:52.798 lr:1.0e-05 updt_s:1.104 data_s:1.794
|
27 |
+
INFO 2024-12-06 22:57:55 ts/train.py:192 step:2K smpl:13K ep:16 epch:16.01 loss:1.275 grdn:48.997 lr:1.0e-05 updt_s:1.099 data_s:2.227
|
28 |
+
INFO 2024-12-06 23:01:35 ts/train.py:192 step:2K smpl:14K ep:18 epch:18.01 loss:1.195 grdn:50.355 lr:1.0e-05 updt_s:1.411 data_s:2.189
|
29 |
+
INFO 2024-12-06 23:05:13 ts/train.py:192 step:2K smpl:16K ep:20 epch:20.01 loss:1.077 grdn:40.395 lr:1.0e-05 updt_s:1.090 data_s:1.955
|
30 |
+
INFO 2024-12-06 23:08:53 ts/train.py:192 step:2K smpl:18K ep:22 epch:22.01 loss:0.905 grdn:47.089 lr:1.0e-05 updt_s:1.090 data_s:2.396
|
31 |
+
INFO 2024-12-06 23:12:32 ts/train.py:192 step:2K smpl:19K ep:24 epch:24.01 loss:0.878 grdn:44.676 lr:1.0e-05 updt_s:1.090 data_s:2.298
|
32 |
+
INFO 2024-12-06 23:16:11 ts/train.py:192 step:3K smpl:21K ep:26 epch:26.01 loss:0.736 grdn:41.427 lr:1.0e-05 updt_s:1.106 data_s:2.089
|
33 |
+
INFO 2024-12-06 23:19:50 ts/train.py:192 step:3K smpl:22K ep:28 epch:28.01 loss:0.633 grdn:33.782 lr:1.0e-05 updt_s:1.090 data_s:2.224
|
34 |
+
INFO 2024-12-06 23:23:29 ts/train.py:192 step:3K smpl:24K ep:30 epch:30.01 loss:0.550 grdn:34.230 lr:1.0e-05 updt_s:1.103 data_s:2.172
|
35 |
+
INFO 2024-12-06 23:27:08 ts/train.py:192 step:3K smpl:26K ep:32 epch:32.01 loss:0.572 grdn:37.149 lr:1.0e-05 updt_s:1.086 data_s:2.248
|
36 |
+
INFO 2024-12-06 23:30:47 ts/train.py:192 step:3K smpl:27K ep:34 epch:34.01 loss:0.490 grdn:34.704 lr:1.0e-05 updt_s:1.093 data_s:1.711
|
37 |
+
INFO 2024-12-06 23:34:25 ts/train.py:192 step:4K smpl:29K ep:36 epch:36.01 loss:0.459 grdn:28.810 lr:1.0e-05 updt_s:1.105 data_s:1.716
|
38 |
+
INFO 2024-12-06 23:38:04 ts/train.py:192 step:4K smpl:30K ep:38 epch:38.01 loss:0.450 grdn:30.977 lr:1.0e-05 updt_s:1.095 data_s:2.136
|
39 |
+
INFO 2024-12-06 23:41:44 ts/train.py:192 step:4K smpl:32K ep:40 epch:40.01 loss:0.376 grdn:34.368 lr:1.0e-05 updt_s:1.092 data_s:1.970
|
40 |
+
INFO 2024-12-06 23:45:23 ts/train.py:192 step:4K smpl:34K ep:42 epch:42.01 loss:0.309 grdn:26.141 lr:1.0e-05 updt_s:1.090 data_s:2.131
|
41 |
+
INFO 2024-12-06 23:49:02 ts/train.py:192 step:4K smpl:35K ep:44 epch:44.01 loss:0.282 grdn:21.178 lr:1.0e-05 updt_s:1.095 data_s:2.192
|
42 |
+
INFO 2024-12-06 23:52:41 ts/train.py:192 step:5K smpl:37K ep:46 epch:46.01 loss:0.255 grdn:25.957 lr:1.0e-05 updt_s:1.078 data_s:2.502
|
43 |
+
INFO 2024-12-06 23:56:20 ts/train.py:192 step:5K smpl:38K ep:48 epch:48.01 loss:0.250 grdn:20.830 lr:1.0e-05 updt_s:1.088 data_s:2.212
|
44 |
+
INFO 2024-12-06 23:59:56 ts/train.py:383 Checkpoint policy after step 5000
|
45 |
+
INFO 2024-12-06 23:59:58 ts/train.py:393 Resume training
|
46 |
+
INFO 2024-12-06 23:59:58 ts/train.py:455 End of training
|
wandb/run-20241206_222830-bwwpk9vl/files/requirements.txt
ADDED
@@ -0,0 +1,129 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
pymunk==6.9.0
|
2 |
+
charset-normalizer==3.4.0
|
3 |
+
pip==22.0.2
|
4 |
+
multidict==6.1.0
|
5 |
+
pytz==2024.2
|
6 |
+
pandas==2.2.3
|
7 |
+
fasteners==0.19
|
8 |
+
einops==0.8.0
|
9 |
+
setproctitle==1.3.4
|
10 |
+
python-dateutil==2.9.0.post0
|
11 |
+
pydantic==2.10.3
|
12 |
+
dm-control==1.0.14
|
13 |
+
MarkupSafe==3.0.2
|
14 |
+
safetensors==0.4.5
|
15 |
+
cloudpickle==3.1.0
|
16 |
+
imageio-ffmpeg==0.5.1
|
17 |
+
smmap==5.0.1
|
18 |
+
huggingface-hub==0.26.5
|
19 |
+
torch==2.6.0.dev20241112+cu121
|
20 |
+
nvidia-cusolver-cu12==11.4.5.107
|
21 |
+
inquirerpy==0.3.4
|
22 |
+
soupsieve==2.6
|
23 |
+
deepdiff==8.0.1
|
24 |
+
nvidia-nvjitlink-cu12==12.4.127
|
25 |
+
aiosignal==1.3.1
|
26 |
+
dm-tree==0.1.8
|
27 |
+
aiohappyeyeballs==2.4.4
|
28 |
+
propcache==0.2.1
|
29 |
+
gym-aloha==0.1.1
|
30 |
+
labmaze==1.0.6
|
31 |
+
pyav==14.0.1
|
32 |
+
nvidia-cuda-cupti-cu12==12.1.105
|
33 |
+
cffi==1.17.1
|
34 |
+
importlib_metadata==8.5.0
|
35 |
+
nvidia-cuda-runtime-cu12==12.1.105
|
36 |
+
pycparser==2.22
|
37 |
+
h5py==3.12.1
|
38 |
+
nvidia-nccl-cu12==2.21.5
|
39 |
+
orderly-set==5.2.2
|
40 |
+
pyarrow==18.1.0
|
41 |
+
Flask==3.1.0
|
42 |
+
multiprocess==0.70.16
|
43 |
+
blinker==1.9.0
|
44 |
+
regex==2024.11.6
|
45 |
+
Jinja2==3.1.4
|
46 |
+
tqdm==4.67.1
|
47 |
+
certifi==2024.8.30
|
48 |
+
frozenlist==1.5.0
|
49 |
+
attrs==24.2.0
|
50 |
+
pytorch-triton==3.1.0+cf34004b8a
|
51 |
+
omegaconf==2.3.0
|
52 |
+
itsdangerous==2.2.0
|
53 |
+
packaging==24.2
|
54 |
+
pfzy==0.3.4
|
55 |
+
pydantic_core==2.27.1
|
56 |
+
antlr4-python3-runtime==4.9.3
|
57 |
+
cmake==3.31.1
|
58 |
+
imageio==2.36.1
|
59 |
+
setuptools==59.6.0
|
60 |
+
nvidia-cusparselt-cu12==0.6.2
|
61 |
+
zipp==3.21.0
|
62 |
+
torchvision==0.20.0.dev20241112+cu121
|
63 |
+
nvidia-curand-cu12==10.3.2.106
|
64 |
+
PyOpenGL-accelerate==3.1.7
|
65 |
+
numpy==1.26.4
|
66 |
+
dm-env==1.6
|
67 |
+
nvidia-cusparse-cu12==12.1.0.106
|
68 |
+
networkx==3.4.2
|
69 |
+
triton==3.1.0
|
70 |
+
termcolor==2.5.0
|
71 |
+
gitdb==4.0.11
|
72 |
+
torchaudio==2.5.0.dev20241112+cu121
|
73 |
+
glfw==2.8.0
|
74 |
+
tzdata==2024.2
|
75 |
+
pillow==11.0.0
|
76 |
+
idna==3.10
|
77 |
+
pyparsing==3.2.0
|
78 |
+
typing_extensions==4.12.2
|
79 |
+
wcwidth==0.2.13
|
80 |
+
sympy==1.13.1
|
81 |
+
nvidia-cublas-cu12==12.1.3.1
|
82 |
+
zarr==2.18.3
|
83 |
+
protobuf==5.29.1
|
84 |
+
annotated-types==0.7.0
|
85 |
+
xxhash==3.5.0
|
86 |
+
aiohttp==3.11.10
|
87 |
+
Werkzeug==3.1.3
|
88 |
+
mujoco==2.3.7
|
89 |
+
gymnasium==0.29.1
|
90 |
+
rerun-sdk==0.20.3
|
91 |
+
nvidia-cufft-cu12==11.0.2.54
|
92 |
+
dill==0.3.8
|
93 |
+
scipy==1.14.1
|
94 |
+
hydra-core==1.3.2
|
95 |
+
fsspec==2024.9.0
|
96 |
+
platformdirs==4.3.6
|
97 |
+
PySocks==1.7.1
|
98 |
+
PyOpenGL==3.1.7
|
99 |
+
requests==2.32.3
|
100 |
+
lxml==5.3.0
|
101 |
+
Farama-Notifications==0.0.4
|
102 |
+
nvidia-cuda-nvrtc-cu12==12.1.105
|
103 |
+
numba==0.60.0
|
104 |
+
docker-pycreds==0.4.0
|
105 |
+
six==1.17.0
|
106 |
+
lerobot==0.1.0
|
107 |
+
nvidia-cudnn-cu12==9.1.0.70
|
108 |
+
sentry-sdk==2.19.2
|
109 |
+
absl-py==2.1.0
|
110 |
+
wandb==0.19.0
|
111 |
+
mpmath==1.3.0
|
112 |
+
llvmlite==0.43.0
|
113 |
+
numcodecs==0.13.1
|
114 |
+
GitPython==3.1.43
|
115 |
+
nvidia-nvtx-cu12==12.1.105
|
116 |
+
prompt_toolkit==3.0.48
|
117 |
+
datasets==3.1.0
|
118 |
+
opencv-python==4.10.0.84
|
119 |
+
filelock==3.16.1
|
120 |
+
async-timeout==5.0.1
|
121 |
+
diffusers==0.31.0
|
122 |
+
yarl==1.18.3
|
123 |
+
click==8.1.7
|
124 |
+
asciitree==0.3.3
|
125 |
+
psutil==6.1.0
|
126 |
+
gdown==5.2.0
|
127 |
+
PyYAML==6.0.2
|
128 |
+
urllib3==2.2.3
|
129 |
+
beautifulsoup4==4.12.3
|
wandb/run-20241206_222830-bwwpk9vl/files/wandb-metadata.json
ADDED
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"os": "Linux-6.8.0-1015-aws-x86_64-with-glibc2.35",
|
3 |
+
"python": "CPython 3.10.12",
|
4 |
+
"startedAt": "2024-12-06T22:28:30.311945Z",
|
5 |
+
"args": [
|
6 |
+
"policy=act_aloha_real",
|
7 |
+
"env=aloha_real",
|
8 |
+
"dataset_repo_id=ccop/aloha_stationary_replay_test_v2"
|
9 |
+
],
|
10 |
+
"program": "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py",
|
11 |
+
"codePath": "lerobot/scripts/train.py",
|
12 |
+
"git": {
|
13 |
+
"remote": "[email protected]:HumanoidTeam/lerobot-hackathon.git",
|
14 |
+
"commit": "ab8aa3f8e7b6e5486d7af26ccd319d358ffad579"
|
15 |
+
},
|
16 |
+
"email": "[email protected]",
|
17 |
+
"root": "outputs/train/2024-12-06/22-28-29_real_world_act_default",
|
18 |
+
"host": "ip-172-31-20-130",
|
19 |
+
"username": "humanoidteam",
|
20 |
+
"executable": "/home/ubuntu/lerobot-hackathon/lerobot/bin/python",
|
21 |
+
"codePathLocal": "lerobot/scripts/train.py",
|
22 |
+
"cpu_count": 4,
|
23 |
+
"cpu_count_logical": 8,
|
24 |
+
"gpu": "Tesla T4",
|
25 |
+
"gpu_count": 1,
|
26 |
+
"disk": {
|
27 |
+
"/": {
|
28 |
+
"total": "311993479168",
|
29 |
+
"used": "216540794880"
|
30 |
+
}
|
31 |
+
},
|
32 |
+
"memory": {
|
33 |
+
"total": "33263837184"
|
34 |
+
},
|
35 |
+
"cpu": {
|
36 |
+
"count": 4,
|
37 |
+
"countLogical": 8
|
38 |
+
},
|
39 |
+
"gpu_nvidia": [
|
40 |
+
{
|
41 |
+
"name": "Tesla T4",
|
42 |
+
"memoryTotal": "16106127360",
|
43 |
+
"cudaCores": 2560,
|
44 |
+
"architecture": "Turing"
|
45 |
+
}
|
46 |
+
],
|
47 |
+
"cudaVersion": "12.4"
|
48 |
+
}
|
wandb/run-20241206_222830-bwwpk9vl/files/wandb-summary.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train/lr":1e-05,"train/loss":0.2502947151660919,"train/is_online":false,"train/num_samples":38408,"train/num_episodes":48.01,"train/kld_loss":0.01526648923754692,"train/grad_norm":20.83009910583496,"train/dataloading_s":2.211516670999117,"_timestamp":1.7335293805980325e+09,"_step":4800,"_runtime":5488.627260612,"train/step":4800,"train/l1_loss":0.09762981534004211,"train/num_epochs":48.01,"_wandb":{"runtime":5488},"train/update_s":1.0881254139821976}
|
wandb/run-20241206_222830-bwwpk9vl/logs/debug-core.log
ADDED
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"time":"2024-12-06T22:28:29.883207186Z","level":"INFO","msg":"started logging, with flags","port-filename":"/tmp/tmpf2z320nz/port-2539524.txt","pid":2539524,"debug":false,"disable-analytics":false}
|
2 |
+
{"time":"2024-12-06T22:28:29.883234859Z","level":"INFO","msg":"FeatureState","shutdownOnParentExitEnabled":false}
|
3 |
+
{"time":"2024-12-06T22:28:29.886661968Z","level":"INFO","msg":"Will exit if parent process dies.","ppid":2539524}
|
4 |
+
{"time":"2024-12-06T22:28:29.886681547Z","level":"INFO","msg":"server is running","addr":{"IP":"127.0.0.1","Port":43495,"Zone":""}}
|
5 |
+
{"time":"2024-12-06T22:28:30.072566654Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:55002"}
|
6 |
+
{"time":"2024-12-06T22:28:30.312961224Z","level":"INFO","msg":"handleInformInit: received","streamId":"bwwpk9vl","id":"127.0.0.1:55002"}
|
7 |
+
{"time":"2024-12-06T22:28:30.416433116Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"bwwpk9vl","id":"127.0.0.1:55002"}
|
8 |
+
{"time":"2024-12-06T23:59:58.939118572Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"127.0.0.1:55002"}
|
9 |
+
{"time":"2024-12-06T23:59:58.939192863Z","level":"INFO","msg":"server is shutting down"}
|
10 |
+
{"time":"2024-12-06T23:59:58.939181535Z","level":"INFO","msg":"connection: Close: initiating connection closure","id":"127.0.0.1:55002"}
|
11 |
+
{"time":"2024-12-06T23:59:58.939312003Z","level":"INFO","msg":"connection: Close: connection successfully closed","id":"127.0.0.1:55002"}
|
12 |
+
{"time":"2024-12-07T00:00:06.315410708Z","level":"ERROR","msg":"processOutgoingData: flush error","error":"write tcp 127.0.0.1:43495->127.0.0.1:55002: use of closed network connection","id":"127.0.0.1:55002"}
|
13 |
+
{"time":"2024-12-07T00:00:06.536210754Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"127.0.0.1:55002"}
|
14 |
+
{"time":"2024-12-07T00:00:06.536232465Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"127.0.0.1:55002"}
|
15 |
+
{"time":"2024-12-07T00:00:06.536247048Z","level":"INFO","msg":"server is closed"}
|
wandb/run-20241206_222830-bwwpk9vl/logs/debug-internal.log
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"time":"2024-12-06T22:28:30.313104758Z","level":"INFO","msg":"using version","core version":"0.19.0"}
|
2 |
+
{"time":"2024-12-06T22:28:30.313117284Z","level":"INFO","msg":"created symlink","path":"outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241206_222830-bwwpk9vl/logs/debug-core.log"}
|
3 |
+
{"time":"2024-12-06T22:28:30.416399043Z","level":"INFO","msg":"created new stream","id":"bwwpk9vl"}
|
4 |
+
{"time":"2024-12-06T22:28:30.416428271Z","level":"INFO","msg":"stream: started","id":"bwwpk9vl"}
|
5 |
+
{"time":"2024-12-06T22:28:30.416469205Z","level":"INFO","msg":"handler: started","stream_id":"bwwpk9vl"}
|
6 |
+
{"time":"2024-12-06T22:28:30.416473548Z","level":"INFO","msg":"sender: started","stream_id":"bwwpk9vl"}
|
7 |
+
{"time":"2024-12-06T22:28:30.416459377Z","level":"INFO","msg":"writer: Do: started","stream_id":"bwwpk9vl"}
|
8 |
+
{"time":"2024-12-06T22:28:30.658850895Z","level":"INFO","msg":"Starting system monitor"}
|
9 |
+
{"time":"2024-12-06T23:59:58.939177282Z","level":"INFO","msg":"stream: closing","id":"bwwpk9vl"}
|
10 |
+
{"time":"2024-12-06T23:59:58.939228097Z","level":"INFO","msg":"Stopping system monitor"}
|
11 |
+
{"time":"2024-12-06T23:59:58.939881357Z","level":"INFO","msg":"Stopped system monitor"}
|
12 |
+
{"time":"2024-12-07T00:00:06.36632207Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
13 |
+
{"time":"2024-12-07T00:00:06.536040063Z","level":"INFO","msg":"handler: closed","stream_id":"bwwpk9vl"}
|
14 |
+
{"time":"2024-12-07T00:00:06.536088365Z","level":"INFO","msg":"writer: Close: closed","stream_id":"bwwpk9vl"}
|
15 |
+
{"time":"2024-12-07T00:00:06.536107691Z","level":"INFO","msg":"sender: closed","stream_id":"bwwpk9vl"}
|
16 |
+
{"time":"2024-12-07T00:00:06.536149416Z","level":"INFO","msg":"stream: closed","id":"bwwpk9vl"}
|
wandb/run-20241206_222830-bwwpk9vl/logs/debug.log
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
2024-12-06 22:28:30,306 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Current SDK version is 0.19.0
|
2 |
+
2024-12-06 22:28:30,306 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Configure stats pid to 2539524
|
3 |
+
2024-12-06 22:28:30,306 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/.config/wandb/settings
|
4 |
+
2024-12-06 22:28:30,306 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/lerobot-hackathon/wandb/settings
|
5 |
+
2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Loading settings from environment variables
|
6 |
+
2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_setup.py:_flush():68] wandb: Using wandb-core as the SDK backend. Please refer to https://wandb.me/wandb-core for more information.
|
7 |
+
2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:_log_setup():528] Logging user logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241206_222830-bwwpk9vl/logs/debug.log
|
8 |
+
2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:_log_setup():529] Logging internal logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241206_222830-bwwpk9vl/logs/debug-internal.log
|
9 |
+
2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:init():639] calling init triggers
|
10 |
+
2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:init():645] wandb.init called with sweep_config: {}
|
11 |
+
config: {'resume': False, 'device': 'cuda', 'use_amp': False, 'seed': 1000, 'dataset_repo_id': 'ccop/aloha_stationary_replay_test_v2', 'video_backend': 'pyav', 'training': {'offline_steps': 5000, 'num_workers': 8, 'batch_size': 8, 'eval_freq': -1, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 10000, 'online_steps': 0, 'online_rollout_n_episodes': 1, 'online_rollout_batch_size': 1, 'online_steps_between_rollouts': 1, 'online_sampling_ratio': 0.5, 'online_env_seed': None, 'online_buffer_capacity': None, 'online_buffer_seed_size': 0, 'do_online_rollout_async': False, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'brightness': {'weight': 1, 'min_max': [0.8, 1.2]}, 'contrast': {'weight': 1, 'min_max': [0.8, 1.2]}, 'saturation': {'weight': 1, 'min_max': [0.5, 1.5]}, 'hue': {'weight': 1, 'min_max': [-0.05, 0.05]}, 'sharpness': {'weight': 1, 'min_max': [0.8, 1.2]}}, 'lr': 1e-05, 'lr_backbone': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10, 'delta_timestamps': {'action': '[i / 30 for i in range(100)]'}}, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot_real_aloha', 'notes': 'ws-lerobot-hackathon'}, 'fps': 30, 'env': {'name': 'real_world', 'task': None, 'state_dim': 14, 'action_dim': 14, 'fps': 30}, 'override_dataset_stats': {'observation.images.cam_right_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_left_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_high': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}}, 'policy': {'name': 'act', 'n_obs_steps': 1, 'chunk_size': 100, 'n_action_steps': 100, 'input_shapes': {'observation.images.cam_right_wrist': [3, 480, 640], 'observation.images.cam_left_wrist': [3, 480, 640], 'observation.images.cam_high': [3, 
480, 640], 'observation.state': [14]}, 'output_shapes': {'action': [14]}, 'input_normalization_modes': {'observation.images.cam_right_wrist': 'mean_std', 'observation.images.cam_left_wrist': 'mean_std', 'observation.images.cam_high': 'mean_std', 'observation.state': 'mean_std'}, 'output_normalization_modes': {'action': 'mean_std'}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_momentum': None, 'dropout': 0.1, 'kl_weight': 10.0}}
|
12 |
+
2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:init():688] starting backend
|
13 |
+
2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:init():692] sending inform_init request
|
14 |
+
2024-12-06 22:28:30,311 INFO MainThread:2539524 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
|
15 |
+
2024-12-06 22:28:30,311 INFO MainThread:2539524 [wandb_init.py:init():705] backend started and connected
|
16 |
+
2024-12-06 22:28:30,313 INFO MainThread:2539524 [wandb_init.py:init():798] updated telemetry
|
17 |
+
2024-12-06 22:28:30,319 INFO MainThread:2539524 [wandb_init.py:init():830] communicating run to backend with 90.0 second timeout
|
18 |
+
2024-12-06 22:28:30,655 INFO MainThread:2539524 [wandb_init.py:init():882] starting run threads in backend
|
19 |
+
2024-12-06 22:28:30,767 INFO MainThread:2539524 [wandb_run.py:_console_start():2443] atexit reg
|
20 |
+
2024-12-06 22:28:30,767 INFO MainThread:2539524 [wandb_run.py:_redirect():2293] redirect: wrap_raw
|
21 |
+
2024-12-06 22:28:30,767 INFO MainThread:2539524 [wandb_run.py:_redirect():2358] Wrapping output streams.
|
22 |
+
2024-12-06 22:28:30,767 INFO MainThread:2539524 [wandb_run.py:_redirect():2383] Redirects installed.
|
23 |
+
2024-12-06 22:28:30,769 INFO MainThread:2539524 [wandb_init.py:init():925] run started, returning control to user process
|
24 |
+
2024-12-06 23:59:58,939 WARNING MsgRouterThr:2539524 [router.py:message_loop():75] message_loop has been closed
|
wandb/run-20241206_222830-bwwpk9vl/run-bwwpk9vl.wandb
ADDED
Binary file (931 kB). View file
|
|
wandb/run-20241207_010636-bwwpk9vl/files/config.yaml
ADDED
@@ -0,0 +1,296 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_wandb:
|
2 |
+
value:
|
3 |
+
cli_version: 0.19.0
|
4 |
+
m: []
|
5 |
+
python_version: 3.10.12
|
6 |
+
t:
|
7 |
+
"1":
|
8 |
+
- 1
|
9 |
+
- 41
|
10 |
+
- 49
|
11 |
+
- 50
|
12 |
+
- 51
|
13 |
+
- 55
|
14 |
+
"2":
|
15 |
+
- 1
|
16 |
+
- 41
|
17 |
+
- 49
|
18 |
+
- 50
|
19 |
+
- 51
|
20 |
+
- 55
|
21 |
+
"3":
|
22 |
+
- 5
|
23 |
+
- 13
|
24 |
+
- 14
|
25 |
+
- 15
|
26 |
+
- 16
|
27 |
+
- 23
|
28 |
+
- 55
|
29 |
+
- 62
|
30 |
+
"4": 3.10.12
|
31 |
+
"5": 0.19.0
|
32 |
+
"8":
|
33 |
+
- 5
|
34 |
+
"12": 0.19.0
|
35 |
+
"13": linux-x86_64
|
36 |
+
dataset_repo_id:
|
37 |
+
value: ccop/aloha_stationary_replay_test_v2
|
38 |
+
device:
|
39 |
+
value: cuda
|
40 |
+
env:
|
41 |
+
value:
|
42 |
+
action_dim: 14
|
43 |
+
fps: 30
|
44 |
+
name: real_world
|
45 |
+
state_dim: 14
|
46 |
+
task: null
|
47 |
+
eval:
|
48 |
+
value:
|
49 |
+
batch_size: 50
|
50 |
+
n_episodes: 50
|
51 |
+
use_async_envs: false
|
52 |
+
fps:
|
53 |
+
value: 30
|
54 |
+
override_dataset_stats:
|
55 |
+
value:
|
56 |
+
observation.images.cam_high:
|
57 |
+
mean:
|
58 |
+
- - - 0.485
|
59 |
+
- - - 0.456
|
60 |
+
- - - 0.406
|
61 |
+
std:
|
62 |
+
- - - 0.229
|
63 |
+
- - - 0.224
|
64 |
+
- - - 0.225
|
65 |
+
observation.images.cam_left_wrist:
|
66 |
+
mean:
|
67 |
+
- - - 0.485
|
68 |
+
- - - 0.456
|
69 |
+
- - - 0.406
|
70 |
+
std:
|
71 |
+
- - - 0.229
|
72 |
+
- - - 0.224
|
73 |
+
- - - 0.225
|
74 |
+
observation.images.cam_right_wrist:
|
75 |
+
mean:
|
76 |
+
- - - 0.485
|
77 |
+
- - - 0.456
|
78 |
+
- - - 0.406
|
79 |
+
std:
|
80 |
+
- - - 0.229
|
81 |
+
- - - 0.224
|
82 |
+
- - - 0.225
|
83 |
+
policy:
|
84 |
+
value:
|
85 |
+
chunk_size: 100
|
86 |
+
dim_feedforward: 3200
|
87 |
+
dim_model: 512
|
88 |
+
dropout: 0.1
|
89 |
+
feedforward_activation: relu
|
90 |
+
input_normalization_modes:
|
91 |
+
observation.images.cam_high: mean_std
|
92 |
+
observation.images.cam_left_wrist: mean_std
|
93 |
+
observation.images.cam_right_wrist: mean_std
|
94 |
+
observation.state: mean_std
|
95 |
+
input_shapes:
|
96 |
+
observation.images.cam_high:
|
97 |
+
- 3
|
98 |
+
- 480
|
99 |
+
- 640
|
100 |
+
observation.images.cam_left_wrist:
|
101 |
+
- 3
|
102 |
+
- 480
|
103 |
+
- 640
|
104 |
+
observation.images.cam_right_wrist:
|
105 |
+
- 3
|
106 |
+
- 480
|
107 |
+
- 640
|
108 |
+
observation.state:
|
109 |
+
- 14
|
110 |
+
kl_weight: 10
|
111 |
+
latent_dim: 32
|
112 |
+
n_action_steps: 100
|
113 |
+
n_decoder_layers: 1
|
114 |
+
n_encoder_layers: 4
|
115 |
+
n_heads: 8
|
116 |
+
n_obs_steps: 1
|
117 |
+
n_vae_encoder_layers: 4
|
118 |
+
name: act
|
119 |
+
output_normalization_modes:
|
120 |
+
action: mean_std
|
121 |
+
output_shapes:
|
122 |
+
action:
|
123 |
+
- 14
|
124 |
+
pre_norm: false
|
125 |
+
pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
|
126 |
+
replace_final_stride_with_dilation: false
|
127 |
+
temporal_ensemble_momentum: null
|
128 |
+
use_vae: true
|
129 |
+
vision_backbone: resnet18
|
130 |
+
resume:
|
131 |
+
value: true
|
132 |
+
seed:
|
133 |
+
value: 1000
|
134 |
+
training:
|
135 |
+
value:
|
136 |
+
batch_size: 8
|
137 |
+
delta_timestamps:
|
138 |
+
action:
|
139 |
+
- 0
|
140 |
+
- 0.03333333333333333
|
141 |
+
- 0.06666666666666667
|
142 |
+
- 0.1
|
143 |
+
- 0.13333333333333333
|
144 |
+
- 0.16666666666666666
|
145 |
+
- 0.2
|
146 |
+
- 0.23333333333333334
|
147 |
+
- 0.26666666666666666
|
148 |
+
- 0.3
|
149 |
+
- 0.3333333333333333
|
150 |
+
- 0.36666666666666664
|
151 |
+
- 0.4
|
152 |
+
- 0.43333333333333335
|
153 |
+
- 0.4666666666666667
|
154 |
+
- 0.5
|
155 |
+
- 0.5333333333333333
|
156 |
+
- 0.5666666666666667
|
157 |
+
- 0.6
|
158 |
+
- 0.6333333333333333
|
159 |
+
- 0.6666666666666666
|
160 |
+
- 0.7
|
161 |
+
- 0.7333333333333333
|
162 |
+
- 0.7666666666666667
|
163 |
+
- 0.8
|
164 |
+
- 0.8333333333333334
|
165 |
+
- 0.8666666666666667
|
166 |
+
- 0.9
|
167 |
+
- 0.9333333333333333
|
168 |
+
- 0.9666666666666667
|
169 |
+
- 1
|
170 |
+
- 1.0333333333333334
|
171 |
+
- 1.0666666666666667
|
172 |
+
- 1.1
|
173 |
+
- 1.1333333333333333
|
174 |
+
- 1.1666666666666667
|
175 |
+
- 1.2
|
176 |
+
- 1.2333333333333334
|
177 |
+
- 1.2666666666666666
|
178 |
+
- 1.3
|
179 |
+
- 1.3333333333333333
|
180 |
+
- 1.3666666666666667
|
181 |
+
- 1.4
|
182 |
+
- 1.4333333333333333
|
183 |
+
- 1.4666666666666666
|
184 |
+
- 1.5
|
185 |
+
- 1.5333333333333334
|
186 |
+
- 1.5666666666666667
|
187 |
+
- 1.6
|
188 |
+
- 1.6333333333333333
|
189 |
+
- 1.6666666666666667
|
190 |
+
- 1.7
|
191 |
+
- 1.7333333333333334
|
192 |
+
- 1.7666666666666666
|
193 |
+
- 1.8
|
194 |
+
- 1.8333333333333333
|
195 |
+
- 1.8666666666666667
|
196 |
+
- 1.9
|
197 |
+
- 1.9333333333333333
|
198 |
+
- 1.9666666666666666
|
199 |
+
- 2
|
200 |
+
- 2.033333333333333
|
201 |
+
- 2.066666666666667
|
202 |
+
- 2.1
|
203 |
+
- 2.1333333333333333
|
204 |
+
- 2.1666666666666665
|
205 |
+
- 2.2
|
206 |
+
- 2.2333333333333334
|
207 |
+
- 2.2666666666666666
|
208 |
+
- 2.3
|
209 |
+
- 2.3333333333333335
|
210 |
+
- 2.3666666666666667
|
211 |
+
- 2.4
|
212 |
+
- 2.433333333333333
|
213 |
+
- 2.466666666666667
|
214 |
+
- 2.5
|
215 |
+
- 2.533333333333333
|
216 |
+
- 2.566666666666667
|
217 |
+
- 2.6
|
218 |
+
- 2.6333333333333333
|
219 |
+
- 2.6666666666666665
|
220 |
+
- 2.7
|
221 |
+
- 2.7333333333333334
|
222 |
+
- 2.7666666666666666
|
223 |
+
- 2.8
|
224 |
+
- 2.8333333333333335
|
225 |
+
- 2.8666666666666667
|
226 |
+
- 2.9
|
227 |
+
- 2.933333333333333
|
228 |
+
- 2.966666666666667
|
229 |
+
- 3
|
230 |
+
- 3.033333333333333
|
231 |
+
- 3.066666666666667
|
232 |
+
- 3.1
|
233 |
+
- 3.1333333333333333
|
234 |
+
- 3.1666666666666665
|
235 |
+
- 3.2
|
236 |
+
- 3.2333333333333334
|
237 |
+
- 3.2666666666666666
|
238 |
+
- 3.3
|
239 |
+
do_online_rollout_async: false
|
240 |
+
eval_freq: -1
|
241 |
+
grad_clip_norm: 10
|
242 |
+
image_transforms:
|
243 |
+
brightness:
|
244 |
+
min_max:
|
245 |
+
- 0.8
|
246 |
+
- 1.2
|
247 |
+
weight: 1
|
248 |
+
contrast:
|
249 |
+
min_max:
|
250 |
+
- 0.8
|
251 |
+
- 1.2
|
252 |
+
weight: 1
|
253 |
+
enable: false
|
254 |
+
hue:
|
255 |
+
min_max:
|
256 |
+
- -0.05
|
257 |
+
- 0.05
|
258 |
+
weight: 1
|
259 |
+
max_num_transforms: 3
|
260 |
+
random_order: false
|
261 |
+
saturation:
|
262 |
+
min_max:
|
263 |
+
- 0.5
|
264 |
+
- 1.5
|
265 |
+
weight: 1
|
266 |
+
sharpness:
|
267 |
+
min_max:
|
268 |
+
- 0.8
|
269 |
+
- 1.2
|
270 |
+
weight: 1
|
271 |
+
log_freq: 200
|
272 |
+
lr: 1e-05
|
273 |
+
lr_backbone: 1e-05
|
274 |
+
num_workers: 8
|
275 |
+
offline_steps: 5000
|
276 |
+
online_buffer_capacity: null
|
277 |
+
online_buffer_seed_size: 0
|
278 |
+
online_env_seed: null
|
279 |
+
online_rollout_batch_size: 1
|
280 |
+
online_rollout_n_episodes: 1
|
281 |
+
online_sampling_ratio: 0.5
|
282 |
+
online_steps: 0
|
283 |
+
online_steps_between_rollouts: 1
|
284 |
+
save_checkpoint: true
|
285 |
+
save_freq: 10000
|
286 |
+
weight_decay: 0.0001
|
287 |
+
use_amp:
|
288 |
+
value: false
|
289 |
+
video_backend:
|
290 |
+
value: pyav
|
291 |
+
wandb:
|
292 |
+
value:
|
293 |
+
disable_artifact: false
|
294 |
+
enable: true
|
295 |
+
notes: ws-lerobot-hackathon
|
296 |
+
project: lerobot_real_aloha
|
wandb/run-20241207_010636-bwwpk9vl/files/output.log
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[1m[34mLogs will be synced with wandb.[0m
|
2 |
+
INFO 2024-12-07 01:06:36 n/logger.py:132 Track this run --> [1m[33mhttps://wandb.ai/zaringleb/lerobot_real_aloha/runs/bwwpk9vl[0m
|
3 |
+
INFO 2024-12-07 01:06:36 ts/train.py:312 make_dataset
|
4 |
+
WARNING 2024-12-07 01:06:36 s/factory.py:68 There might be a mismatch between your training dataset (dataset_repo_id='ccop/aloha_stationary_replay_test_v2') and your environment (cfg.env.name='real_world').
|
5 |
+
Fetching 9 files: 100%|█████████████████████████████████████████████████████████████████████████████████████████████| 9/9 [00:00<00:00, 19774.09it/s]
|
6 |
+
INFO 2024-12-07 01:06:39 ts/train.py:328 make_policy
|
7 |
+
WARNING 2024-12-07 01:06:39 s/factory.py:28 Hydra config is missing arguments: {'temporal_ensemble_coeff'}
|
8 |
+
Loading weights from local directory
|
9 |
+
/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py:338: FutureWarning: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.
|
10 |
+
grad_scaler = GradScaler(enabled=cfg.use_amp)
|
11 |
+
Error executing job with overrides: ['policy=act_aloha_real', 'env=aloha_real', 'dataset_repo_id=ccop/aloha_stationary_replay_test_v2', 'resume=true', 'dataset_repo_id=HumanoidTeam/aloha_real_test', 'training.offline_steps=5010']
|
12 |
+
Traceback (most recent call last):
|
13 |
+
File "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py", line 652, in train_cli
|
14 |
+
train(
|
15 |
+
File "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py", line 343, in train
|
16 |
+
step = logger.load_last_training_state(optimizer, lr_scheduler)
|
17 |
+
File "/home/ubuntu/lerobot-hackathon/lerobot/common/logger.py", line 218, in load_last_training_state
|
18 |
+
training_state = torch.load(self.last_checkpoint_dir / self.training_state_file_name)
|
19 |
+
File "/home/ubuntu/lerobot-hackathon/lerobot/lib/python3.10/site-packages/torch/serialization.py", line 1444, in load
|
20 |
+
raise pickle.UnpicklingError(_get_wo_message(str(e))) from None
|
21 |
+
_pickle.UnpicklingError: Weights only load failed. This file can still be loaded, to do so you have two options, [1mdo those steps only if you trust the source of the checkpoint[0m.
|
22 |
+
(1) Re-running `torch.load` with `weights_only` set to `False` will likely succeed, but it can result in arbitrary code execution. Do it only if you got the file from a trusted source.
|
23 |
+
(2) Alternatively, to load with `weights_only=True` please check the recommended steps in the following error message.
|
24 |
+
WeightsUnpickler error: Unsupported global: GLOBAL numpy.core.multiarray._reconstruct was not an allowed global by default. Please use `torch.serialization.add_safe_globals([_reconstruct])` or the `torch.serialization.safe_globals([_reconstruct])` context manager to allowlist this global if you trust this class/function.
|
25 |
+
|
26 |
+
Check the documentation of torch.load to learn more about types accepted by default with weights_only https://pytorch.org/docs/stable/generated/torch.load.html.
|
27 |
+
|
28 |
+
Set the environment variable HYDRA_FULL_ERROR=1 for a complete stack trace.
|
wandb/run-20241207_010636-bwwpk9vl/files/requirements.txt
ADDED
@@ -0,0 +1,129 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
pymunk==6.9.0
|
2 |
+
charset-normalizer==3.4.0
|
3 |
+
pip==22.0.2
|
4 |
+
multidict==6.1.0
|
5 |
+
pytz==2024.2
|
6 |
+
pandas==2.2.3
|
7 |
+
fasteners==0.19
|
8 |
+
einops==0.8.0
|
9 |
+
setproctitle==1.3.4
|
10 |
+
python-dateutil==2.9.0.post0
|
11 |
+
pydantic==2.10.3
|
12 |
+
dm-control==1.0.14
|
13 |
+
MarkupSafe==3.0.2
|
14 |
+
safetensors==0.4.5
|
15 |
+
cloudpickle==3.1.0
|
16 |
+
imageio-ffmpeg==0.5.1
|
17 |
+
smmap==5.0.1
|
18 |
+
huggingface-hub==0.26.5
|
19 |
+
torch==2.6.0.dev20241112+cu121
|
20 |
+
nvidia-cusolver-cu12==11.4.5.107
|
21 |
+
inquirerpy==0.3.4
|
22 |
+
soupsieve==2.6
|
23 |
+
deepdiff==8.0.1
|
24 |
+
nvidia-nvjitlink-cu12==12.4.127
|
25 |
+
aiosignal==1.3.1
|
26 |
+
dm-tree==0.1.8
|
27 |
+
aiohappyeyeballs==2.4.4
|
28 |
+
propcache==0.2.1
|
29 |
+
gym-aloha==0.1.1
|
30 |
+
labmaze==1.0.6
|
31 |
+
pyav==14.0.1
|
32 |
+
nvidia-cuda-cupti-cu12==12.1.105
|
33 |
+
cffi==1.17.1
|
34 |
+
importlib_metadata==8.5.0
|
35 |
+
nvidia-cuda-runtime-cu12==12.1.105
|
36 |
+
pycparser==2.22
|
37 |
+
h5py==3.12.1
|
38 |
+
nvidia-nccl-cu12==2.21.5
|
39 |
+
orderly-set==5.2.2
|
40 |
+
pyarrow==18.1.0
|
41 |
+
Flask==3.1.0
|
42 |
+
multiprocess==0.70.16
|
43 |
+
blinker==1.9.0
|
44 |
+
regex==2024.11.6
|
45 |
+
Jinja2==3.1.4
|
46 |
+
tqdm==4.67.1
|
47 |
+
certifi==2024.8.30
|
48 |
+
frozenlist==1.5.0
|
49 |
+
attrs==24.2.0
|
50 |
+
pytorch-triton==3.1.0+cf34004b8a
|
51 |
+
omegaconf==2.3.0
|
52 |
+
itsdangerous==2.2.0
|
53 |
+
packaging==24.2
|
54 |
+
pfzy==0.3.4
|
55 |
+
pydantic_core==2.27.1
|
56 |
+
antlr4-python3-runtime==4.9.3
|
57 |
+
cmake==3.31.1
|
58 |
+
imageio==2.36.1
|
59 |
+
setuptools==59.6.0
|
60 |
+
nvidia-cusparselt-cu12==0.6.2
|
61 |
+
zipp==3.21.0
|
62 |
+
torchvision==0.20.0.dev20241112+cu121
|
63 |
+
nvidia-curand-cu12==10.3.2.106
|
64 |
+
PyOpenGL-accelerate==3.1.7
|
65 |
+
numpy==1.26.4
|
66 |
+
dm-env==1.6
|
67 |
+
nvidia-cusparse-cu12==12.1.0.106
|
68 |
+
networkx==3.4.2
|
69 |
+
triton==3.1.0
|
70 |
+
termcolor==2.5.0
|
71 |
+
gitdb==4.0.11
|
72 |
+
torchaudio==2.5.0.dev20241112+cu121
|
73 |
+
glfw==2.8.0
|
74 |
+
tzdata==2024.2
|
75 |
+
pillow==11.0.0
|
76 |
+
idna==3.10
|
77 |
+
pyparsing==3.2.0
|
78 |
+
typing_extensions==4.12.2
|
79 |
+
wcwidth==0.2.13
|
80 |
+
sympy==1.13.1
|
81 |
+
nvidia-cublas-cu12==12.1.3.1
|
82 |
+
zarr==2.18.3
|
83 |
+
protobuf==5.29.1
|
84 |
+
annotated-types==0.7.0
|
85 |
+
xxhash==3.5.0
|
86 |
+
aiohttp==3.11.10
|
87 |
+
Werkzeug==3.1.3
|
88 |
+
mujoco==2.3.7
|
89 |
+
gymnasium==0.29.1
|
90 |
+
rerun-sdk==0.20.3
|
91 |
+
nvidia-cufft-cu12==11.0.2.54
|
92 |
+
dill==0.3.8
|
93 |
+
scipy==1.14.1
|
94 |
+
hydra-core==1.3.2
|
95 |
+
fsspec==2024.9.0
|
96 |
+
platformdirs==4.3.6
|
97 |
+
PySocks==1.7.1
|
98 |
+
PyOpenGL==3.1.7
|
99 |
+
requests==2.32.3
|
100 |
+
lxml==5.3.0
|
101 |
+
Farama-Notifications==0.0.4
|
102 |
+
nvidia-cuda-nvrtc-cu12==12.1.105
|
103 |
+
numba==0.60.0
|
104 |
+
docker-pycreds==0.4.0
|
105 |
+
six==1.17.0
|
106 |
+
lerobot==0.1.0
|
107 |
+
nvidia-cudnn-cu12==9.1.0.70
|
108 |
+
sentry-sdk==2.19.2
|
109 |
+
absl-py==2.1.0
|
110 |
+
wandb==0.19.0
|
111 |
+
mpmath==1.3.0
|
112 |
+
llvmlite==0.43.0
|
113 |
+
numcodecs==0.13.1
|
114 |
+
GitPython==3.1.43
|
115 |
+
nvidia-nvtx-cu12==12.1.105
|
116 |
+
prompt_toolkit==3.0.48
|
117 |
+
datasets==3.1.0
|
118 |
+
opencv-python==4.10.0.84
|
119 |
+
filelock==3.16.1
|
120 |
+
async-timeout==5.0.1
|
121 |
+
diffusers==0.31.0
|
122 |
+
yarl==1.18.3
|
123 |
+
click==8.1.7
|
124 |
+
asciitree==0.3.3
|
125 |
+
psutil==6.1.0
|
126 |
+
gdown==5.2.0
|
127 |
+
PyYAML==6.0.2
|
128 |
+
urllib3==2.2.3
|
129 |
+
beautifulsoup4==4.12.3
|
wandb/run-20241207_010636-bwwpk9vl/files/wandb-metadata.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"os": "Linux-6.8.0-1015-aws-x86_64-with-glibc2.35",
|
3 |
+
"python": "CPython 3.10.12",
|
4 |
+
"startedAt": "2024-12-07T01:06:36.020217Z",
|
5 |
+
"args": [
|
6 |
+
"policy=act_aloha_real",
|
7 |
+
"env=aloha_real",
|
8 |
+
"dataset_repo_id=ccop/aloha_stationary_replay_test_v2",
|
9 |
+
"hydra.run.dir=outputs/train/2024-12-06/22-28-29_real_world_act_default",
|
10 |
+
"resume=true",
|
11 |
+
"dataset_repo_id=HumanoidTeam/aloha_real_test",
|
12 |
+
"training.offline_steps=5010"
|
13 |
+
],
|
14 |
+
"program": "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py",
|
15 |
+
"codePath": "lerobot/scripts/train.py",
|
16 |
+
"git": {
|
17 |
+
"remote": "[email protected]:HumanoidTeam/lerobot-hackathon.git",
|
18 |
+
"commit": "ab8aa3f8e7b6e5486d7af26ccd319d358ffad579"
|
19 |
+
},
|
20 |
+
"email": "[email protected]",
|
21 |
+
"root": "outputs/train/2024-12-06/22-28-29_real_world_act_default",
|
22 |
+
"host": "ip-172-31-20-130",
|
23 |
+
"username": "humanoidteam",
|
24 |
+
"executable": "/home/ubuntu/lerobot-hackathon/lerobot/bin/python",
|
25 |
+
"codePathLocal": "lerobot/scripts/train.py",
|
26 |
+
"cpu_count": 4,
|
27 |
+
"cpu_count_logical": 8,
|
28 |
+
"gpu": "Tesla T4",
|
29 |
+
"gpu_count": 1,
|
30 |
+
"disk": {
|
31 |
+
"/": {
|
32 |
+
"total": "311993479168",
|
33 |
+
"used": "217724030976"
|
34 |
+
}
|
35 |
+
},
|
36 |
+
"memory": {
|
37 |
+
"total": "33263837184"
|
38 |
+
},
|
39 |
+
"cpu": {
|
40 |
+
"count": 4,
|
41 |
+
"countLogical": 8
|
42 |
+
},
|
43 |
+
"gpu_nvidia": [
|
44 |
+
{
|
45 |
+
"name": "Tesla T4",
|
46 |
+
"memoryTotal": "16106127360",
|
47 |
+
"cudaCores": 2560,
|
48 |
+
"architecture": "Turing"
|
49 |
+
}
|
50 |
+
],
|
51 |
+
"cudaVersion": "12.4"
|
52 |
+
}
|
wandb/run-20241207_010636-bwwpk9vl/files/wandb-summary.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train/num_episodes":48.01,"train/is_online":false,"train/num_epochs":48.01,"_runtime":5488.627260612,"train/dataloading_s":2.211516670999117,"train/loss":0.2502947151660919,"_wandb":{"runtime":5493},"train/l1_loss":0.09762981534004211,"train/lr":1e-05,"train/step":4800,"train/grad_norm":20.83009910583496,"_step":4800,"train/num_samples":38408,"_timestamp":1.7335293805980325e+09,"train/update_s":1.0881254139821976,"train/kld_loss":0.01526648923754692}
|
wandb/run-20241207_010636-bwwpk9vl/logs/debug-core.log
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"time":"2024-12-07T01:06:35.555739791Z","level":"INFO","msg":"started logging, with flags","port-filename":"/tmp/tmpw4k2sq2e/port-3507304.txt","pid":3507304,"debug":false,"disable-analytics":false}
|
2 |
+
{"time":"2024-12-07T01:06:35.555772863Z","level":"INFO","msg":"FeatureState","shutdownOnParentExitEnabled":false}
|
3 |
+
{"time":"2024-12-07T01:06:35.559538633Z","level":"INFO","msg":"Will exit if parent process dies.","ppid":3507304}
|
4 |
+
{"time":"2024-12-07T01:06:35.559558787Z","level":"INFO","msg":"server is running","addr":{"IP":"127.0.0.1","Port":41501,"Zone":""}}
|
5 |
+
{"time":"2024-12-07T01:06:35.744706996Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:49972"}
|
6 |
+
{"time":"2024-12-07T01:06:36.021210331Z","level":"INFO","msg":"handleInformInit: received","streamId":"bwwpk9vl","id":"127.0.0.1:49972"}
|
7 |
+
{"time":"2024-12-07T01:06:36.124059246Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"bwwpk9vl","id":"127.0.0.1:49972"}
|
8 |
+
{"time":"2024-12-07T01:06:41.270283035Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"127.0.0.1:49972"}
|
9 |
+
{"time":"2024-12-07T01:06:41.270348753Z","level":"INFO","msg":"server is shutting down"}
|
10 |
+
{"time":"2024-12-07T01:06:41.270339778Z","level":"INFO","msg":"connection: Close: initiating connection closure","id":"127.0.0.1:49972"}
|
11 |
+
{"time":"2024-12-07T01:06:41.270441093Z","level":"INFO","msg":"connection: Close: connection successfully closed","id":"127.0.0.1:49972"}
|
12 |
+
{"time":"2024-12-07T01:06:42.336511877Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"127.0.0.1:49972"}
|
13 |
+
{"time":"2024-12-07T01:06:42.336534508Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"127.0.0.1:49972"}
|
14 |
+
{"time":"2024-12-07T01:06:42.336548673Z","level":"INFO","msg":"server is closed"}
|
wandb/run-20241207_010636-bwwpk9vl/logs/debug-internal.log
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"time":"2024-12-07T01:06:36.021365256Z","level":"INFO","msg":"using version","core version":"0.19.0"}
|
2 |
+
{"time":"2024-12-07T01:06:36.021379424Z","level":"INFO","msg":"created symlink","path":"outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010636-bwwpk9vl/logs/debug-core.log"}
|
3 |
+
{"time":"2024-12-07T01:06:36.124016018Z","level":"INFO","msg":"created new stream","id":"bwwpk9vl"}
|
4 |
+
{"time":"2024-12-07T01:06:36.124052183Z","level":"INFO","msg":"stream: started","id":"bwwpk9vl"}
|
5 |
+
{"time":"2024-12-07T01:06:36.124086504Z","level":"INFO","msg":"writer: Do: started","stream_id":"bwwpk9vl"}
|
6 |
+
{"time":"2024-12-07T01:06:36.124086178Z","level":"INFO","msg":"sender: started","stream_id":"bwwpk9vl"}
|
7 |
+
{"time":"2024-12-07T01:06:36.124165775Z","level":"INFO","msg":"handler: started","stream_id":"bwwpk9vl"}
|
8 |
+
{"time":"2024-12-07T01:06:36.467542952Z","level":"INFO","msg":"Starting system monitor"}
|
9 |
+
{"time":"2024-12-07T01:06:41.27033621Z","level":"INFO","msg":"stream: closing","id":"bwwpk9vl"}
|
10 |
+
{"time":"2024-12-07T01:06:41.270379684Z","level":"INFO","msg":"Stopping system monitor"}
|
11 |
+
{"time":"2024-12-07T01:06:41.270898953Z","level":"INFO","msg":"Stopped system monitor"}
|
12 |
+
{"time":"2024-12-07T01:06:42.191128546Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
13 |
+
{"time":"2024-12-07T01:06:42.336356796Z","level":"INFO","msg":"handler: closed","stream_id":"bwwpk9vl"}
|
14 |
+
{"time":"2024-12-07T01:06:42.336396896Z","level":"INFO","msg":"writer: Close: closed","stream_id":"bwwpk9vl"}
|
15 |
+
{"time":"2024-12-07T01:06:42.336425596Z","level":"INFO","msg":"sender: closed","stream_id":"bwwpk9vl"}
|
16 |
+
{"time":"2024-12-07T01:06:42.336454571Z","level":"INFO","msg":"stream: closed","id":"bwwpk9vl"}
|
wandb/run-20241207_010636-bwwpk9vl/logs/debug.log
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Current SDK version is 0.19.0
|
2 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Configure stats pid to 3507304
|
3 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/.config/wandb/settings
|
4 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/lerobot-hackathon/wandb/settings
|
5 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Loading settings from environment variables
|
6 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] wandb: Using wandb-core as the SDK backend. Please refer to https://wandb.me/wandb-core for more information.
|
7 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:_log_setup():528] Logging user logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010636-bwwpk9vl/logs/debug.log
|
8 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:_log_setup():529] Logging internal logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010636-bwwpk9vl/logs/debug-internal.log
|
9 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:init():639] calling init triggers
|
10 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:init():645] wandb.init called with sweep_config: {}
|
11 |
+
config: {'resume': True, 'device': 'cuda', 'use_amp': False, 'seed': 1000, 'dataset_repo_id': 'ccop/aloha_stationary_replay_test_v2', 'video_backend': 'pyav', 'training': {'offline_steps': 5000, 'num_workers': 8, 'batch_size': 8, 'eval_freq': -1, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 10000, 'online_steps': 0, 'online_rollout_n_episodes': 1, 'online_rollout_batch_size': 1, 'online_steps_between_rollouts': 1, 'online_sampling_ratio': 0.5, 'online_env_seed': None, 'online_buffer_capacity': None, 'online_buffer_seed_size': 0, 'do_online_rollout_async': False, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'brightness': {'weight': 1, 'min_max': [0.8, 1.2]}, 'contrast': {'weight': 1, 'min_max': [0.8, 1.2]}, 'saturation': {'weight': 1, 'min_max': [0.5, 1.5]}, 'hue': {'weight': 1, 'min_max': [-0.05, 0.05]}, 'sharpness': {'weight': 1, 'min_max': [0.8, 1.2]}}, 'lr': 1e-05, 'lr_backbone': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10, 'delta_timestamps': {'action': [0.0, 0.03333333333333333, 0.06666666666666667, 0.1, 0.13333333333333333, 0.16666666666666666, 0.2, 0.23333333333333334, 0.26666666666666666, 0.3, 0.3333333333333333, 0.36666666666666664, 0.4, 0.43333333333333335, 0.4666666666666667, 0.5, 0.5333333333333333, 0.5666666666666667, 0.6, 0.6333333333333333, 0.6666666666666666, 0.7, 0.7333333333333333, 0.7666666666666667, 0.8, 0.8333333333333334, 0.8666666666666667, 0.9, 0.9333333333333333, 0.9666666666666667, 1.0, 1.0333333333333334, 1.0666666666666667, 1.1, 1.1333333333333333, 1.1666666666666667, 1.2, 1.2333333333333334, 1.2666666666666666, 1.3, 1.3333333333333333, 1.3666666666666667, 1.4, 1.4333333333333333, 1.4666666666666666, 1.5, 1.5333333333333334, 1.5666666666666667, 1.6, 1.6333333333333333, 1.6666666666666667, 1.7, 1.7333333333333334, 1.7666666666666666, 1.8, 1.8333333333333333, 1.8666666666666667, 1.9, 1.9333333333333333, 1.9666666666666666, 2.0, 2.033333333333333, 2.066666666666667, 2.1, 
2.1333333333333333, 2.1666666666666665, 2.2, 2.2333333333333334, 2.2666666666666666, 2.3, 2.3333333333333335, 2.3666666666666667, 2.4, 2.433333333333333, 2.466666666666667, 2.5, 2.533333333333333, 2.566666666666667, 2.6, 2.6333333333333333, 2.6666666666666665, 2.7, 2.7333333333333334, 2.7666666666666666, 2.8, 2.8333333333333335, 2.8666666666666667, 2.9, 2.933333333333333, 2.966666666666667, 3.0, 3.033333333333333, 3.066666666666667, 3.1, 3.1333333333333333, 3.1666666666666665, 3.2, 3.2333333333333334, 3.2666666666666666, 3.3]}}, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot_real_aloha', 'notes': 'ws-lerobot-hackathon'}, 'fps': 30, 'env': {'name': 'real_world', 'task': None, 'state_dim': 14, 'action_dim': 14, 'fps': 30}, 'override_dataset_stats': {'observation.images.cam_right_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_left_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_high': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}}, 'policy': {'name': 'act', 'n_obs_steps': 1, 'chunk_size': 100, 'n_action_steps': 100, 'input_shapes': {'observation.images.cam_right_wrist': [3, 480, 640], 'observation.images.cam_left_wrist': [3, 480, 640], 'observation.images.cam_high': [3, 480, 640], 'observation.state': [14]}, 'output_shapes': {'action': [14]}, 'input_normalization_modes': {'observation.images.cam_right_wrist': 'mean_std', 'observation.images.cam_left_wrist': 'mean_std', 'observation.images.cam_high': 'mean_std', 'observation.state': 'mean_std'}, 'output_normalization_modes': {'action': 'mean_std'}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 
'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_momentum': None, 'dropout': 0.1, 'kl_weight': 10.0}}
|
12 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:init():688] starting backend
|
13 |
+
2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:init():692] sending inform_init request
|
14 |
+
2024-12-07 01:06:36,019 INFO MainThread:3507304 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
|
15 |
+
2024-12-07 01:06:36,020 INFO MainThread:3507304 [wandb_init.py:init():705] backend started and connected
|
16 |
+
2024-12-07 01:06:36,022 INFO MainThread:3507304 [wandb_init.py:init():798] updated telemetry
|
17 |
+
2024-12-07 01:06:36,027 INFO MainThread:3507304 [wandb_init.py:init():830] communicating run to backend with 90.0 second timeout
|
18 |
+
2024-12-07 01:06:36,459 INFO MainThread:3507304 [wandb_init.py:init():875] run resumed
|
19 |
+
2024-12-07 01:06:36,463 INFO MainThread:3507304 [wandb_init.py:init():882] starting run threads in backend
|
20 |
+
2024-12-07 01:06:36,579 INFO MainThread:3507304 [wandb_run.py:_console_start():2443] atexit reg
|
21 |
+
2024-12-07 01:06:36,579 INFO MainThread:3507304 [wandb_run.py:_redirect():2293] redirect: wrap_raw
|
22 |
+
2024-12-07 01:06:36,580 INFO MainThread:3507304 [wandb_run.py:_redirect():2358] Wrapping output streams.
|
23 |
+
2024-12-07 01:06:36,580 INFO MainThread:3507304 [wandb_run.py:_redirect():2383] Redirects installed.
|
24 |
+
2024-12-07 01:06:36,581 INFO MainThread:3507304 [wandb_init.py:init():925] run started, returning control to user process
|
25 |
+
2024-12-07 01:06:41,270 WARNING MsgRouterThr:3507304 [router.py:message_loop():75] message_loop has been closed
|
wandb/run-20241207_010636-bwwpk9vl/run-bwwpk9vl.wandb
ADDED
Binary file (10.6 kB). View file
|
|
wandb/run-20241207_010741-bwwpk9vl/files/config.yaml
ADDED
@@ -0,0 +1,296 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
_wandb:
|
2 |
+
value:
|
3 |
+
cli_version: 0.19.0
|
4 |
+
m: []
|
5 |
+
python_version: 3.10.12
|
6 |
+
t:
|
7 |
+
"1":
|
8 |
+
- 1
|
9 |
+
- 41
|
10 |
+
- 49
|
11 |
+
- 50
|
12 |
+
- 51
|
13 |
+
- 55
|
14 |
+
"2":
|
15 |
+
- 1
|
16 |
+
- 41
|
17 |
+
- 49
|
18 |
+
- 50
|
19 |
+
- 51
|
20 |
+
- 55
|
21 |
+
"3":
|
22 |
+
- 5
|
23 |
+
- 13
|
24 |
+
- 14
|
25 |
+
- 15
|
26 |
+
- 16
|
27 |
+
- 23
|
28 |
+
- 55
|
29 |
+
- 62
|
30 |
+
"4": 3.10.12
|
31 |
+
"5": 0.19.0
|
32 |
+
"8":
|
33 |
+
- 5
|
34 |
+
"12": 0.19.0
|
35 |
+
"13": linux-x86_64
|
36 |
+
dataset_repo_id:
|
37 |
+
value: ccop/aloha_stationary_replay_test_v2
|
38 |
+
device:
|
39 |
+
value: cuda
|
40 |
+
env:
|
41 |
+
value:
|
42 |
+
action_dim: 14
|
43 |
+
fps: 30
|
44 |
+
name: real_world
|
45 |
+
state_dim: 14
|
46 |
+
task: null
|
47 |
+
eval:
|
48 |
+
value:
|
49 |
+
batch_size: 50
|
50 |
+
n_episodes: 50
|
51 |
+
use_async_envs: false
|
52 |
+
fps:
|
53 |
+
value: 30
|
54 |
+
override_dataset_stats:
|
55 |
+
value:
|
56 |
+
observation.images.cam_high:
|
57 |
+
mean:
|
58 |
+
- - - 0.485
|
59 |
+
- - - 0.456
|
60 |
+
- - - 0.406
|
61 |
+
std:
|
62 |
+
- - - 0.229
|
63 |
+
- - - 0.224
|
64 |
+
- - - 0.225
|
65 |
+
observation.images.cam_left_wrist:
|
66 |
+
mean:
|
67 |
+
- - - 0.485
|
68 |
+
- - - 0.456
|
69 |
+
- - - 0.406
|
70 |
+
std:
|
71 |
+
- - - 0.229
|
72 |
+
- - - 0.224
|
73 |
+
- - - 0.225
|
74 |
+
observation.images.cam_right_wrist:
|
75 |
+
mean:
|
76 |
+
- - - 0.485
|
77 |
+
- - - 0.456
|
78 |
+
- - - 0.406
|
79 |
+
std:
|
80 |
+
- - - 0.229
|
81 |
+
- - - 0.224
|
82 |
+
- - - 0.225
|
83 |
+
policy:
|
84 |
+
value:
|
85 |
+
chunk_size: 100
|
86 |
+
dim_feedforward: 3200
|
87 |
+
dim_model: 512
|
88 |
+
dropout: 0.1
|
89 |
+
feedforward_activation: relu
|
90 |
+
input_normalization_modes:
|
91 |
+
observation.images.cam_high: mean_std
|
92 |
+
observation.images.cam_left_wrist: mean_std
|
93 |
+
observation.images.cam_right_wrist: mean_std
|
94 |
+
observation.state: mean_std
|
95 |
+
input_shapes:
|
96 |
+
observation.images.cam_high:
|
97 |
+
- 3
|
98 |
+
- 480
|
99 |
+
- 640
|
100 |
+
observation.images.cam_left_wrist:
|
101 |
+
- 3
|
102 |
+
- 480
|
103 |
+
- 640
|
104 |
+
observation.images.cam_right_wrist:
|
105 |
+
- 3
|
106 |
+
- 480
|
107 |
+
- 640
|
108 |
+
observation.state:
|
109 |
+
- 14
|
110 |
+
kl_weight: 10
|
111 |
+
latent_dim: 32
|
112 |
+
n_action_steps: 100
|
113 |
+
n_decoder_layers: 1
|
114 |
+
n_encoder_layers: 4
|
115 |
+
n_heads: 8
|
116 |
+
n_obs_steps: 1
|
117 |
+
n_vae_encoder_layers: 4
|
118 |
+
name: act
|
119 |
+
output_normalization_modes:
|
120 |
+
action: mean_std
|
121 |
+
output_shapes:
|
122 |
+
action:
|
123 |
+
- 14
|
124 |
+
pre_norm: false
|
125 |
+
pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
|
126 |
+
replace_final_stride_with_dilation: false
|
127 |
+
temporal_ensemble_momentum: null
|
128 |
+
use_vae: true
|
129 |
+
vision_backbone: resnet18
|
130 |
+
resume:
|
131 |
+
value: true
|
132 |
+
seed:
|
133 |
+
value: 1000
|
134 |
+
training:
|
135 |
+
value:
|
136 |
+
batch_size: 8
|
137 |
+
delta_timestamps:
|
138 |
+
action:
|
139 |
+
- 0
|
140 |
+
- 0.03333333333333333
|
141 |
+
- 0.06666666666666667
|
142 |
+
- 0.1
|
143 |
+
- 0.13333333333333333
|
144 |
+
- 0.16666666666666666
|
145 |
+
- 0.2
|
146 |
+
- 0.23333333333333334
|
147 |
+
- 0.26666666666666666
|
148 |
+
- 0.3
|
149 |
+
- 0.3333333333333333
|
150 |
+
- 0.36666666666666664
|
151 |
+
- 0.4
|
152 |
+
- 0.43333333333333335
|
153 |
+
- 0.4666666666666667
|
154 |
+
- 0.5
|
155 |
+
- 0.5333333333333333
|
156 |
+
- 0.5666666666666667
|
157 |
+
- 0.6
|
158 |
+
- 0.6333333333333333
|
159 |
+
- 0.6666666666666666
|
160 |
+
- 0.7
|
161 |
+
- 0.7333333333333333
|
162 |
+
- 0.7666666666666667
|
163 |
+
- 0.8
|
164 |
+
- 0.8333333333333334
|
165 |
+
- 0.8666666666666667
|
166 |
+
- 0.9
|
167 |
+
- 0.9333333333333333
|
168 |
+
- 0.9666666666666667
|
169 |
+
- 1
|
170 |
+
- 1.0333333333333334
|
171 |
+
- 1.0666666666666667
|
172 |
+
- 1.1
|
173 |
+
- 1.1333333333333333
|
174 |
+
- 1.1666666666666667
|
175 |
+
- 1.2
|
176 |
+
- 1.2333333333333334
|
177 |
+
- 1.2666666666666666
|
178 |
+
- 1.3
|
179 |
+
- 1.3333333333333333
|
180 |
+
- 1.3666666666666667
|
181 |
+
- 1.4
|
182 |
+
- 1.4333333333333333
|
183 |
+
- 1.4666666666666666
|
184 |
+
- 1.5
|
185 |
+
- 1.5333333333333334
|
186 |
+
- 1.5666666666666667
|
187 |
+
- 1.6
|
188 |
+
- 1.6333333333333333
|
189 |
+
- 1.6666666666666667
|
190 |
+
- 1.7
|
191 |
+
- 1.7333333333333334
|
192 |
+
- 1.7666666666666666
|
193 |
+
- 1.8
|
194 |
+
- 1.8333333333333333
|
195 |
+
- 1.8666666666666667
|
196 |
+
- 1.9
|
197 |
+
- 1.9333333333333333
|
198 |
+
- 1.9666666666666666
|
199 |
+
- 2
|
200 |
+
- 2.033333333333333
|
201 |
+
- 2.066666666666667
|
202 |
+
- 2.1
|
203 |
+
- 2.1333333333333333
|
204 |
+
- 2.1666666666666665
|
205 |
+
- 2.2
|
206 |
+
- 2.2333333333333334
|
207 |
+
- 2.2666666666666666
|
208 |
+
- 2.3
|
209 |
+
- 2.3333333333333335
|
210 |
+
- 2.3666666666666667
|
211 |
+
- 2.4
|
212 |
+
- 2.433333333333333
|
213 |
+
- 2.466666666666667
|
214 |
+
- 2.5
|
215 |
+
- 2.533333333333333
|
216 |
+
- 2.566666666666667
|
217 |
+
- 2.6
|
218 |
+
- 2.6333333333333333
|
219 |
+
- 2.6666666666666665
|
220 |
+
- 2.7
|
221 |
+
- 2.7333333333333334
|
222 |
+
- 2.7666666666666666
|
223 |
+
- 2.8
|
224 |
+
- 2.8333333333333335
|
225 |
+
- 2.8666666666666667
|
226 |
+
- 2.9
|
227 |
+
- 2.933333333333333
|
228 |
+
- 2.966666666666667
|
229 |
+
- 3
|
230 |
+
- 3.033333333333333
|
231 |
+
- 3.066666666666667
|
232 |
+
- 3.1
|
233 |
+
- 3.1333333333333333
|
234 |
+
- 3.1666666666666665
|
235 |
+
- 3.2
|
236 |
+
- 3.2333333333333334
|
237 |
+
- 3.2666666666666666
|
238 |
+
- 3.3
|
239 |
+
do_online_rollout_async: false
|
240 |
+
eval_freq: -1
|
241 |
+
grad_clip_norm: 10
|
242 |
+
image_transforms:
|
243 |
+
brightness:
|
244 |
+
min_max:
|
245 |
+
- 0.8
|
246 |
+
- 1.2
|
247 |
+
weight: 1
|
248 |
+
contrast:
|
249 |
+
min_max:
|
250 |
+
- 0.8
|
251 |
+
- 1.2
|
252 |
+
weight: 1
|
253 |
+
enable: false
|
254 |
+
hue:
|
255 |
+
min_max:
|
256 |
+
- -0.05
|
257 |
+
- 0.05
|
258 |
+
weight: 1
|
259 |
+
max_num_transforms: 3
|
260 |
+
random_order: false
|
261 |
+
saturation:
|
262 |
+
min_max:
|
263 |
+
- 0.5
|
264 |
+
- 1.5
|
265 |
+
weight: 1
|
266 |
+
sharpness:
|
267 |
+
min_max:
|
268 |
+
- 0.8
|
269 |
+
- 1.2
|
270 |
+
weight: 1
|
271 |
+
log_freq: 200
|
272 |
+
lr: 1e-05
|
273 |
+
lr_backbone: 1e-05
|
274 |
+
num_workers: 8
|
275 |
+
offline_steps: 5000
|
276 |
+
online_buffer_capacity: null
|
277 |
+
online_buffer_seed_size: 0
|
278 |
+
online_env_seed: null
|
279 |
+
online_rollout_batch_size: 1
|
280 |
+
online_rollout_n_episodes: 1
|
281 |
+
online_sampling_ratio: 0.5
|
282 |
+
online_steps: 0
|
283 |
+
online_steps_between_rollouts: 1
|
284 |
+
save_checkpoint: true
|
285 |
+
save_freq: 10000
|
286 |
+
weight_decay: 0.0001
|
287 |
+
use_amp:
|
288 |
+
value: false
|
289 |
+
video_backend:
|
290 |
+
value: pyav
|
291 |
+
wandb:
|
292 |
+
value:
|
293 |
+
disable_artifact: false
|
294 |
+
enable: true
|
295 |
+
notes: ws-lerobot-hackathon
|
296 |
+
project: lerobot_real_aloha
|
wandb/run-20241207_010741-bwwpk9vl/files/output.log
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[1m[34mLogs will be synced with wandb.[0m
|
2 |
+
INFO 2024-12-07 01:07:41 n/logger.py:132 Track this run --> [1m[33mhttps://wandb.ai/zaringleb/lerobot_real_aloha/runs/bwwpk9vl[0m
|
3 |
+
INFO 2024-12-07 01:07:41 ts/train.py:312 make_dataset
|
4 |
+
WARNING 2024-12-07 01:07:41 s/factory.py:68 There might be a mismatch between your training dataset (dataset_repo_id='ccop/aloha_stationary_replay_test_v2') and your environment (cfg.env.name='real_world').
|
5 |
+
Fetching 9 files: 100%|█████████████████████████████████████████████████████████████████████████████████████████████| 9/9 [00:00<00:00, 70034.76it/s]
|
6 |
+
INFO 2024-12-07 01:07:43 ts/train.py:328 make_policy
|
7 |
+
WARNING 2024-12-07 01:07:44 s/factory.py:28 Hydra config is missing arguments: {'temporal_ensemble_coeff'}
|
8 |
+
Loading weights from local directory
|
9 |
+
/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py:338: FutureWarning: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.
|
10 |
+
grad_scaler = GradScaler(enabled=cfg.use_amp)
|
11 |
+
Error executing job with overrides: ['resume=true', 'dataset_repo_id=HumanoidTeam/aloha_real_test', 'training.offline_steps=5010']
|
12 |
+
Traceback (most recent call last):
|
13 |
+
File "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py", line 652, in train_cli
|
14 |
+
train(
|
15 |
+
File "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py", line 343, in train
|
16 |
+
step = logger.load_last_training_state(optimizer, lr_scheduler)
|
17 |
+
File "/home/ubuntu/lerobot-hackathon/lerobot/common/logger.py", line 218, in load_last_training_state
|
18 |
+
training_state = torch.load(self.last_checkpoint_dir / self.training_state_file_name)
|
19 |
+
File "/home/ubuntu/lerobot-hackathon/lerobot/lib/python3.10/site-packages/torch/serialization.py", line 1444, in load
|
20 |
+
raise pickle.UnpicklingError(_get_wo_message(str(e))) from None
|
21 |
+
_pickle.UnpicklingError: Weights only load failed. This file can still be loaded, to do so you have two options, [1mdo those steps only if you trust the source of the checkpoint[0m.
|
22 |
+
(1) Re-running `torch.load` with `weights_only` set to `False` will likely succeed, but it can result in arbitrary code execution. Do it only if you got the file from a trusted source.
|
23 |
+
(2) Alternatively, to load with `weights_only=True` please check the recommended steps in the following error message.
|
24 |
+
WeightsUnpickler error: Unsupported global: GLOBAL numpy.core.multiarray._reconstruct was not an allowed global by default. Please use `torch.serialization.add_safe_globals([_reconstruct])` or the `torch.serialization.safe_globals([_reconstruct])` context manager to allowlist this global if you trust this class/function.
|
25 |
+
|
26 |
+
Check the documentation of torch.load to learn more about types accepted by default with weights_only https://pytorch.org/docs/stable/generated/torch.load.html.
|
27 |
+
|
28 |
+
Set the environment variable HYDRA_FULL_ERROR=1 for a complete stack trace.
|
wandb/run-20241207_010741-bwwpk9vl/files/requirements.txt
ADDED
@@ -0,0 +1,129 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
pymunk==6.9.0
|
2 |
+
charset-normalizer==3.4.0
|
3 |
+
pip==22.0.2
|
4 |
+
multidict==6.1.0
|
5 |
+
pytz==2024.2
|
6 |
+
pandas==2.2.3
|
7 |
+
fasteners==0.19
|
8 |
+
einops==0.8.0
|
9 |
+
setproctitle==1.3.4
|
10 |
+
python-dateutil==2.9.0.post0
|
11 |
+
pydantic==2.10.3
|
12 |
+
dm-control==1.0.14
|
13 |
+
MarkupSafe==3.0.2
|
14 |
+
safetensors==0.4.5
|
15 |
+
cloudpickle==3.1.0
|
16 |
+
imageio-ffmpeg==0.5.1
|
17 |
+
smmap==5.0.1
|
18 |
+
huggingface-hub==0.26.5
|
19 |
+
torch==2.6.0.dev20241112+cu121
|
20 |
+
nvidia-cusolver-cu12==11.4.5.107
|
21 |
+
inquirerpy==0.3.4
|
22 |
+
soupsieve==2.6
|
23 |
+
deepdiff==8.0.1
|
24 |
+
nvidia-nvjitlink-cu12==12.4.127
|
25 |
+
aiosignal==1.3.1
|
26 |
+
dm-tree==0.1.8
|
27 |
+
aiohappyeyeballs==2.4.4
|
28 |
+
propcache==0.2.1
|
29 |
+
gym-aloha==0.1.1
|
30 |
+
labmaze==1.0.6
|
31 |
+
pyav==14.0.1
|
32 |
+
nvidia-cuda-cupti-cu12==12.1.105
|
33 |
+
cffi==1.17.1
|
34 |
+
importlib_metadata==8.5.0
|
35 |
+
nvidia-cuda-runtime-cu12==12.1.105
|
36 |
+
pycparser==2.22
|
37 |
+
h5py==3.12.1
|
38 |
+
nvidia-nccl-cu12==2.21.5
|
39 |
+
orderly-set==5.2.2
|
40 |
+
pyarrow==18.1.0
|
41 |
+
Flask==3.1.0
|
42 |
+
multiprocess==0.70.16
|
43 |
+
blinker==1.9.0
|
44 |
+
regex==2024.11.6
|
45 |
+
Jinja2==3.1.4
|
46 |
+
tqdm==4.67.1
|
47 |
+
certifi==2024.8.30
|
48 |
+
frozenlist==1.5.0
|
49 |
+
attrs==24.2.0
|
50 |
+
pytorch-triton==3.1.0+cf34004b8a
|
51 |
+
omegaconf==2.3.0
|
52 |
+
itsdangerous==2.2.0
|
53 |
+
packaging==24.2
|
54 |
+
pfzy==0.3.4
|
55 |
+
pydantic_core==2.27.1
|
56 |
+
antlr4-python3-runtime==4.9.3
|
57 |
+
cmake==3.31.1
|
58 |
+
imageio==2.36.1
|
59 |
+
setuptools==59.6.0
|
60 |
+
nvidia-cusparselt-cu12==0.6.2
|
61 |
+
zipp==3.21.0
|
62 |
+
torchvision==0.20.0.dev20241112+cu121
|
63 |
+
nvidia-curand-cu12==10.3.2.106
|
64 |
+
PyOpenGL-accelerate==3.1.7
|
65 |
+
numpy==1.26.4
|
66 |
+
dm-env==1.6
|
67 |
+
nvidia-cusparse-cu12==12.1.0.106
|
68 |
+
networkx==3.4.2
|
69 |
+
triton==3.1.0
|
70 |
+
termcolor==2.5.0
|
71 |
+
gitdb==4.0.11
|
72 |
+
torchaudio==2.5.0.dev20241112+cu121
|
73 |
+
glfw==2.8.0
|
74 |
+
tzdata==2024.2
|
75 |
+
pillow==11.0.0
|
76 |
+
idna==3.10
|
77 |
+
pyparsing==3.2.0
|
78 |
+
typing_extensions==4.12.2
|
79 |
+
wcwidth==0.2.13
|
80 |
+
sympy==1.13.1
|
81 |
+
nvidia-cublas-cu12==12.1.3.1
|
82 |
+
zarr==2.18.3
|
83 |
+
protobuf==5.29.1
|
84 |
+
annotated-types==0.7.0
|
85 |
+
xxhash==3.5.0
|
86 |
+
aiohttp==3.11.10
|
87 |
+
Werkzeug==3.1.3
|
88 |
+
mujoco==2.3.7
|
89 |
+
gymnasium==0.29.1
|
90 |
+
rerun-sdk==0.20.3
|
91 |
+
nvidia-cufft-cu12==11.0.2.54
|
92 |
+
dill==0.3.8
|
93 |
+
scipy==1.14.1
|
94 |
+
hydra-core==1.3.2
|
95 |
+
fsspec==2024.9.0
|
96 |
+
platformdirs==4.3.6
|
97 |
+
PySocks==1.7.1
|
98 |
+
PyOpenGL==3.1.7
|
99 |
+
requests==2.32.3
|
100 |
+
lxml==5.3.0
|
101 |
+
Farama-Notifications==0.0.4
|
102 |
+
nvidia-cuda-nvrtc-cu12==12.1.105
|
103 |
+
numba==0.60.0
|
104 |
+
docker-pycreds==0.4.0
|
105 |
+
six==1.17.0
|
106 |
+
lerobot==0.1.0
|
107 |
+
nvidia-cudnn-cu12==9.1.0.70
|
108 |
+
sentry-sdk==2.19.2
|
109 |
+
absl-py==2.1.0
|
110 |
+
wandb==0.19.0
|
111 |
+
mpmath==1.3.0
|
112 |
+
llvmlite==0.43.0
|
113 |
+
numcodecs==0.13.1
|
114 |
+
GitPython==3.1.43
|
115 |
+
nvidia-nvtx-cu12==12.1.105
|
116 |
+
prompt_toolkit==3.0.48
|
117 |
+
datasets==3.1.0
|
118 |
+
opencv-python==4.10.0.84
|
119 |
+
filelock==3.16.1
|
120 |
+
async-timeout==5.0.1
|
121 |
+
diffusers==0.31.0
|
122 |
+
yarl==1.18.3
|
123 |
+
click==8.1.7
|
124 |
+
asciitree==0.3.3
|
125 |
+
psutil==6.1.0
|
126 |
+
gdown==5.2.0
|
127 |
+
PyYAML==6.0.2
|
128 |
+
urllib3==2.2.3
|
129 |
+
beautifulsoup4==4.12.3
|
wandb/run-20241207_010741-bwwpk9vl/files/wandb-metadata.json
ADDED
@@ -0,0 +1,49 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"os": "Linux-6.8.0-1015-aws-x86_64-with-glibc2.35",
|
3 |
+
"python": "CPython 3.10.12",
|
4 |
+
"startedAt": "2024-12-07T01:07:41.166322Z",
|
5 |
+
"args": [
|
6 |
+
"hydra.run.dir=outputs/train/2024-12-06/22-28-29_real_world_act_default",
|
7 |
+
"resume=true",
|
8 |
+
"dataset_repo_id=HumanoidTeam/aloha_real_test",
|
9 |
+
"training.offline_steps=5010"
|
10 |
+
],
|
11 |
+
"program": "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py",
|
12 |
+
"codePath": "lerobot/scripts/train.py",
|
13 |
+
"git": {
|
14 |
+
"remote": "[email protected]:HumanoidTeam/lerobot-hackathon.git",
|
15 |
+
"commit": "ab8aa3f8e7b6e5486d7af26ccd319d358ffad579"
|
16 |
+
},
|
17 |
+
"email": "[email protected]",
|
18 |
+
"root": "outputs/train/2024-12-06/22-28-29_real_world_act_default",
|
19 |
+
"host": "ip-172-31-20-130",
|
20 |
+
"username": "humanoidteam",
|
21 |
+
"executable": "/home/ubuntu/lerobot-hackathon/lerobot/bin/python",
|
22 |
+
"codePathLocal": "lerobot/scripts/train.py",
|
23 |
+
"cpu_count": 4,
|
24 |
+
"cpu_count_logical": 8,
|
25 |
+
"gpu": "Tesla T4",
|
26 |
+
"gpu_count": 1,
|
27 |
+
"disk": {
|
28 |
+
"/": {
|
29 |
+
"total": "311993479168",
|
30 |
+
"used": "217724108800"
|
31 |
+
}
|
32 |
+
},
|
33 |
+
"memory": {
|
34 |
+
"total": "33263837184"
|
35 |
+
},
|
36 |
+
"cpu": {
|
37 |
+
"count": 4,
|
38 |
+
"countLogical": 8
|
39 |
+
},
|
40 |
+
"gpu_nvidia": [
|
41 |
+
{
|
42 |
+
"name": "Tesla T4",
|
43 |
+
"memoryTotal": "16106127360",
|
44 |
+
"cudaCores": 2560,
|
45 |
+
"architecture": "Turing"
|
46 |
+
}
|
47 |
+
],
|
48 |
+
"cudaVersion": "12.4"
|
49 |
+
}
|
wandb/run-20241207_010741-bwwpk9vl/files/wandb-summary.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train/update_s":1.0881254139821976,"train/step":4800,"train/num_episodes":48.01,"train/dataloading_s":2.211516670999117,"train/lr":1e-05,"_step":4800,"train/grad_norm":20.83009910583496,"train/num_epochs":48.01,"_runtime":5488.627260612,"_wandb":{"runtime":5498},"train/is_online":false,"train/kld_loss":0.01526648923754692,"train/l1_loss":0.09762981534004211,"_timestamp":1.7335293805980325e+09,"train/num_samples":38408,"train/loss":0.2502947151660919}
|
wandb/run-20241207_010741-bwwpk9vl/logs/debug-core.log
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"time":"2024-12-07T01:07:40.734055218Z","level":"INFO","msg":"started logging, with flags","port-filename":"/tmp/tmpnmhdaztf/port-3507456.txt","pid":3507456,"debug":false,"disable-analytics":false}
|
2 |
+
{"time":"2024-12-07T01:07:40.734088106Z","level":"INFO","msg":"FeatureState","shutdownOnParentExitEnabled":false}
|
3 |
+
{"time":"2024-12-07T01:07:40.737816002Z","level":"INFO","msg":"Will exit if parent process dies.","ppid":3507456}
|
4 |
+
{"time":"2024-12-07T01:07:40.737842301Z","level":"INFO","msg":"server is running","addr":{"IP":"127.0.0.1","Port":36119,"Zone":""}}
|
5 |
+
{"time":"2024-12-07T01:07:40.923329848Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:47356"}
|
6 |
+
{"time":"2024-12-07T01:07:41.167320115Z","level":"INFO","msg":"handleInformInit: received","streamId":"bwwpk9vl","id":"127.0.0.1:47356"}
|
7 |
+
{"time":"2024-12-07T01:07:41.270221077Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"bwwpk9vl","id":"127.0.0.1:47356"}
|
8 |
+
{"time":"2024-12-07T01:07:46.320004505Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"127.0.0.1:47356"}
|
9 |
+
{"time":"2024-12-07T01:07:46.320088721Z","level":"INFO","msg":"server is shutting down"}
|
10 |
+
{"time":"2024-12-07T01:07:46.320081333Z","level":"INFO","msg":"connection: Close: initiating connection closure","id":"127.0.0.1:47356"}
|
11 |
+
{"time":"2024-12-07T01:07:46.320187736Z","level":"INFO","msg":"connection: Close: connection successfully closed","id":"127.0.0.1:47356"}
|
12 |
+
{"time":"2024-12-07T01:07:47.027392524Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"127.0.0.1:47356"}
|
13 |
+
{"time":"2024-12-07T01:07:47.027414185Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"127.0.0.1:47356"}
|
14 |
+
{"time":"2024-12-07T01:07:47.027425094Z","level":"INFO","msg":"server is closed"}
|
wandb/run-20241207_010741-bwwpk9vl/logs/debug-internal.log
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"time":"2024-12-07T01:07:41.167467035Z","level":"INFO","msg":"using version","core version":"0.19.0"}
|
2 |
+
{"time":"2024-12-07T01:07:41.167480199Z","level":"INFO","msg":"created symlink","path":"outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug-core.log"}
|
3 |
+
{"time":"2024-12-07T01:07:41.270189094Z","level":"INFO","msg":"created new stream","id":"bwwpk9vl"}
|
4 |
+
{"time":"2024-12-07T01:07:41.270216139Z","level":"INFO","msg":"stream: started","id":"bwwpk9vl"}
|
5 |
+
{"time":"2024-12-07T01:07:41.270250461Z","level":"INFO","msg":"writer: Do: started","stream_id":"bwwpk9vl"}
|
6 |
+
{"time":"2024-12-07T01:07:41.270250342Z","level":"INFO","msg":"sender: started","stream_id":"bwwpk9vl"}
|
7 |
+
{"time":"2024-12-07T01:07:41.270317361Z","level":"INFO","msg":"handler: started","stream_id":"bwwpk9vl"}
|
8 |
+
{"time":"2024-12-07T01:07:41.601065068Z","level":"INFO","msg":"Starting system monitor"}
|
9 |
+
{"time":"2024-12-07T01:07:46.320070438Z","level":"INFO","msg":"stream: closing","id":"bwwpk9vl"}
|
10 |
+
{"time":"2024-12-07T01:07:46.320109578Z","level":"INFO","msg":"Stopping system monitor"}
|
11 |
+
{"time":"2024-12-07T01:07:46.320581424Z","level":"INFO","msg":"Stopped system monitor"}
|
12 |
+
{"time":"2024-12-07T01:07:46.890807441Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
13 |
+
{"time":"2024-12-07T01:07:47.027194656Z","level":"INFO","msg":"handler: closed","stream_id":"bwwpk9vl"}
|
14 |
+
{"time":"2024-12-07T01:07:47.027227034Z","level":"INFO","msg":"sender: closed","stream_id":"bwwpk9vl"}
|
15 |
+
{"time":"2024-12-07T01:07:47.027228216Z","level":"INFO","msg":"writer: Close: closed","stream_id":"bwwpk9vl"}
|
16 |
+
{"time":"2024-12-07T01:07:47.027338658Z","level":"INFO","msg":"stream: closed","id":"bwwpk9vl"}
|
wandb/run-20241207_010741-bwwpk9vl/logs/debug.log
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Current SDK version is 0.19.0
|
2 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Configure stats pid to 3507456
|
3 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/.config/wandb/settings
|
4 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/lerobot-hackathon/wandb/settings
|
5 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from environment variables
|
6 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] wandb: Using wandb-core as the SDK backend. Please refer to https://wandb.me/wandb-core for more information.
|
7 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:_log_setup():528] Logging user logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug.log
|
8 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:_log_setup():529] Logging internal logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug-internal.log
|
9 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():639] calling init triggers
|
10 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():645] wandb.init called with sweep_config: {}
|
11 |
+
config: {'resume': True, 'device': 'cuda', 'use_amp': False, 'seed': 1000, 'dataset_repo_id': 'ccop/aloha_stationary_replay_test_v2', 'video_backend': 'pyav', 'training': {'offline_steps': 5000, 'num_workers': 8, 'batch_size': 8, 'eval_freq': -1, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 10000, 'online_steps': 0, 'online_rollout_n_episodes': 1, 'online_rollout_batch_size': 1, 'online_steps_between_rollouts': 1, 'online_sampling_ratio': 0.5, 'online_env_seed': None, 'online_buffer_capacity': None, 'online_buffer_seed_size': 0, 'do_online_rollout_async': False, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'brightness': {'weight': 1, 'min_max': [0.8, 1.2]}, 'contrast': {'weight': 1, 'min_max': [0.8, 1.2]}, 'saturation': {'weight': 1, 'min_max': [0.5, 1.5]}, 'hue': {'weight': 1, 'min_max': [-0.05, 0.05]}, 'sharpness': {'weight': 1, 'min_max': [0.8, 1.2]}}, 'lr': 1e-05, 'lr_backbone': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10, 'delta_timestamps': {'action': [0.0, 0.03333333333333333, 0.06666666666666667, 0.1, 0.13333333333333333, 0.16666666666666666, 0.2, 0.23333333333333334, 0.26666666666666666, 0.3, 0.3333333333333333, 0.36666666666666664, 0.4, 0.43333333333333335, 0.4666666666666667, 0.5, 0.5333333333333333, 0.5666666666666667, 0.6, 0.6333333333333333, 0.6666666666666666, 0.7, 0.7333333333333333, 0.7666666666666667, 0.8, 0.8333333333333334, 0.8666666666666667, 0.9, 0.9333333333333333, 0.9666666666666667, 1.0, 1.0333333333333334, 1.0666666666666667, 1.1, 1.1333333333333333, 1.1666666666666667, 1.2, 1.2333333333333334, 1.2666666666666666, 1.3, 1.3333333333333333, 1.3666666666666667, 1.4, 1.4333333333333333, 1.4666666666666666, 1.5, 1.5333333333333334, 1.5666666666666667, 1.6, 1.6333333333333333, 1.6666666666666667, 1.7, 1.7333333333333334, 1.7666666666666666, 1.8, 1.8333333333333333, 1.8666666666666667, 1.9, 1.9333333333333333, 1.9666666666666666, 2.0, 2.033333333333333, 2.066666666666667, 2.1, 
2.1333333333333333, 2.1666666666666665, 2.2, 2.2333333333333334, 2.2666666666666666, 2.3, 2.3333333333333335, 2.3666666666666667, 2.4, 2.433333333333333, 2.466666666666667, 2.5, 2.533333333333333, 2.566666666666667, 2.6, 2.6333333333333333, 2.6666666666666665, 2.7, 2.7333333333333334, 2.7666666666666666, 2.8, 2.8333333333333335, 2.8666666666666667, 2.9, 2.933333333333333, 2.966666666666667, 3.0, 3.033333333333333, 3.066666666666667, 3.1, 3.1333333333333333, 3.1666666666666665, 3.2, 3.2333333333333334, 3.2666666666666666, 3.3]}}, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot_real_aloha', 'notes': 'ws-lerobot-hackathon'}, 'fps': 30, 'env': {'name': 'real_world', 'task': None, 'state_dim': 14, 'action_dim': 14, 'fps': 30}, 'override_dataset_stats': {'observation.images.cam_right_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_left_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_high': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}}, 'policy': {'name': 'act', 'n_obs_steps': 1, 'chunk_size': 100, 'n_action_steps': 100, 'input_shapes': {'observation.images.cam_right_wrist': [3, 480, 640], 'observation.images.cam_left_wrist': [3, 480, 640], 'observation.images.cam_high': [3, 480, 640], 'observation.state': [14]}, 'output_shapes': {'action': [14]}, 'input_normalization_modes': {'observation.images.cam_right_wrist': 'mean_std', 'observation.images.cam_left_wrist': 'mean_std', 'observation.images.cam_high': 'mean_std', 'observation.state': 'mean_std'}, 'output_normalization_modes': {'action': 'mean_std'}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 
'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_momentum': None, 'dropout': 0.1, 'kl_weight': 10.0}}
|
12 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():688] starting backend
|
13 |
+
2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():692] sending inform_init request
|
14 |
+
2024-12-07 01:07:41,165 INFO MainThread:3507456 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
|
15 |
+
2024-12-07 01:07:41,166 INFO MainThread:3507456 [wandb_init.py:init():705] backend started and connected
|
16 |
+
2024-12-07 01:07:41,168 INFO MainThread:3507456 [wandb_init.py:init():798] updated telemetry
|
17 |
+
2024-12-07 01:07:41,174 INFO MainThread:3507456 [wandb_init.py:init():830] communicating run to backend with 90.0 second timeout
|
18 |
+
2024-12-07 01:07:41,592 INFO MainThread:3507456 [wandb_init.py:init():875] run resumed
|
19 |
+
2024-12-07 01:07:41,597 INFO MainThread:3507456 [wandb_init.py:init():882] starting run threads in backend
|
20 |
+
2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_console_start():2443] atexit reg
|
21 |
+
2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2293] redirect: wrap_raw
|
22 |
+
2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2358] Wrapping output streams.
|
23 |
+
2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2383] Redirects installed.
|
24 |
+
2024-12-07 01:07:41,713 INFO MainThread:3507456 [wandb_init.py:init():925] run started, returning control to user process
|
25 |
+
2024-12-07 01:07:46,320 WARNING MsgRouterThr:3507456 [router.py:message_loop():75] message_loop has been closed
|
wandb/run-20241207_010741-bwwpk9vl/run-bwwpk9vl.wandb
ADDED
Binary file (10.5 kB). View file
|
|