zaringleb commited on
Commit
484316e
·
verified ·
1 Parent(s): 18e58cf

Upload folder using huggingface_hub

Browse files
Files changed (38) hide show
  1. .hydra/config.yaml +160 -0
  2. .hydra/hydra.yaml +160 -0
  3. .hydra/overrides.yaml +3 -0
  4. checkpoints/005000/pretrained_model/README.md +12 -0
  5. checkpoints/005000/pretrained_model/config.json +55 -0
  6. checkpoints/005000/pretrained_model/config.yaml +248 -0
  7. checkpoints/005000/pretrained_model/model.safetensors +3 -0
  8. checkpoints/005000/training_state.pth +3 -0
  9. default.log +0 -0
  10. wandb/debug-internal.log +16 -0
  11. wandb/debug.log +25 -0
  12. wandb/run-20241206_222830-bwwpk9vl/files/config.yaml +194 -0
  13. wandb/run-20241206_222830-bwwpk9vl/files/output.log +46 -0
  14. wandb/run-20241206_222830-bwwpk9vl/files/requirements.txt +129 -0
  15. wandb/run-20241206_222830-bwwpk9vl/files/wandb-metadata.json +48 -0
  16. wandb/run-20241206_222830-bwwpk9vl/files/wandb-summary.json +1 -0
  17. wandb/run-20241206_222830-bwwpk9vl/logs/debug-core.log +15 -0
  18. wandb/run-20241206_222830-bwwpk9vl/logs/debug-internal.log +16 -0
  19. wandb/run-20241206_222830-bwwpk9vl/logs/debug.log +24 -0
  20. wandb/run-20241206_222830-bwwpk9vl/run-bwwpk9vl.wandb +0 -0
  21. wandb/run-20241207_010636-bwwpk9vl/files/config.yaml +296 -0
  22. wandb/run-20241207_010636-bwwpk9vl/files/output.log +28 -0
  23. wandb/run-20241207_010636-bwwpk9vl/files/requirements.txt +129 -0
  24. wandb/run-20241207_010636-bwwpk9vl/files/wandb-metadata.json +52 -0
  25. wandb/run-20241207_010636-bwwpk9vl/files/wandb-summary.json +1 -0
  26. wandb/run-20241207_010636-bwwpk9vl/logs/debug-core.log +14 -0
  27. wandb/run-20241207_010636-bwwpk9vl/logs/debug-internal.log +16 -0
  28. wandb/run-20241207_010636-bwwpk9vl/logs/debug.log +25 -0
  29. wandb/run-20241207_010636-bwwpk9vl/run-bwwpk9vl.wandb +0 -0
  30. wandb/run-20241207_010741-bwwpk9vl/files/config.yaml +296 -0
  31. wandb/run-20241207_010741-bwwpk9vl/files/output.log +28 -0
  32. wandb/run-20241207_010741-bwwpk9vl/files/requirements.txt +129 -0
  33. wandb/run-20241207_010741-bwwpk9vl/files/wandb-metadata.json +49 -0
  34. wandb/run-20241207_010741-bwwpk9vl/files/wandb-summary.json +1 -0
  35. wandb/run-20241207_010741-bwwpk9vl/logs/debug-core.log +14 -0
  36. wandb/run-20241207_010741-bwwpk9vl/logs/debug-internal.log +16 -0
  37. wandb/run-20241207_010741-bwwpk9vl/logs/debug.log +25 -0
  38. wandb/run-20241207_010741-bwwpk9vl/run-bwwpk9vl.wandb +0 -0
.hydra/config.yaml ADDED
@@ -0,0 +1,160 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ resume: true
2
+ device: cuda
3
+ use_amp: false
4
+ seed: 100000
5
+ dataset_repo_id: HumanoidTeam/aloha_real_test
6
+ video_backend: pyav
7
+ training:
8
+ offline_steps: 5010
9
+ num_workers: 8
10
+ batch_size: 64
11
+ eval_freq: 25000
12
+ log_freq: 200
13
+ save_checkpoint: true
14
+ save_freq: 25000
15
+ online_steps: 0
16
+ online_rollout_n_episodes: 1
17
+ online_rollout_batch_size: 1
18
+ online_steps_between_rollouts: 1
19
+ online_sampling_ratio: 0.5
20
+ online_env_seed: null
21
+ online_buffer_capacity: null
22
+ online_buffer_seed_size: 0
23
+ do_online_rollout_async: false
24
+ image_transforms:
25
+ enable: false
26
+ max_num_transforms: 3
27
+ random_order: false
28
+ brightness:
29
+ weight: 1
30
+ min_max:
31
+ - 0.8
32
+ - 1.2
33
+ contrast:
34
+ weight: 1
35
+ min_max:
36
+ - 0.8
37
+ - 1.2
38
+ saturation:
39
+ weight: 1
40
+ min_max:
41
+ - 0.5
42
+ - 1.5
43
+ hue:
44
+ weight: 1
45
+ min_max:
46
+ - -0.05
47
+ - 0.05
48
+ sharpness:
49
+ weight: 1
50
+ min_max:
51
+ - 0.8
52
+ - 1.2
53
+ grad_clip_norm: 10
54
+ lr: 0.0001
55
+ lr_scheduler: cosine
56
+ lr_warmup_steps: 500
57
+ adam_betas:
58
+ - 0.95
59
+ - 0.999
60
+ adam_eps: 1.0e-08
61
+ adam_weight_decay: 1.0e-06
62
+ delta_timestamps:
63
+ observation.image: '[i / ${fps} for i in range(1 - ${policy.n_obs_steps}, 1)]'
64
+ observation.state: '[i / ${fps} for i in range(1 - ${policy.n_obs_steps}, 1)]'
65
+ action: '[i / ${fps} for i in range(1 - ${policy.n_obs_steps}, 1 - ${policy.n_obs_steps}
66
+ + ${policy.horizon})]'
67
+ drop_n_last_frames: 7
68
+ eval:
69
+ n_episodes: 50
70
+ batch_size: 50
71
+ use_async_envs: false
72
+ wandb:
73
+ enable: true
74
+ disable_artifact: false
75
+ project: lerobot_real_aloha
76
+ notes: ws-lerobot-hackathon
77
+ fps: 10
78
+ env:
79
+ name: pusht
80
+ task: PushT-v0
81
+ image_size: 96
82
+ state_dim: 2
83
+ action_dim: 2
84
+ fps: ${fps}
85
+ episode_length: 300
86
+ gym:
87
+ obs_type: pixels_agent_pos
88
+ render_mode: rgb_array
89
+ visualization_width: 384
90
+ visualization_height: 384
91
+ override_dataset_stats:
92
+ observation.image:
93
+ mean:
94
+ - - - 0.5
95
+ - - - 0.5
96
+ - - - 0.5
97
+ std:
98
+ - - - 0.5
99
+ - - - 0.5
100
+ - - - 0.5
101
+ observation.state:
102
+ min:
103
+ - 13.456424
104
+ - 32.938293
105
+ max:
106
+ - 496.14618
107
+ - 510.9579
108
+ action:
109
+ min:
110
+ - 12.0
111
+ - 25.0
112
+ max:
113
+ - 511.0
114
+ - 511.0
115
+ policy:
116
+ name: diffusion
117
+ n_obs_steps: 2
118
+ horizon: 16
119
+ n_action_steps: 8
120
+ input_shapes:
121
+ observation.image:
122
+ - 3
123
+ - 96
124
+ - 96
125
+ observation.state:
126
+ - ${env.state_dim}
127
+ output_shapes:
128
+ action:
129
+ - ${env.action_dim}
130
+ input_normalization_modes:
131
+ observation.image: mean_std
132
+ observation.state: min_max
133
+ output_normalization_modes:
134
+ action: min_max
135
+ vision_backbone: resnet18
136
+ crop_shape:
137
+ - 84
138
+ - 84
139
+ crop_is_random: true
140
+ pretrained_backbone_weights: null
141
+ use_group_norm: true
142
+ spatial_softmax_num_keypoints: 32
143
+ down_dims:
144
+ - 512
145
+ - 1024
146
+ - 2048
147
+ kernel_size: 5
148
+ n_groups: 8
149
+ diffusion_step_embed_dim: 128
150
+ use_film_scale_modulation: true
151
+ noise_scheduler_type: DDPM
152
+ num_train_timesteps: 100
153
+ beta_schedule: squaredcos_cap_v2
154
+ beta_start: 0.0001
155
+ beta_end: 0.02
156
+ prediction_type: epsilon
157
+ clip_sample: true
158
+ clip_sample_range: 1.0
159
+ num_inference_steps: null
160
+ do_mask_loss_for_padding: false
.hydra/hydra.yaml ADDED
@@ -0,0 +1,160 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: outputs/train/2024-12-06/22-28-29_real_world_act_default
4
+ sweep:
5
+ dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ formatters:
71
+ simple:
72
+ format: '[%(asctime)s][HYDRA] %(message)s'
73
+ handlers:
74
+ console:
75
+ class: logging.StreamHandler
76
+ formatter: simple
77
+ stream: ext://sys.stdout
78
+ root:
79
+ level: INFO
80
+ handlers:
81
+ - console
82
+ loggers:
83
+ logging_example:
84
+ level: DEBUG
85
+ disable_existing_loggers: false
86
+ job_logging:
87
+ version: 1
88
+ formatters:
89
+ simple:
90
+ format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
91
+ handlers:
92
+ console:
93
+ class: logging.StreamHandler
94
+ formatter: simple
95
+ stream: ext://sys.stdout
96
+ file:
97
+ class: logging.FileHandler
98
+ formatter: simple
99
+ filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
100
+ root:
101
+ level: INFO
102
+ handlers:
103
+ - console
104
+ - file
105
+ disable_existing_loggers: false
106
+ env: {}
107
+ mode: RUN
108
+ searchpath: []
109
+ callbacks: {}
110
+ output_subdir: .hydra
111
+ overrides:
112
+ hydra:
113
+ - hydra.run.dir=outputs/train/2024-12-06/22-28-29_real_world_act_default
114
+ - hydra.mode=RUN
115
+ task:
116
+ - resume=true
117
+ - dataset_repo_id=HumanoidTeam/aloha_real_test
118
+ - training.offline_steps=5010
119
+ job:
120
+ name: default
121
+ chdir: null
122
+ override_dirname: dataset_repo_id=HumanoidTeam/aloha_real_test,resume=true,training.offline_steps=5010
123
+ id: ???
124
+ num: ???
125
+ config_name: default
126
+ env_set: {}
127
+ env_copy: []
128
+ config:
129
+ override_dirname:
130
+ kv_sep: '='
131
+ item_sep: ','
132
+ exclude_keys: []
133
+ runtime:
134
+ version: 1.3.2
135
+ version_base: '1.2'
136
+ cwd: /home/ubuntu/lerobot-hackathon
137
+ config_sources:
138
+ - path: hydra.conf
139
+ schema: pkg
140
+ provider: hydra
141
+ - path: /home/ubuntu/lerobot-hackathon/lerobot/configs
142
+ schema: file
143
+ provider: main
144
+ - path: ''
145
+ schema: structured
146
+ provider: schema
147
+ output_dir: /home/ubuntu/lerobot-hackathon/outputs/train/2024-12-06/22-28-29_real_world_act_default
148
+ choices:
149
+ policy: diffusion
150
+ env: pusht
151
+ hydra/env: default
152
+ hydra/callbacks: null
153
+ hydra/job_logging: default
154
+ hydra/hydra_logging: default
155
+ hydra/hydra_help: default
156
+ hydra/help: default
157
+ hydra/sweeper: basic
158
+ hydra/launcher: basic
159
+ hydra/output: default
160
+ verbose: false
.hydra/overrides.yaml ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ - resume=true
2
+ - dataset_repo_id=HumanoidTeam/aloha_real_test
3
+ - training.offline_steps=5010
checkpoints/005000/pretrained_model/README.md ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: lerobot
3
+ tags:
4
+ - act
5
+ - model_hub_mixin
6
+ - pytorch_model_hub_mixin
7
+ - robotics
8
+ ---
9
+
10
+ This model has been pushed to the Hub using the [PytorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
11
+ - Library: https://github.com/huggingface/lerobot
12
+ - Docs: [More Information Needed]
checkpoints/005000/pretrained_model/config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "chunk_size": 100,
3
+ "dim_feedforward": 3200,
4
+ "dim_model": 512,
5
+ "dropout": 0.1,
6
+ "feedforward_activation": "relu",
7
+ "input_normalization_modes": {
8
+ "observation.images.cam_high": "mean_std",
9
+ "observation.images.cam_left_wrist": "mean_std",
10
+ "observation.images.cam_right_wrist": "mean_std",
11
+ "observation.state": "mean_std"
12
+ },
13
+ "input_shapes": {
14
+ "observation.images.cam_high": [
15
+ 3,
16
+ 480,
17
+ 640
18
+ ],
19
+ "observation.images.cam_left_wrist": [
20
+ 3,
21
+ 480,
22
+ 640
23
+ ],
24
+ "observation.images.cam_right_wrist": [
25
+ 3,
26
+ 480,
27
+ 640
28
+ ],
29
+ "observation.state": [
30
+ 14
31
+ ]
32
+ },
33
+ "kl_weight": 10.0,
34
+ "latent_dim": 32,
35
+ "n_action_steps": 100,
36
+ "n_decoder_layers": 1,
37
+ "n_encoder_layers": 4,
38
+ "n_heads": 8,
39
+ "n_obs_steps": 1,
40
+ "n_vae_encoder_layers": 4,
41
+ "output_normalization_modes": {
42
+ "action": "mean_std"
43
+ },
44
+ "output_shapes": {
45
+ "action": [
46
+ 14
47
+ ]
48
+ },
49
+ "pre_norm": false,
50
+ "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
51
+ "replace_final_stride_with_dilation": false,
52
+ "temporal_ensemble_coeff": null,
53
+ "use_vae": true,
54
+ "vision_backbone": "resnet18"
55
+ }
checkpoints/005000/pretrained_model/config.yaml ADDED
@@ -0,0 +1,248 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ resume: false
2
+ device: cuda
3
+ use_amp: false
4
+ seed: 1000
5
+ dataset_repo_id: ccop/aloha_stationary_replay_test_v2
6
+ video_backend: pyav
7
+ training:
8
+ offline_steps: 5000
9
+ num_workers: 8
10
+ batch_size: 8
11
+ eval_freq: -1
12
+ log_freq: 200
13
+ save_checkpoint: true
14
+ save_freq: 10000
15
+ online_steps: 0
16
+ online_rollout_n_episodes: 1
17
+ online_rollout_batch_size: 1
18
+ online_steps_between_rollouts: 1
19
+ online_sampling_ratio: 0.5
20
+ online_env_seed: null
21
+ online_buffer_capacity: null
22
+ online_buffer_seed_size: 0
23
+ do_online_rollout_async: false
24
+ image_transforms:
25
+ enable: false
26
+ max_num_transforms: 3
27
+ random_order: false
28
+ brightness:
29
+ weight: 1
30
+ min_max:
31
+ - 0.8
32
+ - 1.2
33
+ contrast:
34
+ weight: 1
35
+ min_max:
36
+ - 0.8
37
+ - 1.2
38
+ saturation:
39
+ weight: 1
40
+ min_max:
41
+ - 0.5
42
+ - 1.5
43
+ hue:
44
+ weight: 1
45
+ min_max:
46
+ - -0.05
47
+ - 0.05
48
+ sharpness:
49
+ weight: 1
50
+ min_max:
51
+ - 0.8
52
+ - 1.2
53
+ lr: 1.0e-05
54
+ lr_backbone: 1.0e-05
55
+ weight_decay: 0.0001
56
+ grad_clip_norm: 10
57
+ delta_timestamps:
58
+ action:
59
+ - 0.0
60
+ - 0.03333333333333333
61
+ - 0.06666666666666667
62
+ - 0.1
63
+ - 0.13333333333333333
64
+ - 0.16666666666666666
65
+ - 0.2
66
+ - 0.23333333333333334
67
+ - 0.26666666666666666
68
+ - 0.3
69
+ - 0.3333333333333333
70
+ - 0.36666666666666664
71
+ - 0.4
72
+ - 0.43333333333333335
73
+ - 0.4666666666666667
74
+ - 0.5
75
+ - 0.5333333333333333
76
+ - 0.5666666666666667
77
+ - 0.6
78
+ - 0.6333333333333333
79
+ - 0.6666666666666666
80
+ - 0.7
81
+ - 0.7333333333333333
82
+ - 0.7666666666666667
83
+ - 0.8
84
+ - 0.8333333333333334
85
+ - 0.8666666666666667
86
+ - 0.9
87
+ - 0.9333333333333333
88
+ - 0.9666666666666667
89
+ - 1.0
90
+ - 1.0333333333333334
91
+ - 1.0666666666666667
92
+ - 1.1
93
+ - 1.1333333333333333
94
+ - 1.1666666666666667
95
+ - 1.2
96
+ - 1.2333333333333334
97
+ - 1.2666666666666666
98
+ - 1.3
99
+ - 1.3333333333333333
100
+ - 1.3666666666666667
101
+ - 1.4
102
+ - 1.4333333333333333
103
+ - 1.4666666666666666
104
+ - 1.5
105
+ - 1.5333333333333334
106
+ - 1.5666666666666667
107
+ - 1.6
108
+ - 1.6333333333333333
109
+ - 1.6666666666666667
110
+ - 1.7
111
+ - 1.7333333333333334
112
+ - 1.7666666666666666
113
+ - 1.8
114
+ - 1.8333333333333333
115
+ - 1.8666666666666667
116
+ - 1.9
117
+ - 1.9333333333333333
118
+ - 1.9666666666666666
119
+ - 2.0
120
+ - 2.033333333333333
121
+ - 2.066666666666667
122
+ - 2.1
123
+ - 2.1333333333333333
124
+ - 2.1666666666666665
125
+ - 2.2
126
+ - 2.2333333333333334
127
+ - 2.2666666666666666
128
+ - 2.3
129
+ - 2.3333333333333335
130
+ - 2.3666666666666667
131
+ - 2.4
132
+ - 2.433333333333333
133
+ - 2.466666666666667
134
+ - 2.5
135
+ - 2.533333333333333
136
+ - 2.566666666666667
137
+ - 2.6
138
+ - 2.6333333333333333
139
+ - 2.6666666666666665
140
+ - 2.7
141
+ - 2.7333333333333334
142
+ - 2.7666666666666666
143
+ - 2.8
144
+ - 2.8333333333333335
145
+ - 2.8666666666666667
146
+ - 2.9
147
+ - 2.933333333333333
148
+ - 2.966666666666667
149
+ - 3.0
150
+ - 3.033333333333333
151
+ - 3.066666666666667
152
+ - 3.1
153
+ - 3.1333333333333333
154
+ - 3.1666666666666665
155
+ - 3.2
156
+ - 3.2333333333333334
157
+ - 3.2666666666666666
158
+ - 3.3
159
+ eval:
160
+ n_episodes: 50
161
+ batch_size: 50
162
+ use_async_envs: false
163
+ wandb:
164
+ enable: true
165
+ disable_artifact: false
166
+ project: lerobot_real_aloha
167
+ notes: ws-lerobot-hackathon
168
+ fps: 30
169
+ env:
170
+ name: real_world
171
+ task: null
172
+ state_dim: 14
173
+ action_dim: 14
174
+ fps: ${fps}
175
+ override_dataset_stats:
176
+ observation.images.cam_right_wrist:
177
+ mean:
178
+ - - - 0.485
179
+ - - - 0.456
180
+ - - - 0.406
181
+ std:
182
+ - - - 0.229
183
+ - - - 0.224
184
+ - - - 0.225
185
+ observation.images.cam_left_wrist:
186
+ mean:
187
+ - - - 0.485
188
+ - - - 0.456
189
+ - - - 0.406
190
+ std:
191
+ - - - 0.229
192
+ - - - 0.224
193
+ - - - 0.225
194
+ observation.images.cam_high:
195
+ mean:
196
+ - - - 0.485
197
+ - - - 0.456
198
+ - - - 0.406
199
+ std:
200
+ - - - 0.229
201
+ - - - 0.224
202
+ - - - 0.225
203
+ policy:
204
+ name: act
205
+ n_obs_steps: 1
206
+ chunk_size: 100
207
+ n_action_steps: 100
208
+ input_shapes:
209
+ observation.images.cam_right_wrist:
210
+ - 3
211
+ - 480
212
+ - 640
213
+ observation.images.cam_left_wrist:
214
+ - 3
215
+ - 480
216
+ - 640
217
+ observation.images.cam_high:
218
+ - 3
219
+ - 480
220
+ - 640
221
+ observation.state:
222
+ - ${env.state_dim}
223
+ output_shapes:
224
+ action:
225
+ - ${env.action_dim}
226
+ input_normalization_modes:
227
+ observation.images.cam_right_wrist: mean_std
228
+ observation.images.cam_left_wrist: mean_std
229
+ observation.images.cam_high: mean_std
230
+ observation.state: mean_std
231
+ output_normalization_modes:
232
+ action: mean_std
233
+ vision_backbone: resnet18
234
+ pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
235
+ replace_final_stride_with_dilation: false
236
+ pre_norm: false
237
+ dim_model: 512
238
+ n_heads: 8
239
+ dim_feedforward: 3200
240
+ feedforward_activation: relu
241
+ n_encoder_layers: 4
242
+ n_decoder_layers: 1
243
+ use_vae: true
244
+ latent_dim: 32
245
+ n_vae_encoder_layers: 4
246
+ temporal_ensemble_momentum: null
247
+ dropout: 0.1
248
+ kl_weight: 10.0
checkpoints/005000/pretrained_model/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eba28285320bc2ddcda5e0ce0be693634a20ec638d10cf364694649bfc184964
3
+ size 206767160
checkpoints/005000/training_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af943082a3d9b919922d7de964e9f2bdc429b3d800234ea46f97ccedce9b309c
3
+ size 413053071
default.log ADDED
File without changes
wandb/debug-internal.log ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-12-07T01:07:41.167467035Z","level":"INFO","msg":"using version","core version":"0.19.0"}
2
+ {"time":"2024-12-07T01:07:41.167480199Z","level":"INFO","msg":"created symlink","path":"outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug-core.log"}
3
+ {"time":"2024-12-07T01:07:41.270189094Z","level":"INFO","msg":"created new stream","id":"bwwpk9vl"}
4
+ {"time":"2024-12-07T01:07:41.270216139Z","level":"INFO","msg":"stream: started","id":"bwwpk9vl"}
5
+ {"time":"2024-12-07T01:07:41.270250461Z","level":"INFO","msg":"writer: Do: started","stream_id":"bwwpk9vl"}
6
+ {"time":"2024-12-07T01:07:41.270250342Z","level":"INFO","msg":"sender: started","stream_id":"bwwpk9vl"}
7
+ {"time":"2024-12-07T01:07:41.270317361Z","level":"INFO","msg":"handler: started","stream_id":"bwwpk9vl"}
8
+ {"time":"2024-12-07T01:07:41.601065068Z","level":"INFO","msg":"Starting system monitor"}
9
+ {"time":"2024-12-07T01:07:46.320070438Z","level":"INFO","msg":"stream: closing","id":"bwwpk9vl"}
10
+ {"time":"2024-12-07T01:07:46.320109578Z","level":"INFO","msg":"Stopping system monitor"}
11
+ {"time":"2024-12-07T01:07:46.320581424Z","level":"INFO","msg":"Stopped system monitor"}
12
+ {"time":"2024-12-07T01:07:46.890807441Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
13
+ {"time":"2024-12-07T01:07:47.027194656Z","level":"INFO","msg":"handler: closed","stream_id":"bwwpk9vl"}
14
+ {"time":"2024-12-07T01:07:47.027227034Z","level":"INFO","msg":"sender: closed","stream_id":"bwwpk9vl"}
15
+ {"time":"2024-12-07T01:07:47.027228216Z","level":"INFO","msg":"writer: Close: closed","stream_id":"bwwpk9vl"}
16
+ {"time":"2024-12-07T01:07:47.027338658Z","level":"INFO","msg":"stream: closed","id":"bwwpk9vl"}
wandb/debug.log ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Current SDK version is 0.19.0
2
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Configure stats pid to 3507456
3
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/.config/wandb/settings
4
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/lerobot-hackathon/wandb/settings
5
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from environment variables
6
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] wandb: Using wandb-core as the SDK backend. Please refer to https://wandb.me/wandb-core for more information.
7
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:_log_setup():528] Logging user logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug.log
8
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:_log_setup():529] Logging internal logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug-internal.log
9
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():639] calling init triggers
10
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():645] wandb.init called with sweep_config: {}
11
+ config: {'resume': True, 'device': 'cuda', 'use_amp': False, 'seed': 1000, 'dataset_repo_id': 'ccop/aloha_stationary_replay_test_v2', 'video_backend': 'pyav', 'training': {'offline_steps': 5000, 'num_workers': 8, 'batch_size': 8, 'eval_freq': -1, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 10000, 'online_steps': 0, 'online_rollout_n_episodes': 1, 'online_rollout_batch_size': 1, 'online_steps_between_rollouts': 1, 'online_sampling_ratio': 0.5, 'online_env_seed': None, 'online_buffer_capacity': None, 'online_buffer_seed_size': 0, 'do_online_rollout_async': False, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'brightness': {'weight': 1, 'min_max': [0.8, 1.2]}, 'contrast': {'weight': 1, 'min_max': [0.8, 1.2]}, 'saturation': {'weight': 1, 'min_max': [0.5, 1.5]}, 'hue': {'weight': 1, 'min_max': [-0.05, 0.05]}, 'sharpness': {'weight': 1, 'min_max': [0.8, 1.2]}}, 'lr': 1e-05, 'lr_backbone': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10, 'delta_timestamps': {'action': [0.0, 0.03333333333333333, 0.06666666666666667, 0.1, 0.13333333333333333, 0.16666666666666666, 0.2, 0.23333333333333334, 0.26666666666666666, 0.3, 0.3333333333333333, 0.36666666666666664, 0.4, 0.43333333333333335, 0.4666666666666667, 0.5, 0.5333333333333333, 0.5666666666666667, 0.6, 0.6333333333333333, 0.6666666666666666, 0.7, 0.7333333333333333, 0.7666666666666667, 0.8, 0.8333333333333334, 0.8666666666666667, 0.9, 0.9333333333333333, 0.9666666666666667, 1.0, 1.0333333333333334, 1.0666666666666667, 1.1, 1.1333333333333333, 1.1666666666666667, 1.2, 1.2333333333333334, 1.2666666666666666, 1.3, 1.3333333333333333, 1.3666666666666667, 1.4, 1.4333333333333333, 1.4666666666666666, 1.5, 1.5333333333333334, 1.5666666666666667, 1.6, 1.6333333333333333, 1.6666666666666667, 1.7, 1.7333333333333334, 1.7666666666666666, 1.8, 1.8333333333333333, 1.8666666666666667, 1.9, 1.9333333333333333, 1.9666666666666666, 2.0, 2.033333333333333, 2.066666666666667, 2.1, 2.1333333333333333, 2.1666666666666665, 2.2, 2.2333333333333334, 2.2666666666666666, 2.3, 2.3333333333333335, 2.3666666666666667, 2.4, 2.433333333333333, 2.466666666666667, 2.5, 2.533333333333333, 2.566666666666667, 2.6, 2.6333333333333333, 2.6666666666666665, 2.7, 2.7333333333333334, 2.7666666666666666, 2.8, 2.8333333333333335, 2.8666666666666667, 2.9, 2.933333333333333, 2.966666666666667, 3.0, 3.033333333333333, 3.066666666666667, 3.1, 3.1333333333333333, 3.1666666666666665, 3.2, 3.2333333333333334, 3.2666666666666666, 3.3]}}, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot_real_aloha', 'notes': 'ws-lerobot-hackathon'}, 'fps': 30, 'env': {'name': 'real_world', 'task': None, 'state_dim': 14, 'action_dim': 14, 'fps': 30}, 'override_dataset_stats': {'observation.images.cam_right_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_left_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_high': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}}, 'policy': {'name': 'act', 'n_obs_steps': 1, 'chunk_size': 100, 'n_action_steps': 100, 'input_shapes': {'observation.images.cam_right_wrist': [3, 480, 640], 'observation.images.cam_left_wrist': [3, 480, 640], 'observation.images.cam_high': [3, 480, 640], 'observation.state': [14]}, 'output_shapes': {'action': [14]}, 'input_normalization_modes': {'observation.images.cam_right_wrist': 'mean_std', 'observation.images.cam_left_wrist': 'mean_std', 'observation.images.cam_high': 'mean_std', 'observation.state': 'mean_std'}, 'output_normalization_modes': {'action': 'mean_std'}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_momentum': None, 'dropout': 0.1, 'kl_weight': 10.0}}
12
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():688] starting backend
13
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():692] sending inform_init request
14
+ 2024-12-07 01:07:41,165 INFO MainThread:3507456 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
15
+ 2024-12-07 01:07:41,166 INFO MainThread:3507456 [wandb_init.py:init():705] backend started and connected
16
+ 2024-12-07 01:07:41,168 INFO MainThread:3507456 [wandb_init.py:init():798] updated telemetry
17
+ 2024-12-07 01:07:41,174 INFO MainThread:3507456 [wandb_init.py:init():830] communicating run to backend with 90.0 second timeout
18
+ 2024-12-07 01:07:41,592 INFO MainThread:3507456 [wandb_init.py:init():875] run resumed
19
+ 2024-12-07 01:07:41,597 INFO MainThread:3507456 [wandb_init.py:init():882] starting run threads in backend
20
+ 2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_console_start():2443] atexit reg
21
+ 2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2293] redirect: wrap_raw
22
+ 2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2358] Wrapping output streams.
23
+ 2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2383] Redirects installed.
24
+ 2024-12-07 01:07:41,713 INFO MainThread:3507456 [wandb_init.py:init():925] run started, returning control to user process
25
+ 2024-12-07 01:07:46,320 WARNING MsgRouterThr:3507456 [router.py:message_loop():75] message_loop has been closed
wandb/run-20241206_222830-bwwpk9vl/files/config.yaml ADDED
@@ -0,0 +1,194 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.19.0
4
+ m: []
5
+ python_version: 3.10.12
6
+ t:
7
+ "1":
8
+ - 1
9
+ - 41
10
+ - 49
11
+ - 50
12
+ - 51
13
+ - 55
14
+ "2":
15
+ - 1
16
+ - 41
17
+ - 49
18
+ - 50
19
+ - 51
20
+ - 55
21
+ "3":
22
+ - 13
23
+ - 15
24
+ - 16
25
+ - 23
26
+ - 55
27
+ - 61
28
+ "4": 3.10.12
29
+ "5": 0.19.0
30
+ "8":
31
+ - 5
32
+ "12": 0.19.0
33
+ "13": linux-x86_64
34
+ dataset_repo_id:
35
+ value: ccop/aloha_stationary_replay_test_v2
36
+ device:
37
+ value: cuda
38
+ env:
39
+ value:
40
+ action_dim: 14
41
+ fps: 30
42
+ name: real_world
43
+ state_dim: 14
44
+ task: null
45
+ eval:
46
+ value:
47
+ batch_size: 50
48
+ n_episodes: 50
49
+ use_async_envs: false
50
+ fps:
51
+ value: 30
52
+ override_dataset_stats:
53
+ value:
54
+ observation.images.cam_high:
55
+ mean:
56
+ - - - 0.485
57
+ - - - 0.456
58
+ - - - 0.406
59
+ std:
60
+ - - - 0.229
61
+ - - - 0.224
62
+ - - - 0.225
63
+ observation.images.cam_left_wrist:
64
+ mean:
65
+ - - - 0.485
66
+ - - - 0.456
67
+ - - - 0.406
68
+ std:
69
+ - - - 0.229
70
+ - - - 0.224
71
+ - - - 0.225
72
+ observation.images.cam_right_wrist:
73
+ mean:
74
+ - - - 0.485
75
+ - - - 0.456
76
+ - - - 0.406
77
+ std:
78
+ - - - 0.229
79
+ - - - 0.224
80
+ - - - 0.225
81
+ policy:
82
+ value:
83
+ chunk_size: 100
84
+ dim_feedforward: 3200
85
+ dim_model: 512
86
+ dropout: 0.1
87
+ feedforward_activation: relu
88
+ input_normalization_modes:
89
+ observation.images.cam_high: mean_std
90
+ observation.images.cam_left_wrist: mean_std
91
+ observation.images.cam_right_wrist: mean_std
92
+ observation.state: mean_std
93
+ input_shapes:
94
+ observation.images.cam_high:
95
+ - 3
96
+ - 480
97
+ - 640
98
+ observation.images.cam_left_wrist:
99
+ - 3
100
+ - 480
101
+ - 640
102
+ observation.images.cam_right_wrist:
103
+ - 3
104
+ - 480
105
+ - 640
106
+ observation.state:
107
+ - 14
108
+ kl_weight: 10
109
+ latent_dim: 32
110
+ n_action_steps: 100
111
+ n_decoder_layers: 1
112
+ n_encoder_layers: 4
113
+ n_heads: 8
114
+ n_obs_steps: 1
115
+ n_vae_encoder_layers: 4
116
+ name: act
117
+ output_normalization_modes:
118
+ action: mean_std
119
+ output_shapes:
120
+ action:
121
+ - 14
122
+ pre_norm: false
123
+ pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
124
+ replace_final_stride_with_dilation: false
125
+ temporal_ensemble_momentum: null
126
+ use_vae: true
127
+ vision_backbone: resnet18
128
+ resume:
129
+ value: false
130
+ seed:
131
+ value: 1000
132
+ training:
133
+ value:
134
+ batch_size: 8
135
+ delta_timestamps:
136
+ action: '[i / 30 for i in range(100)]'
137
+ do_online_rollout_async: false
138
+ eval_freq: -1
139
+ grad_clip_norm: 10
140
+ image_transforms:
141
+ brightness:
142
+ min_max:
143
+ - 0.8
144
+ - 1.2
145
+ weight: 1
146
+ contrast:
147
+ min_max:
148
+ - 0.8
149
+ - 1.2
150
+ weight: 1
151
+ enable: false
152
+ hue:
153
+ min_max:
154
+ - -0.05
155
+ - 0.05
156
+ weight: 1
157
+ max_num_transforms: 3
158
+ random_order: false
159
+ saturation:
160
+ min_max:
161
+ - 0.5
162
+ - 1.5
163
+ weight: 1
164
+ sharpness:
165
+ min_max:
166
+ - 0.8
167
+ - 1.2
168
+ weight: 1
169
+ log_freq: 200
170
+ lr: 1e-05
171
+ lr_backbone: 1e-05
172
+ num_workers: 8
173
+ offline_steps: 5000
174
+ online_buffer_capacity: null
175
+ online_buffer_seed_size: 0
176
+ online_env_seed: null
177
+ online_rollout_batch_size: 1
178
+ online_rollout_n_episodes: 1
179
+ online_sampling_ratio: 0.5
180
+ online_steps: 0
181
+ online_steps_between_rollouts: 1
182
+ save_checkpoint: true
183
+ save_freq: 10000
184
+ weight_decay: 0.0001
185
+ use_amp:
186
+ value: false
187
+ video_backend:
188
+ value: pyav
189
+ wandb:
190
+ value:
191
+ disable_artifact: false
192
+ enable: true
193
+ notes: ws-lerobot-hackathon
194
+ project: lerobot_real_aloha
wandb/run-20241206_222830-bwwpk9vl/files/output.log ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Logs will be synced with wandb.
2
+ INFO 2024-12-06 22:28:30 n/logger.py:132 Track this run --> https://wandb.ai/zaringleb/lerobot_real_aloha/runs/bwwpk9vl
3
+ INFO 2024-12-06 22:28:30 ts/train.py:312 make_dataset
4
+ WARNING 2024-12-06 22:28:30 s/factory.py:68 There might be a mismatch between your training dataset (dataset_repo_id='ccop/aloha_stationary_replay_test_v2') and your environment (cfg.env.name='real_world').
5
+ Fetching 9 files: 100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 9/9 [00:00<00:00, 39945.75it/s]
6
+ INFO 2024-12-06 22:28:32 ts/train.py:328 make_policy
7
+ WARNING 2024-12-06 22:28:32 s/factory.py:28 Hydra config is missing arguments: {'temporal_ensemble_coeff'}
8
+ /home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py:338: FutureWarning: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.
9
+ grad_scaler = GradScaler(enabled=cfg.use_amp)
10
+ INFO 2024-12-06 22:28:33 on/logger.py:39 Output dir: outputs/train/2024-12-06/22-28-29_real_world_act_default
11
+ INFO 2024-12-06 22:28:33 ts/train.py:349 cfg.env.task=None
12
+ INFO 2024-12-06 22:28:33 ts/train.py:350 cfg.training.offline_steps=5000 (5K)
13
+ INFO 2024-12-06 22:28:33 ts/train.py:351 cfg.training.online_steps=0
14
+ INFO 2024-12-06 22:28:33 ts/train.py:352 offline_dataset.num_samples=800 (800)
15
+ INFO 2024-12-06 22:28:33 ts/train.py:353 offline_dataset.num_episodes=1
16
+ INFO 2024-12-06 22:28:33 ts/train.py:354 num_learnable_params=51613582 (52M)
17
+ INFO 2024-12-06 22:28:33 ts/train.py:355 num_total_params=51613684 (52M)
18
+ INFO 2024-12-06 22:28:33 ts/train.py:421 Start offline training on a fixed dataset
19
+ INFO 2024-12-06 22:28:44 ts/train.py:192 step:0 smpl:8 ep:0 epch:0.01 loss:85.424 grdn:1036.794 lr:1.0e-05 updt_s:7.126 data_s:3.108
20
+ INFO 2024-12-06 22:32:21 ts/train.py:192 step:200 smpl:2K ep:2 epch:2.01 loss:3.562 grdn:97.104 lr:1.0e-05 updt_s:1.076 data_s:2.453
21
+ INFO 2024-12-06 22:36:00 ts/train.py:192 step:400 smpl:3K ep:4 epch:4.01 loss:2.455 grdn:86.458 lr:1.0e-05 updt_s:1.094 data_s:2.019
22
+ INFO 2024-12-06 22:39:40 ts/train.py:192 step:600 smpl:5K ep:6 epch:6.01 loss:2.300 grdn:76.224 lr:1.0e-05 updt_s:1.088 data_s:2.352
23
+ INFO 2024-12-06 22:43:19 ts/train.py:192 step:800 smpl:6K ep:8 epch:8.01 loss:1.897 grdn:66.798 lr:1.0e-05 updt_s:1.108 data_s:2.149
24
+ INFO 2024-12-06 22:46:58 ts/train.py:192 step:1K smpl:8K ep:10 epch:10.01 loss:1.727 grdn:65.505 lr:1.0e-05 updt_s:1.100 data_s:1.999
25
+ INFO 2024-12-06 22:50:37 ts/train.py:192 step:1K smpl:10K ep:12 epch:12.01 loss:1.474 grdn:56.429 lr:1.0e-05 updt_s:1.091 data_s:2.366
26
+ INFO 2024-12-06 22:54:16 ts/train.py:192 step:1K smpl:11K ep:14 epch:14.01 loss:1.324 grdn:52.798 lr:1.0e-05 updt_s:1.104 data_s:1.794
27
+ INFO 2024-12-06 22:57:55 ts/train.py:192 step:2K smpl:13K ep:16 epch:16.01 loss:1.275 grdn:48.997 lr:1.0e-05 updt_s:1.099 data_s:2.227
28
+ INFO 2024-12-06 23:01:35 ts/train.py:192 step:2K smpl:14K ep:18 epch:18.01 loss:1.195 grdn:50.355 lr:1.0e-05 updt_s:1.411 data_s:2.189
29
+ INFO 2024-12-06 23:05:13 ts/train.py:192 step:2K smpl:16K ep:20 epch:20.01 loss:1.077 grdn:40.395 lr:1.0e-05 updt_s:1.090 data_s:1.955
30
+ INFO 2024-12-06 23:08:53 ts/train.py:192 step:2K smpl:18K ep:22 epch:22.01 loss:0.905 grdn:47.089 lr:1.0e-05 updt_s:1.090 data_s:2.396
31
+ INFO 2024-12-06 23:12:32 ts/train.py:192 step:2K smpl:19K ep:24 epch:24.01 loss:0.878 grdn:44.676 lr:1.0e-05 updt_s:1.090 data_s:2.298
32
+ INFO 2024-12-06 23:16:11 ts/train.py:192 step:3K smpl:21K ep:26 epch:26.01 loss:0.736 grdn:41.427 lr:1.0e-05 updt_s:1.106 data_s:2.089
33
+ INFO 2024-12-06 23:19:50 ts/train.py:192 step:3K smpl:22K ep:28 epch:28.01 loss:0.633 grdn:33.782 lr:1.0e-05 updt_s:1.090 data_s:2.224
34
+ INFO 2024-12-06 23:23:29 ts/train.py:192 step:3K smpl:24K ep:30 epch:30.01 loss:0.550 grdn:34.230 lr:1.0e-05 updt_s:1.103 data_s:2.172
35
+ INFO 2024-12-06 23:27:08 ts/train.py:192 step:3K smpl:26K ep:32 epch:32.01 loss:0.572 grdn:37.149 lr:1.0e-05 updt_s:1.086 data_s:2.248
36
+ INFO 2024-12-06 23:30:47 ts/train.py:192 step:3K smpl:27K ep:34 epch:34.01 loss:0.490 grdn:34.704 lr:1.0e-05 updt_s:1.093 data_s:1.711
37
+ INFO 2024-12-06 23:34:25 ts/train.py:192 step:4K smpl:29K ep:36 epch:36.01 loss:0.459 grdn:28.810 lr:1.0e-05 updt_s:1.105 data_s:1.716
38
+ INFO 2024-12-06 23:38:04 ts/train.py:192 step:4K smpl:30K ep:38 epch:38.01 loss:0.450 grdn:30.977 lr:1.0e-05 updt_s:1.095 data_s:2.136
39
+ INFO 2024-12-06 23:41:44 ts/train.py:192 step:4K smpl:32K ep:40 epch:40.01 loss:0.376 grdn:34.368 lr:1.0e-05 updt_s:1.092 data_s:1.970
40
+ INFO 2024-12-06 23:45:23 ts/train.py:192 step:4K smpl:34K ep:42 epch:42.01 loss:0.309 grdn:26.141 lr:1.0e-05 updt_s:1.090 data_s:2.131
41
+ INFO 2024-12-06 23:49:02 ts/train.py:192 step:4K smpl:35K ep:44 epch:44.01 loss:0.282 grdn:21.178 lr:1.0e-05 updt_s:1.095 data_s:2.192
42
+ INFO 2024-12-06 23:52:41 ts/train.py:192 step:5K smpl:37K ep:46 epch:46.01 loss:0.255 grdn:25.957 lr:1.0e-05 updt_s:1.078 data_s:2.502
43
+ INFO 2024-12-06 23:56:20 ts/train.py:192 step:5K smpl:38K ep:48 epch:48.01 loss:0.250 grdn:20.830 lr:1.0e-05 updt_s:1.088 data_s:2.212
44
+ INFO 2024-12-06 23:59:56 ts/train.py:383 Checkpoint policy after step 5000
45
+ INFO 2024-12-06 23:59:58 ts/train.py:393 Resume training
46
+ INFO 2024-12-06 23:59:58 ts/train.py:455 End of training
wandb/run-20241206_222830-bwwpk9vl/files/requirements.txt ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ pymunk==6.9.0
2
+ charset-normalizer==3.4.0
3
+ pip==22.0.2
4
+ multidict==6.1.0
5
+ pytz==2024.2
6
+ pandas==2.2.3
7
+ fasteners==0.19
8
+ einops==0.8.0
9
+ setproctitle==1.3.4
10
+ python-dateutil==2.9.0.post0
11
+ pydantic==2.10.3
12
+ dm-control==1.0.14
13
+ MarkupSafe==3.0.2
14
+ safetensors==0.4.5
15
+ cloudpickle==3.1.0
16
+ imageio-ffmpeg==0.5.1
17
+ smmap==5.0.1
18
+ huggingface-hub==0.26.5
19
+ torch==2.6.0.dev20241112+cu121
20
+ nvidia-cusolver-cu12==11.4.5.107
21
+ inquirerpy==0.3.4
22
+ soupsieve==2.6
23
+ deepdiff==8.0.1
24
+ nvidia-nvjitlink-cu12==12.4.127
25
+ aiosignal==1.3.1
26
+ dm-tree==0.1.8
27
+ aiohappyeyeballs==2.4.4
28
+ propcache==0.2.1
29
+ gym-aloha==0.1.1
30
+ labmaze==1.0.6
31
+ pyav==14.0.1
32
+ nvidia-cuda-cupti-cu12==12.1.105
33
+ cffi==1.17.1
34
+ importlib_metadata==8.5.0
35
+ nvidia-cuda-runtime-cu12==12.1.105
36
+ pycparser==2.22
37
+ h5py==3.12.1
38
+ nvidia-nccl-cu12==2.21.5
39
+ orderly-set==5.2.2
40
+ pyarrow==18.1.0
41
+ Flask==3.1.0
42
+ multiprocess==0.70.16
43
+ blinker==1.9.0
44
+ regex==2024.11.6
45
+ Jinja2==3.1.4
46
+ tqdm==4.67.1
47
+ certifi==2024.8.30
48
+ frozenlist==1.5.0
49
+ attrs==24.2.0
50
+ pytorch-triton==3.1.0+cf34004b8a
51
+ omegaconf==2.3.0
52
+ itsdangerous==2.2.0
53
+ packaging==24.2
54
+ pfzy==0.3.4
55
+ pydantic_core==2.27.1
56
+ antlr4-python3-runtime==4.9.3
57
+ cmake==3.31.1
58
+ imageio==2.36.1
59
+ setuptools==59.6.0
60
+ nvidia-cusparselt-cu12==0.6.2
61
+ zipp==3.21.0
62
+ torchvision==0.20.0.dev20241112+cu121
63
+ nvidia-curand-cu12==10.3.2.106
64
+ PyOpenGL-accelerate==3.1.7
65
+ numpy==1.26.4
66
+ dm-env==1.6
67
+ nvidia-cusparse-cu12==12.1.0.106
68
+ networkx==3.4.2
69
+ triton==3.1.0
70
+ termcolor==2.5.0
71
+ gitdb==4.0.11
72
+ torchaudio==2.5.0.dev20241112+cu121
73
+ glfw==2.8.0
74
+ tzdata==2024.2
75
+ pillow==11.0.0
76
+ idna==3.10
77
+ pyparsing==3.2.0
78
+ typing_extensions==4.12.2
79
+ wcwidth==0.2.13
80
+ sympy==1.13.1
81
+ nvidia-cublas-cu12==12.1.3.1
82
+ zarr==2.18.3
83
+ protobuf==5.29.1
84
+ annotated-types==0.7.0
85
+ xxhash==3.5.0
86
+ aiohttp==3.11.10
87
+ Werkzeug==3.1.3
88
+ mujoco==2.3.7
89
+ gymnasium==0.29.1
90
+ rerun-sdk==0.20.3
91
+ nvidia-cufft-cu12==11.0.2.54
92
+ dill==0.3.8
93
+ scipy==1.14.1
94
+ hydra-core==1.3.2
95
+ fsspec==2024.9.0
96
+ platformdirs==4.3.6
97
+ PySocks==1.7.1
98
+ PyOpenGL==3.1.7
99
+ requests==2.32.3
100
+ lxml==5.3.0
101
+ Farama-Notifications==0.0.4
102
+ nvidia-cuda-nvrtc-cu12==12.1.105
103
+ numba==0.60.0
104
+ docker-pycreds==0.4.0
105
+ six==1.17.0
106
+ lerobot==0.1.0
107
+ nvidia-cudnn-cu12==9.1.0.70
108
+ sentry-sdk==2.19.2
109
+ absl-py==2.1.0
110
+ wandb==0.19.0
111
+ mpmath==1.3.0
112
+ llvmlite==0.43.0
113
+ numcodecs==0.13.1
114
+ GitPython==3.1.43
115
+ nvidia-nvtx-cu12==12.1.105
116
+ prompt_toolkit==3.0.48
117
+ datasets==3.1.0
118
+ opencv-python==4.10.0.84
119
+ filelock==3.16.1
120
+ async-timeout==5.0.1
121
+ diffusers==0.31.0
122
+ yarl==1.18.3
123
+ click==8.1.7
124
+ asciitree==0.3.3
125
+ psutil==6.1.0
126
+ gdown==5.2.0
127
+ PyYAML==6.0.2
128
+ urllib3==2.2.3
129
+ beautifulsoup4==4.12.3
wandb/run-20241206_222830-bwwpk9vl/files/wandb-metadata.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1015-aws-x86_64-with-glibc2.35",
3
+ "python": "CPython 3.10.12",
4
+ "startedAt": "2024-12-06T22:28:30.311945Z",
5
+ "args": [
6
+ "policy=act_aloha_real",
7
+ "env=aloha_real",
8
+ "dataset_repo_id=ccop/aloha_stationary_replay_test_v2"
9
+ ],
10
+ "program": "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py",
11
+ "codePath": "lerobot/scripts/train.py",
12
+ "git": {
13
+ "remote": "[email protected]:HumanoidTeam/lerobot-hackathon.git",
14
+ "commit": "ab8aa3f8e7b6e5486d7af26ccd319d358ffad579"
15
+ },
16
+ "email": "[email protected]",
17
+ "root": "outputs/train/2024-12-06/22-28-29_real_world_act_default",
18
+ "host": "ip-172-31-20-130",
19
+ "username": "humanoidteam",
20
+ "executable": "/home/ubuntu/lerobot-hackathon/lerobot/bin/python",
21
+ "codePathLocal": "lerobot/scripts/train.py",
22
+ "cpu_count": 4,
23
+ "cpu_count_logical": 8,
24
+ "gpu": "Tesla T4",
25
+ "gpu_count": 1,
26
+ "disk": {
27
+ "/": {
28
+ "total": "311993479168",
29
+ "used": "216540794880"
30
+ }
31
+ },
32
+ "memory": {
33
+ "total": "33263837184"
34
+ },
35
+ "cpu": {
36
+ "count": 4,
37
+ "countLogical": 8
38
+ },
39
+ "gpu_nvidia": [
40
+ {
41
+ "name": "Tesla T4",
42
+ "memoryTotal": "16106127360",
43
+ "cudaCores": 2560,
44
+ "architecture": "Turing"
45
+ }
46
+ ],
47
+ "cudaVersion": "12.4"
48
+ }
wandb/run-20241206_222830-bwwpk9vl/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train/lr":1e-05,"train/loss":0.2502947151660919,"train/is_online":false,"train/num_samples":38408,"train/num_episodes":48.01,"train/kld_loss":0.01526648923754692,"train/grad_norm":20.83009910583496,"train/dataloading_s":2.211516670999117,"_timestamp":1.7335293805980325e+09,"_step":4800,"_runtime":5488.627260612,"train/step":4800,"train/l1_loss":0.09762981534004211,"train/num_epochs":48.01,"_wandb":{"runtime":5488},"train/update_s":1.0881254139821976}
wandb/run-20241206_222830-bwwpk9vl/logs/debug-core.log ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-12-06T22:28:29.883207186Z","level":"INFO","msg":"started logging, with flags","port-filename":"/tmp/tmpf2z320nz/port-2539524.txt","pid":2539524,"debug":false,"disable-analytics":false}
2
+ {"time":"2024-12-06T22:28:29.883234859Z","level":"INFO","msg":"FeatureState","shutdownOnParentExitEnabled":false}
3
+ {"time":"2024-12-06T22:28:29.886661968Z","level":"INFO","msg":"Will exit if parent process dies.","ppid":2539524}
4
+ {"time":"2024-12-06T22:28:29.886681547Z","level":"INFO","msg":"server is running","addr":{"IP":"127.0.0.1","Port":43495,"Zone":""}}
5
+ {"time":"2024-12-06T22:28:30.072566654Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:55002"}
6
+ {"time":"2024-12-06T22:28:30.312961224Z","level":"INFO","msg":"handleInformInit: received","streamId":"bwwpk9vl","id":"127.0.0.1:55002"}
7
+ {"time":"2024-12-06T22:28:30.416433116Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"bwwpk9vl","id":"127.0.0.1:55002"}
8
+ {"time":"2024-12-06T23:59:58.939118572Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"127.0.0.1:55002"}
9
+ {"time":"2024-12-06T23:59:58.939192863Z","level":"INFO","msg":"server is shutting down"}
10
+ {"time":"2024-12-06T23:59:58.939181535Z","level":"INFO","msg":"connection: Close: initiating connection closure","id":"127.0.0.1:55002"}
11
+ {"time":"2024-12-06T23:59:58.939312003Z","level":"INFO","msg":"connection: Close: connection successfully closed","id":"127.0.0.1:55002"}
12
+ {"time":"2024-12-07T00:00:06.315410708Z","level":"ERROR","msg":"processOutgoingData: flush error","error":"write tcp 127.0.0.1:43495->127.0.0.1:55002: use of closed network connection","id":"127.0.0.1:55002"}
13
+ {"time":"2024-12-07T00:00:06.536210754Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"127.0.0.1:55002"}
14
+ {"time":"2024-12-07T00:00:06.536232465Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"127.0.0.1:55002"}
15
+ {"time":"2024-12-07T00:00:06.536247048Z","level":"INFO","msg":"server is closed"}
wandb/run-20241206_222830-bwwpk9vl/logs/debug-internal.log ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-12-06T22:28:30.313104758Z","level":"INFO","msg":"using version","core version":"0.19.0"}
2
+ {"time":"2024-12-06T22:28:30.313117284Z","level":"INFO","msg":"created symlink","path":"outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241206_222830-bwwpk9vl/logs/debug-core.log"}
3
+ {"time":"2024-12-06T22:28:30.416399043Z","level":"INFO","msg":"created new stream","id":"bwwpk9vl"}
4
+ {"time":"2024-12-06T22:28:30.416428271Z","level":"INFO","msg":"stream: started","id":"bwwpk9vl"}
5
+ {"time":"2024-12-06T22:28:30.416469205Z","level":"INFO","msg":"handler: started","stream_id":"bwwpk9vl"}
6
+ {"time":"2024-12-06T22:28:30.416473548Z","level":"INFO","msg":"sender: started","stream_id":"bwwpk9vl"}
7
+ {"time":"2024-12-06T22:28:30.416459377Z","level":"INFO","msg":"writer: Do: started","stream_id":"bwwpk9vl"}
8
+ {"time":"2024-12-06T22:28:30.658850895Z","level":"INFO","msg":"Starting system monitor"}
9
+ {"time":"2024-12-06T23:59:58.939177282Z","level":"INFO","msg":"stream: closing","id":"bwwpk9vl"}
10
+ {"time":"2024-12-06T23:59:58.939228097Z","level":"INFO","msg":"Stopping system monitor"}
11
+ {"time":"2024-12-06T23:59:58.939881357Z","level":"INFO","msg":"Stopped system monitor"}
12
+ {"time":"2024-12-07T00:00:06.36632207Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
13
+ {"time":"2024-12-07T00:00:06.536040063Z","level":"INFO","msg":"handler: closed","stream_id":"bwwpk9vl"}
14
+ {"time":"2024-12-07T00:00:06.536088365Z","level":"INFO","msg":"writer: Close: closed","stream_id":"bwwpk9vl"}
15
+ {"time":"2024-12-07T00:00:06.536107691Z","level":"INFO","msg":"sender: closed","stream_id":"bwwpk9vl"}
16
+ {"time":"2024-12-07T00:00:06.536149416Z","level":"INFO","msg":"stream: closed","id":"bwwpk9vl"}
wandb/run-20241206_222830-bwwpk9vl/logs/debug.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-12-06 22:28:30,306 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Current SDK version is 0.19.0
2
+ 2024-12-06 22:28:30,306 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Configure stats pid to 2539524
3
+ 2024-12-06 22:28:30,306 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/.config/wandb/settings
4
+ 2024-12-06 22:28:30,306 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/lerobot-hackathon/wandb/settings
5
+ 2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_setup.py:_flush():68] Loading settings from environment variables
6
+ 2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_setup.py:_flush():68] wandb: Using wandb-core as the SDK backend. Please refer to https://wandb.me/wandb-core for more information.
7
+ 2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:_log_setup():528] Logging user logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241206_222830-bwwpk9vl/logs/debug.log
8
+ 2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:_log_setup():529] Logging internal logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241206_222830-bwwpk9vl/logs/debug-internal.log
9
+ 2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:init():639] calling init triggers
10
+ 2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:init():645] wandb.init called with sweep_config: {}
11
+ config: {'resume': False, 'device': 'cuda', 'use_amp': False, 'seed': 1000, 'dataset_repo_id': 'ccop/aloha_stationary_replay_test_v2', 'video_backend': 'pyav', 'training': {'offline_steps': 5000, 'num_workers': 8, 'batch_size': 8, 'eval_freq': -1, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 10000, 'online_steps': 0, 'online_rollout_n_episodes': 1, 'online_rollout_batch_size': 1, 'online_steps_between_rollouts': 1, 'online_sampling_ratio': 0.5, 'online_env_seed': None, 'online_buffer_capacity': None, 'online_buffer_seed_size': 0, 'do_online_rollout_async': False, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'brightness': {'weight': 1, 'min_max': [0.8, 1.2]}, 'contrast': {'weight': 1, 'min_max': [0.8, 1.2]}, 'saturation': {'weight': 1, 'min_max': [0.5, 1.5]}, 'hue': {'weight': 1, 'min_max': [-0.05, 0.05]}, 'sharpness': {'weight': 1, 'min_max': [0.8, 1.2]}}, 'lr': 1e-05, 'lr_backbone': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10, 'delta_timestamps': {'action': '[i / 30 for i in range(100)]'}}, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot_real_aloha', 'notes': 'ws-lerobot-hackathon'}, 'fps': 30, 'env': {'name': 'real_world', 'task': None, 'state_dim': 14, 'action_dim': 14, 'fps': 30}, 'override_dataset_stats': {'observation.images.cam_right_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_left_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_high': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}}, 'policy': {'name': 'act', 'n_obs_steps': 1, 'chunk_size': 100, 'n_action_steps': 100, 'input_shapes': {'observation.images.cam_right_wrist': [3, 480, 640], 'observation.images.cam_left_wrist': [3, 480, 640], 'observation.images.cam_high': [3, 480, 640], 'observation.state': [14]}, 'output_shapes': {'action': [14]}, 'input_normalization_modes': {'observation.images.cam_right_wrist': 'mean_std', 'observation.images.cam_left_wrist': 'mean_std', 'observation.images.cam_high': 'mean_std', 'observation.state': 'mean_std'}, 'output_normalization_modes': {'action': 'mean_std'}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_momentum': None, 'dropout': 0.1, 'kl_weight': 10.0}}
12
+ 2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:init():688] starting backend
13
+ 2024-12-06 22:28:30,307 INFO MainThread:2539524 [wandb_init.py:init():692] sending inform_init request
14
+ 2024-12-06 22:28:30,311 INFO MainThread:2539524 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
15
+ 2024-12-06 22:28:30,311 INFO MainThread:2539524 [wandb_init.py:init():705] backend started and connected
16
+ 2024-12-06 22:28:30,313 INFO MainThread:2539524 [wandb_init.py:init():798] updated telemetry
17
+ 2024-12-06 22:28:30,319 INFO MainThread:2539524 [wandb_init.py:init():830] communicating run to backend with 90.0 second timeout
18
+ 2024-12-06 22:28:30,655 INFO MainThread:2539524 [wandb_init.py:init():882] starting run threads in backend
19
+ 2024-12-06 22:28:30,767 INFO MainThread:2539524 [wandb_run.py:_console_start():2443] atexit reg
20
+ 2024-12-06 22:28:30,767 INFO MainThread:2539524 [wandb_run.py:_redirect():2293] redirect: wrap_raw
21
+ 2024-12-06 22:28:30,767 INFO MainThread:2539524 [wandb_run.py:_redirect():2358] Wrapping output streams.
22
+ 2024-12-06 22:28:30,767 INFO MainThread:2539524 [wandb_run.py:_redirect():2383] Redirects installed.
23
+ 2024-12-06 22:28:30,769 INFO MainThread:2539524 [wandb_init.py:init():925] run started, returning control to user process
24
+ 2024-12-06 23:59:58,939 WARNING MsgRouterThr:2539524 [router.py:message_loop():75] message_loop has been closed
wandb/run-20241206_222830-bwwpk9vl/run-bwwpk9vl.wandb ADDED
Binary file (931 kB). View file
 
wandb/run-20241207_010636-bwwpk9vl/files/config.yaml ADDED
@@ -0,0 +1,296 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.19.0
4
+ m: []
5
+ python_version: 3.10.12
6
+ t:
7
+ "1":
8
+ - 1
9
+ - 41
10
+ - 49
11
+ - 50
12
+ - 51
13
+ - 55
14
+ "2":
15
+ - 1
16
+ - 41
17
+ - 49
18
+ - 50
19
+ - 51
20
+ - 55
21
+ "3":
22
+ - 5
23
+ - 13
24
+ - 14
25
+ - 15
26
+ - 16
27
+ - 23
28
+ - 55
29
+ - 62
30
+ "4": 3.10.12
31
+ "5": 0.19.0
32
+ "8":
33
+ - 5
34
+ "12": 0.19.0
35
+ "13": linux-x86_64
36
+ dataset_repo_id:
37
+ value: ccop/aloha_stationary_replay_test_v2
38
+ device:
39
+ value: cuda
40
+ env:
41
+ value:
42
+ action_dim: 14
43
+ fps: 30
44
+ name: real_world
45
+ state_dim: 14
46
+ task: null
47
+ eval:
48
+ value:
49
+ batch_size: 50
50
+ n_episodes: 50
51
+ use_async_envs: false
52
+ fps:
53
+ value: 30
54
+ override_dataset_stats:
55
+ value:
56
+ observation.images.cam_high:
57
+ mean:
58
+ - - - 0.485
59
+ - - - 0.456
60
+ - - - 0.406
61
+ std:
62
+ - - - 0.229
63
+ - - - 0.224
64
+ - - - 0.225
65
+ observation.images.cam_left_wrist:
66
+ mean:
67
+ - - - 0.485
68
+ - - - 0.456
69
+ - - - 0.406
70
+ std:
71
+ - - - 0.229
72
+ - - - 0.224
73
+ - - - 0.225
74
+ observation.images.cam_right_wrist:
75
+ mean:
76
+ - - - 0.485
77
+ - - - 0.456
78
+ - - - 0.406
79
+ std:
80
+ - - - 0.229
81
+ - - - 0.224
82
+ - - - 0.225
83
+ policy:
84
+ value:
85
+ chunk_size: 100
86
+ dim_feedforward: 3200
87
+ dim_model: 512
88
+ dropout: 0.1
89
+ feedforward_activation: relu
90
+ input_normalization_modes:
91
+ observation.images.cam_high: mean_std
92
+ observation.images.cam_left_wrist: mean_std
93
+ observation.images.cam_right_wrist: mean_std
94
+ observation.state: mean_std
95
+ input_shapes:
96
+ observation.images.cam_high:
97
+ - 3
98
+ - 480
99
+ - 640
100
+ observation.images.cam_left_wrist:
101
+ - 3
102
+ - 480
103
+ - 640
104
+ observation.images.cam_right_wrist:
105
+ - 3
106
+ - 480
107
+ - 640
108
+ observation.state:
109
+ - 14
110
+ kl_weight: 10
111
+ latent_dim: 32
112
+ n_action_steps: 100
113
+ n_decoder_layers: 1
114
+ n_encoder_layers: 4
115
+ n_heads: 8
116
+ n_obs_steps: 1
117
+ n_vae_encoder_layers: 4
118
+ name: act
119
+ output_normalization_modes:
120
+ action: mean_std
121
+ output_shapes:
122
+ action:
123
+ - 14
124
+ pre_norm: false
125
+ pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
126
+ replace_final_stride_with_dilation: false
127
+ temporal_ensemble_momentum: null
128
+ use_vae: true
129
+ vision_backbone: resnet18
130
+ resume:
131
+ value: true
132
+ seed:
133
+ value: 1000
134
+ training:
135
+ value:
136
+ batch_size: 8
137
+ delta_timestamps:
138
+ action:
139
+ - 0
140
+ - 0.03333333333333333
141
+ - 0.06666666666666667
142
+ - 0.1
143
+ - 0.13333333333333333
144
+ - 0.16666666666666666
145
+ - 0.2
146
+ - 0.23333333333333334
147
+ - 0.26666666666666666
148
+ - 0.3
149
+ - 0.3333333333333333
150
+ - 0.36666666666666664
151
+ - 0.4
152
+ - 0.43333333333333335
153
+ - 0.4666666666666667
154
+ - 0.5
155
+ - 0.5333333333333333
156
+ - 0.5666666666666667
157
+ - 0.6
158
+ - 0.6333333333333333
159
+ - 0.6666666666666666
160
+ - 0.7
161
+ - 0.7333333333333333
162
+ - 0.7666666666666667
163
+ - 0.8
164
+ - 0.8333333333333334
165
+ - 0.8666666666666667
166
+ - 0.9
167
+ - 0.9333333333333333
168
+ - 0.9666666666666667
169
+ - 1
170
+ - 1.0333333333333334
171
+ - 1.0666666666666667
172
+ - 1.1
173
+ - 1.1333333333333333
174
+ - 1.1666666666666667
175
+ - 1.2
176
+ - 1.2333333333333334
177
+ - 1.2666666666666666
178
+ - 1.3
179
+ - 1.3333333333333333
180
+ - 1.3666666666666667
181
+ - 1.4
182
+ - 1.4333333333333333
183
+ - 1.4666666666666666
184
+ - 1.5
185
+ - 1.5333333333333334
186
+ - 1.5666666666666667
187
+ - 1.6
188
+ - 1.6333333333333333
189
+ - 1.6666666666666667
190
+ - 1.7
191
+ - 1.7333333333333334
192
+ - 1.7666666666666666
193
+ - 1.8
194
+ - 1.8333333333333333
195
+ - 1.8666666666666667
196
+ - 1.9
197
+ - 1.9333333333333333
198
+ - 1.9666666666666666
199
+ - 2
200
+ - 2.033333333333333
201
+ - 2.066666666666667
202
+ - 2.1
203
+ - 2.1333333333333333
204
+ - 2.1666666666666665
205
+ - 2.2
206
+ - 2.2333333333333334
207
+ - 2.2666666666666666
208
+ - 2.3
209
+ - 2.3333333333333335
210
+ - 2.3666666666666667
211
+ - 2.4
212
+ - 2.433333333333333
213
+ - 2.466666666666667
214
+ - 2.5
215
+ - 2.533333333333333
216
+ - 2.566666666666667
217
+ - 2.6
218
+ - 2.6333333333333333
219
+ - 2.6666666666666665
220
+ - 2.7
221
+ - 2.7333333333333334
222
+ - 2.7666666666666666
223
+ - 2.8
224
+ - 2.8333333333333335
225
+ - 2.8666666666666667
226
+ - 2.9
227
+ - 2.933333333333333
228
+ - 2.966666666666667
229
+ - 3
230
+ - 3.033333333333333
231
+ - 3.066666666666667
232
+ - 3.1
233
+ - 3.1333333333333333
234
+ - 3.1666666666666665
235
+ - 3.2
236
+ - 3.2333333333333334
237
+ - 3.2666666666666666
238
+ - 3.3
239
+ do_online_rollout_async: false
240
+ eval_freq: -1
241
+ grad_clip_norm: 10
242
+ image_transforms:
243
+ brightness:
244
+ min_max:
245
+ - 0.8
246
+ - 1.2
247
+ weight: 1
248
+ contrast:
249
+ min_max:
250
+ - 0.8
251
+ - 1.2
252
+ weight: 1
253
+ enable: false
254
+ hue:
255
+ min_max:
256
+ - -0.05
257
+ - 0.05
258
+ weight: 1
259
+ max_num_transforms: 3
260
+ random_order: false
261
+ saturation:
262
+ min_max:
263
+ - 0.5
264
+ - 1.5
265
+ weight: 1
266
+ sharpness:
267
+ min_max:
268
+ - 0.8
269
+ - 1.2
270
+ weight: 1
271
+ log_freq: 200
272
+ lr: 1e-05
273
+ lr_backbone: 1e-05
274
+ num_workers: 8
275
+ offline_steps: 5000
276
+ online_buffer_capacity: null
277
+ online_buffer_seed_size: 0
278
+ online_env_seed: null
279
+ online_rollout_batch_size: 1
280
+ online_rollout_n_episodes: 1
281
+ online_sampling_ratio: 0.5
282
+ online_steps: 0
283
+ online_steps_between_rollouts: 1
284
+ save_checkpoint: true
285
+ save_freq: 10000
286
+ weight_decay: 0.0001
287
+ use_amp:
288
+ value: false
289
+ video_backend:
290
+ value: pyav
291
+ wandb:
292
+ value:
293
+ disable_artifact: false
294
+ enable: true
295
+ notes: ws-lerobot-hackathon
296
+ project: lerobot_real_aloha
wandb/run-20241207_010636-bwwpk9vl/files/output.log ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Logs will be synced with wandb.
2
+ INFO 2024-12-07 01:06:36 n/logger.py:132 Track this run --> https://wandb.ai/zaringleb/lerobot_real_aloha/runs/bwwpk9vl
3
+ INFO 2024-12-07 01:06:36 ts/train.py:312 make_dataset
4
+ WARNING 2024-12-07 01:06:36 s/factory.py:68 There might be a mismatch between your training dataset (dataset_repo_id='ccop/aloha_stationary_replay_test_v2') and your environment (cfg.env.name='real_world').
5
+ Fetching 9 files: 100%|█████████████████████████████████████████████████████████████████████████████████████████████| 9/9 [00:00<00:00, 19774.09it/s]
6
+ INFO 2024-12-07 01:06:39 ts/train.py:328 make_policy
7
+ WARNING 2024-12-07 01:06:39 s/factory.py:28 Hydra config is missing arguments: {'temporal_ensemble_coeff'}
8
+ Loading weights from local directory
9
+ /home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py:338: FutureWarning: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.
10
+ grad_scaler = GradScaler(enabled=cfg.use_amp)
11
+ Error executing job with overrides: ['policy=act_aloha_real', 'env=aloha_real', 'dataset_repo_id=ccop/aloha_stationary_replay_test_v2', 'resume=true', 'dataset_repo_id=HumanoidTeam/aloha_real_test', 'training.offline_steps=5010']
12
+ Traceback (most recent call last):
13
+ File "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py", line 652, in train_cli
14
+ train(
15
+ File "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py", line 343, in train
16
+ step = logger.load_last_training_state(optimizer, lr_scheduler)
17
+ File "/home/ubuntu/lerobot-hackathon/lerobot/common/logger.py", line 218, in load_last_training_state
18
+ training_state = torch.load(self.last_checkpoint_dir / self.training_state_file_name)
19
+ File "/home/ubuntu/lerobot-hackathon/lerobot/lib/python3.10/site-packages/torch/serialization.py", line 1444, in load
20
+ raise pickle.UnpicklingError(_get_wo_message(str(e))) from None
21
+ _pickle.UnpicklingError: Weights only load failed. This file can still be loaded, to do so you have two options, do those steps only if you trust the source of the checkpoint.
22
+ (1) Re-running `torch.load` with `weights_only` set to `False` will likely succeed, but it can result in arbitrary code execution. Do it only if you got the file from a trusted source.
23
+ (2) Alternatively, to load with `weights_only=True` please check the recommended steps in the following error message.
24
+ WeightsUnpickler error: Unsupported global: GLOBAL numpy.core.multiarray._reconstruct was not an allowed global by default. Please use `torch.serialization.add_safe_globals([_reconstruct])` or the `torch.serialization.safe_globals([_reconstruct])` context manager to allowlist this global if you trust this class/function.
25
+
26
+ Check the documentation of torch.load to learn more about types accepted by default with weights_only https://pytorch.org/docs/stable/generated/torch.load.html.
27
+
28
+ Set the environment variable HYDRA_FULL_ERROR=1 for a complete stack trace.
wandb/run-20241207_010636-bwwpk9vl/files/requirements.txt ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ pymunk==6.9.0
2
+ charset-normalizer==3.4.0
3
+ pip==22.0.2
4
+ multidict==6.1.0
5
+ pytz==2024.2
6
+ pandas==2.2.3
7
+ fasteners==0.19
8
+ einops==0.8.0
9
+ setproctitle==1.3.4
10
+ python-dateutil==2.9.0.post0
11
+ pydantic==2.10.3
12
+ dm-control==1.0.14
13
+ MarkupSafe==3.0.2
14
+ safetensors==0.4.5
15
+ cloudpickle==3.1.0
16
+ imageio-ffmpeg==0.5.1
17
+ smmap==5.0.1
18
+ huggingface-hub==0.26.5
19
+ torch==2.6.0.dev20241112+cu121
20
+ nvidia-cusolver-cu12==11.4.5.107
21
+ inquirerpy==0.3.4
22
+ soupsieve==2.6
23
+ deepdiff==8.0.1
24
+ nvidia-nvjitlink-cu12==12.4.127
25
+ aiosignal==1.3.1
26
+ dm-tree==0.1.8
27
+ aiohappyeyeballs==2.4.4
28
+ propcache==0.2.1
29
+ gym-aloha==0.1.1
30
+ labmaze==1.0.6
31
+ pyav==14.0.1
32
+ nvidia-cuda-cupti-cu12==12.1.105
33
+ cffi==1.17.1
34
+ importlib_metadata==8.5.0
35
+ nvidia-cuda-runtime-cu12==12.1.105
36
+ pycparser==2.22
37
+ h5py==3.12.1
38
+ nvidia-nccl-cu12==2.21.5
39
+ orderly-set==5.2.2
40
+ pyarrow==18.1.0
41
+ Flask==3.1.0
42
+ multiprocess==0.70.16
43
+ blinker==1.9.0
44
+ regex==2024.11.6
45
+ Jinja2==3.1.4
46
+ tqdm==4.67.1
47
+ certifi==2024.8.30
48
+ frozenlist==1.5.0
49
+ attrs==24.2.0
50
+ pytorch-triton==3.1.0+cf34004b8a
51
+ omegaconf==2.3.0
52
+ itsdangerous==2.2.0
53
+ packaging==24.2
54
+ pfzy==0.3.4
55
+ pydantic_core==2.27.1
56
+ antlr4-python3-runtime==4.9.3
57
+ cmake==3.31.1
58
+ imageio==2.36.1
59
+ setuptools==59.6.0
60
+ nvidia-cusparselt-cu12==0.6.2
61
+ zipp==3.21.0
62
+ torchvision==0.20.0.dev20241112+cu121
63
+ nvidia-curand-cu12==10.3.2.106
64
+ PyOpenGL-accelerate==3.1.7
65
+ numpy==1.26.4
66
+ dm-env==1.6
67
+ nvidia-cusparse-cu12==12.1.0.106
68
+ networkx==3.4.2
69
+ triton==3.1.0
70
+ termcolor==2.5.0
71
+ gitdb==4.0.11
72
+ torchaudio==2.5.0.dev20241112+cu121
73
+ glfw==2.8.0
74
+ tzdata==2024.2
75
+ pillow==11.0.0
76
+ idna==3.10
77
+ pyparsing==3.2.0
78
+ typing_extensions==4.12.2
79
+ wcwidth==0.2.13
80
+ sympy==1.13.1
81
+ nvidia-cublas-cu12==12.1.3.1
82
+ zarr==2.18.3
83
+ protobuf==5.29.1
84
+ annotated-types==0.7.0
85
+ xxhash==3.5.0
86
+ aiohttp==3.11.10
87
+ Werkzeug==3.1.3
88
+ mujoco==2.3.7
89
+ gymnasium==0.29.1
90
+ rerun-sdk==0.20.3
91
+ nvidia-cufft-cu12==11.0.2.54
92
+ dill==0.3.8
93
+ scipy==1.14.1
94
+ hydra-core==1.3.2
95
+ fsspec==2024.9.0
96
+ platformdirs==4.3.6
97
+ PySocks==1.7.1
98
+ PyOpenGL==3.1.7
99
+ requests==2.32.3
100
+ lxml==5.3.0
101
+ Farama-Notifications==0.0.4
102
+ nvidia-cuda-nvrtc-cu12==12.1.105
103
+ numba==0.60.0
104
+ docker-pycreds==0.4.0
105
+ six==1.17.0
106
+ lerobot==0.1.0
107
+ nvidia-cudnn-cu12==9.1.0.70
108
+ sentry-sdk==2.19.2
109
+ absl-py==2.1.0
110
+ wandb==0.19.0
111
+ mpmath==1.3.0
112
+ llvmlite==0.43.0
113
+ numcodecs==0.13.1
114
+ GitPython==3.1.43
115
+ nvidia-nvtx-cu12==12.1.105
116
+ prompt_toolkit==3.0.48
117
+ datasets==3.1.0
118
+ opencv-python==4.10.0.84
119
+ filelock==3.16.1
120
+ async-timeout==5.0.1
121
+ diffusers==0.31.0
122
+ yarl==1.18.3
123
+ click==8.1.7
124
+ asciitree==0.3.3
125
+ psutil==6.1.0
126
+ gdown==5.2.0
127
+ PyYAML==6.0.2
128
+ urllib3==2.2.3
129
+ beautifulsoup4==4.12.3
wandb/run-20241207_010636-bwwpk9vl/files/wandb-metadata.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1015-aws-x86_64-with-glibc2.35",
3
+ "python": "CPython 3.10.12",
4
+ "startedAt": "2024-12-07T01:06:36.020217Z",
5
+ "args": [
6
+ "policy=act_aloha_real",
7
+ "env=aloha_real",
8
+ "dataset_repo_id=ccop/aloha_stationary_replay_test_v2",
9
+ "hydra.run.dir=outputs/train/2024-12-06/22-28-29_real_world_act_default",
10
+ "resume=true",
11
+ "dataset_repo_id=HumanoidTeam/aloha_real_test",
12
+ "training.offline_steps=5010"
13
+ ],
14
+ "program": "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py",
15
+ "codePath": "lerobot/scripts/train.py",
16
+ "git": {
17
+ "remote": "[email protected]:HumanoidTeam/lerobot-hackathon.git",
18
+ "commit": "ab8aa3f8e7b6e5486d7af26ccd319d358ffad579"
19
+ },
20
+ "email": "[email protected]",
21
+ "root": "outputs/train/2024-12-06/22-28-29_real_world_act_default",
22
+ "host": "ip-172-31-20-130",
23
+ "username": "humanoidteam",
24
+ "executable": "/home/ubuntu/lerobot-hackathon/lerobot/bin/python",
25
+ "codePathLocal": "lerobot/scripts/train.py",
26
+ "cpu_count": 4,
27
+ "cpu_count_logical": 8,
28
+ "gpu": "Tesla T4",
29
+ "gpu_count": 1,
30
+ "disk": {
31
+ "/": {
32
+ "total": "311993479168",
33
+ "used": "217724030976"
34
+ }
35
+ },
36
+ "memory": {
37
+ "total": "33263837184"
38
+ },
39
+ "cpu": {
40
+ "count": 4,
41
+ "countLogical": 8
42
+ },
43
+ "gpu_nvidia": [
44
+ {
45
+ "name": "Tesla T4",
46
+ "memoryTotal": "16106127360",
47
+ "cudaCores": 2560,
48
+ "architecture": "Turing"
49
+ }
50
+ ],
51
+ "cudaVersion": "12.4"
52
+ }
wandb/run-20241207_010636-bwwpk9vl/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train/num_episodes":48.01,"train/is_online":false,"train/num_epochs":48.01,"_runtime":5488.627260612,"train/dataloading_s":2.211516670999117,"train/loss":0.2502947151660919,"_wandb":{"runtime":5493},"train/l1_loss":0.09762981534004211,"train/lr":1e-05,"train/step":4800,"train/grad_norm":20.83009910583496,"_step":4800,"train/num_samples":38408,"_timestamp":1.7335293805980325e+09,"train/update_s":1.0881254139821976,"train/kld_loss":0.01526648923754692}
wandb/run-20241207_010636-bwwpk9vl/logs/debug-core.log ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-12-07T01:06:35.555739791Z","level":"INFO","msg":"started logging, with flags","port-filename":"/tmp/tmpw4k2sq2e/port-3507304.txt","pid":3507304,"debug":false,"disable-analytics":false}
2
+ {"time":"2024-12-07T01:06:35.555772863Z","level":"INFO","msg":"FeatureState","shutdownOnParentExitEnabled":false}
3
+ {"time":"2024-12-07T01:06:35.559538633Z","level":"INFO","msg":"Will exit if parent process dies.","ppid":3507304}
4
+ {"time":"2024-12-07T01:06:35.559558787Z","level":"INFO","msg":"server is running","addr":{"IP":"127.0.0.1","Port":41501,"Zone":""}}
5
+ {"time":"2024-12-07T01:06:35.744706996Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:49972"}
6
+ {"time":"2024-12-07T01:06:36.021210331Z","level":"INFO","msg":"handleInformInit: received","streamId":"bwwpk9vl","id":"127.0.0.1:49972"}
7
+ {"time":"2024-12-07T01:06:36.124059246Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"bwwpk9vl","id":"127.0.0.1:49972"}
8
+ {"time":"2024-12-07T01:06:41.270283035Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"127.0.0.1:49972"}
9
+ {"time":"2024-12-07T01:06:41.270348753Z","level":"INFO","msg":"server is shutting down"}
10
+ {"time":"2024-12-07T01:06:41.270339778Z","level":"INFO","msg":"connection: Close: initiating connection closure","id":"127.0.0.1:49972"}
11
+ {"time":"2024-12-07T01:06:41.270441093Z","level":"INFO","msg":"connection: Close: connection successfully closed","id":"127.0.0.1:49972"}
12
+ {"time":"2024-12-07T01:06:42.336511877Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"127.0.0.1:49972"}
13
+ {"time":"2024-12-07T01:06:42.336534508Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"127.0.0.1:49972"}
14
+ {"time":"2024-12-07T01:06:42.336548673Z","level":"INFO","msg":"server is closed"}
wandb/run-20241207_010636-bwwpk9vl/logs/debug-internal.log ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-12-07T01:06:36.021365256Z","level":"INFO","msg":"using version","core version":"0.19.0"}
2
+ {"time":"2024-12-07T01:06:36.021379424Z","level":"INFO","msg":"created symlink","path":"outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010636-bwwpk9vl/logs/debug-core.log"}
3
+ {"time":"2024-12-07T01:06:36.124016018Z","level":"INFO","msg":"created new stream","id":"bwwpk9vl"}
4
+ {"time":"2024-12-07T01:06:36.124052183Z","level":"INFO","msg":"stream: started","id":"bwwpk9vl"}
5
+ {"time":"2024-12-07T01:06:36.124086504Z","level":"INFO","msg":"writer: Do: started","stream_id":"bwwpk9vl"}
6
+ {"time":"2024-12-07T01:06:36.124086178Z","level":"INFO","msg":"sender: started","stream_id":"bwwpk9vl"}
7
+ {"time":"2024-12-07T01:06:36.124165775Z","level":"INFO","msg":"handler: started","stream_id":"bwwpk9vl"}
8
+ {"time":"2024-12-07T01:06:36.467542952Z","level":"INFO","msg":"Starting system monitor"}
9
+ {"time":"2024-12-07T01:06:41.27033621Z","level":"INFO","msg":"stream: closing","id":"bwwpk9vl"}
10
+ {"time":"2024-12-07T01:06:41.270379684Z","level":"INFO","msg":"Stopping system monitor"}
11
+ {"time":"2024-12-07T01:06:41.270898953Z","level":"INFO","msg":"Stopped system monitor"}
12
+ {"time":"2024-12-07T01:06:42.191128546Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
13
+ {"time":"2024-12-07T01:06:42.336356796Z","level":"INFO","msg":"handler: closed","stream_id":"bwwpk9vl"}
14
+ {"time":"2024-12-07T01:06:42.336396896Z","level":"INFO","msg":"writer: Close: closed","stream_id":"bwwpk9vl"}
15
+ {"time":"2024-12-07T01:06:42.336425596Z","level":"INFO","msg":"sender: closed","stream_id":"bwwpk9vl"}
16
+ {"time":"2024-12-07T01:06:42.336454571Z","level":"INFO","msg":"stream: closed","id":"bwwpk9vl"}
wandb/run-20241207_010636-bwwpk9vl/logs/debug.log ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Current SDK version is 0.19.0
2
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Configure stats pid to 3507304
3
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/.config/wandb/settings
4
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/lerobot-hackathon/wandb/settings
5
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] Loading settings from environment variables
6
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_setup.py:_flush():68] wandb: Using wandb-core as the SDK backend. Please refer to https://wandb.me/wandb-core for more information.
7
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:_log_setup():528] Logging user logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010636-bwwpk9vl/logs/debug.log
8
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:_log_setup():529] Logging internal logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010636-bwwpk9vl/logs/debug-internal.log
9
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:init():639] calling init triggers
10
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:init():645] wandb.init called with sweep_config: {}
11
+ config: {'resume': True, 'device': 'cuda', 'use_amp': False, 'seed': 1000, 'dataset_repo_id': 'ccop/aloha_stationary_replay_test_v2', 'video_backend': 'pyav', 'training': {'offline_steps': 5000, 'num_workers': 8, 'batch_size': 8, 'eval_freq': -1, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 10000, 'online_steps': 0, 'online_rollout_n_episodes': 1, 'online_rollout_batch_size': 1, 'online_steps_between_rollouts': 1, 'online_sampling_ratio': 0.5, 'online_env_seed': None, 'online_buffer_capacity': None, 'online_buffer_seed_size': 0, 'do_online_rollout_async': False, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'brightness': {'weight': 1, 'min_max': [0.8, 1.2]}, 'contrast': {'weight': 1, 'min_max': [0.8, 1.2]}, 'saturation': {'weight': 1, 'min_max': [0.5, 1.5]}, 'hue': {'weight': 1, 'min_max': [-0.05, 0.05]}, 'sharpness': {'weight': 1, 'min_max': [0.8, 1.2]}}, 'lr': 1e-05, 'lr_backbone': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10, 'delta_timestamps': {'action': [0.0, 0.03333333333333333, 0.06666666666666667, 0.1, 0.13333333333333333, 0.16666666666666666, 0.2, 0.23333333333333334, 0.26666666666666666, 0.3, 0.3333333333333333, 0.36666666666666664, 0.4, 0.43333333333333335, 0.4666666666666667, 0.5, 0.5333333333333333, 0.5666666666666667, 0.6, 0.6333333333333333, 0.6666666666666666, 0.7, 0.7333333333333333, 0.7666666666666667, 0.8, 0.8333333333333334, 0.8666666666666667, 0.9, 0.9333333333333333, 0.9666666666666667, 1.0, 1.0333333333333334, 1.0666666666666667, 1.1, 1.1333333333333333, 1.1666666666666667, 1.2, 1.2333333333333334, 1.2666666666666666, 1.3, 1.3333333333333333, 1.3666666666666667, 1.4, 1.4333333333333333, 1.4666666666666666, 1.5, 1.5333333333333334, 1.5666666666666667, 1.6, 1.6333333333333333, 1.6666666666666667, 1.7, 1.7333333333333334, 1.7666666666666666, 1.8, 1.8333333333333333, 1.8666666666666667, 1.9, 1.9333333333333333, 1.9666666666666666, 2.0, 2.033333333333333, 2.066666666666667, 2.1, 2.1333333333333333, 2.1666666666666665, 2.2, 2.2333333333333334, 2.2666666666666666, 2.3, 2.3333333333333335, 2.3666666666666667, 2.4, 2.433333333333333, 2.466666666666667, 2.5, 2.533333333333333, 2.566666666666667, 2.6, 2.6333333333333333, 2.6666666666666665, 2.7, 2.7333333333333334, 2.7666666666666666, 2.8, 2.8333333333333335, 2.8666666666666667, 2.9, 2.933333333333333, 2.966666666666667, 3.0, 3.033333333333333, 3.066666666666667, 3.1, 3.1333333333333333, 3.1666666666666665, 3.2, 3.2333333333333334, 3.2666666666666666, 3.3]}}, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot_real_aloha', 'notes': 'ws-lerobot-hackathon'}, 'fps': 30, 'env': {'name': 'real_world', 'task': None, 'state_dim': 14, 'action_dim': 14, 'fps': 30}, 'override_dataset_stats': {'observation.images.cam_right_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_left_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_high': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}}, 'policy': {'name': 'act', 'n_obs_steps': 1, 'chunk_size': 100, 'n_action_steps': 100, 'input_shapes': {'observation.images.cam_right_wrist': [3, 480, 640], 'observation.images.cam_left_wrist': [3, 480, 640], 'observation.images.cam_high': [3, 480, 640], 'observation.state': [14]}, 'output_shapes': {'action': [14]}, 'input_normalization_modes': {'observation.images.cam_right_wrist': 'mean_std', 'observation.images.cam_left_wrist': 'mean_std', 'observation.images.cam_high': 'mean_std', 'observation.state': 'mean_std'}, 'output_normalization_modes': {'action': 'mean_std'}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_momentum': None, 'dropout': 0.1, 'kl_weight': 10.0}}
12
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:init():688] starting backend
13
+ 2024-12-07 01:06:36,015 INFO MainThread:3507304 [wandb_init.py:init():692] sending inform_init request
14
+ 2024-12-07 01:06:36,019 INFO MainThread:3507304 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
15
+ 2024-12-07 01:06:36,020 INFO MainThread:3507304 [wandb_init.py:init():705] backend started and connected
16
+ 2024-12-07 01:06:36,022 INFO MainThread:3507304 [wandb_init.py:init():798] updated telemetry
17
+ 2024-12-07 01:06:36,027 INFO MainThread:3507304 [wandb_init.py:init():830] communicating run to backend with 90.0 second timeout
18
+ 2024-12-07 01:06:36,459 INFO MainThread:3507304 [wandb_init.py:init():875] run resumed
19
+ 2024-12-07 01:06:36,463 INFO MainThread:3507304 [wandb_init.py:init():882] starting run threads in backend
20
+ 2024-12-07 01:06:36,579 INFO MainThread:3507304 [wandb_run.py:_console_start():2443] atexit reg
21
+ 2024-12-07 01:06:36,579 INFO MainThread:3507304 [wandb_run.py:_redirect():2293] redirect: wrap_raw
22
+ 2024-12-07 01:06:36,580 INFO MainThread:3507304 [wandb_run.py:_redirect():2358] Wrapping output streams.
23
+ 2024-12-07 01:06:36,580 INFO MainThread:3507304 [wandb_run.py:_redirect():2383] Redirects installed.
24
+ 2024-12-07 01:06:36,581 INFO MainThread:3507304 [wandb_init.py:init():925] run started, returning control to user process
25
+ 2024-12-07 01:06:41,270 WARNING MsgRouterThr:3507304 [router.py:message_loop():75] message_loop has been closed
wandb/run-20241207_010636-bwwpk9vl/run-bwwpk9vl.wandb ADDED
Binary file (10.6 kB). View file
 
wandb/run-20241207_010741-bwwpk9vl/files/config.yaml ADDED
@@ -0,0 +1,296 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.19.0
4
+ m: []
5
+ python_version: 3.10.12
6
+ t:
7
+ "1":
8
+ - 1
9
+ - 41
10
+ - 49
11
+ - 50
12
+ - 51
13
+ - 55
14
+ "2":
15
+ - 1
16
+ - 41
17
+ - 49
18
+ - 50
19
+ - 51
20
+ - 55
21
+ "3":
22
+ - 5
23
+ - 13
24
+ - 14
25
+ - 15
26
+ - 16
27
+ - 23
28
+ - 55
29
+ - 62
30
+ "4": 3.10.12
31
+ "5": 0.19.0
32
+ "8":
33
+ - 5
34
+ "12": 0.19.0
35
+ "13": linux-x86_64
36
+ dataset_repo_id:
37
+ value: ccop/aloha_stationary_replay_test_v2
38
+ device:
39
+ value: cuda
40
+ env:
41
+ value:
42
+ action_dim: 14
43
+ fps: 30
44
+ name: real_world
45
+ state_dim: 14
46
+ task: null
47
+ eval:
48
+ value:
49
+ batch_size: 50
50
+ n_episodes: 50
51
+ use_async_envs: false
52
+ fps:
53
+ value: 30
54
+ override_dataset_stats:
55
+ value:
56
+ observation.images.cam_high:
57
+ mean:
58
+ - - - 0.485
59
+ - - - 0.456
60
+ - - - 0.406
61
+ std:
62
+ - - - 0.229
63
+ - - - 0.224
64
+ - - - 0.225
65
+ observation.images.cam_left_wrist:
66
+ mean:
67
+ - - - 0.485
68
+ - - - 0.456
69
+ - - - 0.406
70
+ std:
71
+ - - - 0.229
72
+ - - - 0.224
73
+ - - - 0.225
74
+ observation.images.cam_right_wrist:
75
+ mean:
76
+ - - - 0.485
77
+ - - - 0.456
78
+ - - - 0.406
79
+ std:
80
+ - - - 0.229
81
+ - - - 0.224
82
+ - - - 0.225
83
+ policy:
84
+ value:
85
+ chunk_size: 100
86
+ dim_feedforward: 3200
87
+ dim_model: 512
88
+ dropout: 0.1
89
+ feedforward_activation: relu
90
+ input_normalization_modes:
91
+ observation.images.cam_high: mean_std
92
+ observation.images.cam_left_wrist: mean_std
93
+ observation.images.cam_right_wrist: mean_std
94
+ observation.state: mean_std
95
+ input_shapes:
96
+ observation.images.cam_high:
97
+ - 3
98
+ - 480
99
+ - 640
100
+ observation.images.cam_left_wrist:
101
+ - 3
102
+ - 480
103
+ - 640
104
+ observation.images.cam_right_wrist:
105
+ - 3
106
+ - 480
107
+ - 640
108
+ observation.state:
109
+ - 14
110
+ kl_weight: 10
111
+ latent_dim: 32
112
+ n_action_steps: 100
113
+ n_decoder_layers: 1
114
+ n_encoder_layers: 4
115
+ n_heads: 8
116
+ n_obs_steps: 1
117
+ n_vae_encoder_layers: 4
118
+ name: act
119
+ output_normalization_modes:
120
+ action: mean_std
121
+ output_shapes:
122
+ action:
123
+ - 14
124
+ pre_norm: false
125
+ pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
126
+ replace_final_stride_with_dilation: false
127
+ temporal_ensemble_momentum: null
128
+ use_vae: true
129
+ vision_backbone: resnet18
130
+ resume:
131
+ value: true
132
+ seed:
133
+ value: 1000
134
+ training:
135
+ value:
136
+ batch_size: 8
137
+ delta_timestamps:
138
+ action:
139
+ - 0
140
+ - 0.03333333333333333
141
+ - 0.06666666666666667
142
+ - 0.1
143
+ - 0.13333333333333333
144
+ - 0.16666666666666666
145
+ - 0.2
146
+ - 0.23333333333333334
147
+ - 0.26666666666666666
148
+ - 0.3
149
+ - 0.3333333333333333
150
+ - 0.36666666666666664
151
+ - 0.4
152
+ - 0.43333333333333335
153
+ - 0.4666666666666667
154
+ - 0.5
155
+ - 0.5333333333333333
156
+ - 0.5666666666666667
157
+ - 0.6
158
+ - 0.6333333333333333
159
+ - 0.6666666666666666
160
+ - 0.7
161
+ - 0.7333333333333333
162
+ - 0.7666666666666667
163
+ - 0.8
164
+ - 0.8333333333333334
165
+ - 0.8666666666666667
166
+ - 0.9
167
+ - 0.9333333333333333
168
+ - 0.9666666666666667
169
+ - 1
170
+ - 1.0333333333333334
171
+ - 1.0666666666666667
172
+ - 1.1
173
+ - 1.1333333333333333
174
+ - 1.1666666666666667
175
+ - 1.2
176
+ - 1.2333333333333334
177
+ - 1.2666666666666666
178
+ - 1.3
179
+ - 1.3333333333333333
180
+ - 1.3666666666666667
181
+ - 1.4
182
+ - 1.4333333333333333
183
+ - 1.4666666666666666
184
+ - 1.5
185
+ - 1.5333333333333334
186
+ - 1.5666666666666667
187
+ - 1.6
188
+ - 1.6333333333333333
189
+ - 1.6666666666666667
190
+ - 1.7
191
+ - 1.7333333333333334
192
+ - 1.7666666666666666
193
+ - 1.8
194
+ - 1.8333333333333333
195
+ - 1.8666666666666667
196
+ - 1.9
197
+ - 1.9333333333333333
198
+ - 1.9666666666666666
199
+ - 2
200
+ - 2.033333333333333
201
+ - 2.066666666666667
202
+ - 2.1
203
+ - 2.1333333333333333
204
+ - 2.1666666666666665
205
+ - 2.2
206
+ - 2.2333333333333334
207
+ - 2.2666666666666666
208
+ - 2.3
209
+ - 2.3333333333333335
210
+ - 2.3666666666666667
211
+ - 2.4
212
+ - 2.433333333333333
213
+ - 2.466666666666667
214
+ - 2.5
215
+ - 2.533333333333333
216
+ - 2.566666666666667
217
+ - 2.6
218
+ - 2.6333333333333333
219
+ - 2.6666666666666665
220
+ - 2.7
221
+ - 2.7333333333333334
222
+ - 2.7666666666666666
223
+ - 2.8
224
+ - 2.8333333333333335
225
+ - 2.8666666666666667
226
+ - 2.9
227
+ - 2.933333333333333
228
+ - 2.966666666666667
229
+ - 3
230
+ - 3.033333333333333
231
+ - 3.066666666666667
232
+ - 3.1
233
+ - 3.1333333333333333
234
+ - 3.1666666666666665
235
+ - 3.2
236
+ - 3.2333333333333334
237
+ - 3.2666666666666666
238
+ - 3.3
239
+ do_online_rollout_async: false
240
+ eval_freq: -1
241
+ grad_clip_norm: 10
242
+ image_transforms:
243
+ brightness:
244
+ min_max:
245
+ - 0.8
246
+ - 1.2
247
+ weight: 1
248
+ contrast:
249
+ min_max:
250
+ - 0.8
251
+ - 1.2
252
+ weight: 1
253
+ enable: false
254
+ hue:
255
+ min_max:
256
+ - -0.05
257
+ - 0.05
258
+ weight: 1
259
+ max_num_transforms: 3
260
+ random_order: false
261
+ saturation:
262
+ min_max:
263
+ - 0.5
264
+ - 1.5
265
+ weight: 1
266
+ sharpness:
267
+ min_max:
268
+ - 0.8
269
+ - 1.2
270
+ weight: 1
271
+ log_freq: 200
272
+ lr: 1e-05
273
+ lr_backbone: 1e-05
274
+ num_workers: 8
275
+ offline_steps: 5000
276
+ online_buffer_capacity: null
277
+ online_buffer_seed_size: 0
278
+ online_env_seed: null
279
+ online_rollout_batch_size: 1
280
+ online_rollout_n_episodes: 1
281
+ online_sampling_ratio: 0.5
282
+ online_steps: 0
283
+ online_steps_between_rollouts: 1
284
+ save_checkpoint: true
285
+ save_freq: 10000
286
+ weight_decay: 0.0001
287
+ use_amp:
288
+ value: false
289
+ video_backend:
290
+ value: pyav
291
+ wandb:
292
+ value:
293
+ disable_artifact: false
294
+ enable: true
295
+ notes: ws-lerobot-hackathon
296
+ project: lerobot_real_aloha
wandb/run-20241207_010741-bwwpk9vl/files/output.log ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Logs will be synced with wandb.
2
+ INFO 2024-12-07 01:07:41 n/logger.py:132 Track this run --> https://wandb.ai/zaringleb/lerobot_real_aloha/runs/bwwpk9vl
3
+ INFO 2024-12-07 01:07:41 ts/train.py:312 make_dataset
4
+ WARNING 2024-12-07 01:07:41 s/factory.py:68 There might be a mismatch between your training dataset (dataset_repo_id='ccop/aloha_stationary_replay_test_v2') and your environment (cfg.env.name='real_world').
5
+ Fetching 9 files: 100%|█████████████████████████████████████████████████████████████████████████████████████████████| 9/9 [00:00<00:00, 70034.76it/s]
6
+ INFO 2024-12-07 01:07:43 ts/train.py:328 make_policy
7
+ WARNING 2024-12-07 01:07:44 s/factory.py:28 Hydra config is missing arguments: {'temporal_ensemble_coeff'}
8
+ Loading weights from local directory
9
+ /home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py:338: FutureWarning: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.
10
+ grad_scaler = GradScaler(enabled=cfg.use_amp)
11
+ Error executing job with overrides: ['resume=true', 'dataset_repo_id=HumanoidTeam/aloha_real_test', 'training.offline_steps=5010']
12
+ Traceback (most recent call last):
13
+ File "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py", line 652, in train_cli
14
+ train(
15
+ File "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py", line 343, in train
16
+ step = logger.load_last_training_state(optimizer, lr_scheduler)
17
+ File "/home/ubuntu/lerobot-hackathon/lerobot/common/logger.py", line 218, in load_last_training_state
18
+ training_state = torch.load(self.last_checkpoint_dir / self.training_state_file_name)
19
+ File "/home/ubuntu/lerobot-hackathon/lerobot/lib/python3.10/site-packages/torch/serialization.py", line 1444, in load
20
+ raise pickle.UnpicklingError(_get_wo_message(str(e))) from None
21
+ _pickle.UnpicklingError: Weights only load failed. This file can still be loaded, to do so you have two options, do those steps only if you trust the source of the checkpoint.
22
+ (1) Re-running `torch.load` with `weights_only` set to `False` will likely succeed, but it can result in arbitrary code execution. Do it only if you got the file from a trusted source.
23
+ (2) Alternatively, to load with `weights_only=True` please check the recommended steps in the following error message.
24
+ WeightsUnpickler error: Unsupported global: GLOBAL numpy.core.multiarray._reconstruct was not an allowed global by default. Please use `torch.serialization.add_safe_globals([_reconstruct])` or the `torch.serialization.safe_globals([_reconstruct])` context manager to allowlist this global if you trust this class/function.
25
+
26
+ Check the documentation of torch.load to learn more about types accepted by default with weights_only https://pytorch.org/docs/stable/generated/torch.load.html.
27
+
28
+ Set the environment variable HYDRA_FULL_ERROR=1 for a complete stack trace.
wandb/run-20241207_010741-bwwpk9vl/files/requirements.txt ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ pymunk==6.9.0
2
+ charset-normalizer==3.4.0
3
+ pip==22.0.2
4
+ multidict==6.1.0
5
+ pytz==2024.2
6
+ pandas==2.2.3
7
+ fasteners==0.19
8
+ einops==0.8.0
9
+ setproctitle==1.3.4
10
+ python-dateutil==2.9.0.post0
11
+ pydantic==2.10.3
12
+ dm-control==1.0.14
13
+ MarkupSafe==3.0.2
14
+ safetensors==0.4.5
15
+ cloudpickle==3.1.0
16
+ imageio-ffmpeg==0.5.1
17
+ smmap==5.0.1
18
+ huggingface-hub==0.26.5
19
+ torch==2.6.0.dev20241112+cu121
20
+ nvidia-cusolver-cu12==11.4.5.107
21
+ inquirerpy==0.3.4
22
+ soupsieve==2.6
23
+ deepdiff==8.0.1
24
+ nvidia-nvjitlink-cu12==12.4.127
25
+ aiosignal==1.3.1
26
+ dm-tree==0.1.8
27
+ aiohappyeyeballs==2.4.4
28
+ propcache==0.2.1
29
+ gym-aloha==0.1.1
30
+ labmaze==1.0.6
31
+ pyav==14.0.1
32
+ nvidia-cuda-cupti-cu12==12.1.105
33
+ cffi==1.17.1
34
+ importlib_metadata==8.5.0
35
+ nvidia-cuda-runtime-cu12==12.1.105
36
+ pycparser==2.22
37
+ h5py==3.12.1
38
+ nvidia-nccl-cu12==2.21.5
39
+ orderly-set==5.2.2
40
+ pyarrow==18.1.0
41
+ Flask==3.1.0
42
+ multiprocess==0.70.16
43
+ blinker==1.9.0
44
+ regex==2024.11.6
45
+ Jinja2==3.1.4
46
+ tqdm==4.67.1
47
+ certifi==2024.8.30
48
+ frozenlist==1.5.0
49
+ attrs==24.2.0
50
+ pytorch-triton==3.1.0+cf34004b8a
51
+ omegaconf==2.3.0
52
+ itsdangerous==2.2.0
53
+ packaging==24.2
54
+ pfzy==0.3.4
55
+ pydantic_core==2.27.1
56
+ antlr4-python3-runtime==4.9.3
57
+ cmake==3.31.1
58
+ imageio==2.36.1
59
+ setuptools==59.6.0
60
+ nvidia-cusparselt-cu12==0.6.2
61
+ zipp==3.21.0
62
+ torchvision==0.20.0.dev20241112+cu121
63
+ nvidia-curand-cu12==10.3.2.106
64
+ PyOpenGL-accelerate==3.1.7
65
+ numpy==1.26.4
66
+ dm-env==1.6
67
+ nvidia-cusparse-cu12==12.1.0.106
68
+ networkx==3.4.2
69
+ triton==3.1.0
70
+ termcolor==2.5.0
71
+ gitdb==4.0.11
72
+ torchaudio==2.5.0.dev20241112+cu121
73
+ glfw==2.8.0
74
+ tzdata==2024.2
75
+ pillow==11.0.0
76
+ idna==3.10
77
+ pyparsing==3.2.0
78
+ typing_extensions==4.12.2
79
+ wcwidth==0.2.13
80
+ sympy==1.13.1
81
+ nvidia-cublas-cu12==12.1.3.1
82
+ zarr==2.18.3
83
+ protobuf==5.29.1
84
+ annotated-types==0.7.0
85
+ xxhash==3.5.0
86
+ aiohttp==3.11.10
87
+ Werkzeug==3.1.3
88
+ mujoco==2.3.7
89
+ gymnasium==0.29.1
90
+ rerun-sdk==0.20.3
91
+ nvidia-cufft-cu12==11.0.2.54
92
+ dill==0.3.8
93
+ scipy==1.14.1
94
+ hydra-core==1.3.2
95
+ fsspec==2024.9.0
96
+ platformdirs==4.3.6
97
+ PySocks==1.7.1
98
+ PyOpenGL==3.1.7
99
+ requests==2.32.3
100
+ lxml==5.3.0
101
+ Farama-Notifications==0.0.4
102
+ nvidia-cuda-nvrtc-cu12==12.1.105
103
+ numba==0.60.0
104
+ docker-pycreds==0.4.0
105
+ six==1.17.0
106
+ lerobot==0.1.0
107
+ nvidia-cudnn-cu12==9.1.0.70
108
+ sentry-sdk==2.19.2
109
+ absl-py==2.1.0
110
+ wandb==0.19.0
111
+ mpmath==1.3.0
112
+ llvmlite==0.43.0
113
+ numcodecs==0.13.1
114
+ GitPython==3.1.43
115
+ nvidia-nvtx-cu12==12.1.105
116
+ prompt_toolkit==3.0.48
117
+ datasets==3.1.0
118
+ opencv-python==4.10.0.84
119
+ filelock==3.16.1
120
+ async-timeout==5.0.1
121
+ diffusers==0.31.0
122
+ yarl==1.18.3
123
+ click==8.1.7
124
+ asciitree==0.3.3
125
+ psutil==6.1.0
126
+ gdown==5.2.0
127
+ PyYAML==6.0.2
128
+ urllib3==2.2.3
129
+ beautifulsoup4==4.12.3
wandb/run-20241207_010741-bwwpk9vl/files/wandb-metadata.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.8.0-1015-aws-x86_64-with-glibc2.35",
3
+ "python": "CPython 3.10.12",
4
+ "startedAt": "2024-12-07T01:07:41.166322Z",
5
+ "args": [
6
+ "hydra.run.dir=outputs/train/2024-12-06/22-28-29_real_world_act_default",
7
+ "resume=true",
8
+ "dataset_repo_id=HumanoidTeam/aloha_real_test",
9
+ "training.offline_steps=5010"
10
+ ],
11
+ "program": "/home/ubuntu/lerobot-hackathon/lerobot/scripts/train.py",
12
+ "codePath": "lerobot/scripts/train.py",
13
+ "git": {
14
+ "remote": "[email protected]:HumanoidTeam/lerobot-hackathon.git",
15
+ "commit": "ab8aa3f8e7b6e5486d7af26ccd319d358ffad579"
16
+ },
17
+ "email": "[email protected]",
18
+ "root": "outputs/train/2024-12-06/22-28-29_real_world_act_default",
19
+ "host": "ip-172-31-20-130",
20
+ "username": "humanoidteam",
21
+ "executable": "/home/ubuntu/lerobot-hackathon/lerobot/bin/python",
22
+ "codePathLocal": "lerobot/scripts/train.py",
23
+ "cpu_count": 4,
24
+ "cpu_count_logical": 8,
25
+ "gpu": "Tesla T4",
26
+ "gpu_count": 1,
27
+ "disk": {
28
+ "/": {
29
+ "total": "311993479168",
30
+ "used": "217724108800"
31
+ }
32
+ },
33
+ "memory": {
34
+ "total": "33263837184"
35
+ },
36
+ "cpu": {
37
+ "count": 4,
38
+ "countLogical": 8
39
+ },
40
+ "gpu_nvidia": [
41
+ {
42
+ "name": "Tesla T4",
43
+ "memoryTotal": "16106127360",
44
+ "cudaCores": 2560,
45
+ "architecture": "Turing"
46
+ }
47
+ ],
48
+ "cudaVersion": "12.4"
49
+ }
wandb/run-20241207_010741-bwwpk9vl/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train/update_s":1.0881254139821976,"train/step":4800,"train/num_episodes":48.01,"train/dataloading_s":2.211516670999117,"train/lr":1e-05,"_step":4800,"train/grad_norm":20.83009910583496,"train/num_epochs":48.01,"_runtime":5488.627260612,"_wandb":{"runtime":5498},"train/is_online":false,"train/kld_loss":0.01526648923754692,"train/l1_loss":0.09762981534004211,"_timestamp":1.7335293805980325e+09,"train/num_samples":38408,"train/loss":0.2502947151660919}
wandb/run-20241207_010741-bwwpk9vl/logs/debug-core.log ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-12-07T01:07:40.734055218Z","level":"INFO","msg":"started logging, with flags","port-filename":"/tmp/tmpnmhdaztf/port-3507456.txt","pid":3507456,"debug":false,"disable-analytics":false}
2
+ {"time":"2024-12-07T01:07:40.734088106Z","level":"INFO","msg":"FeatureState","shutdownOnParentExitEnabled":false}
3
+ {"time":"2024-12-07T01:07:40.737816002Z","level":"INFO","msg":"Will exit if parent process dies.","ppid":3507456}
4
+ {"time":"2024-12-07T01:07:40.737842301Z","level":"INFO","msg":"server is running","addr":{"IP":"127.0.0.1","Port":36119,"Zone":""}}
5
+ {"time":"2024-12-07T01:07:40.923329848Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:47356"}
6
+ {"time":"2024-12-07T01:07:41.167320115Z","level":"INFO","msg":"handleInformInit: received","streamId":"bwwpk9vl","id":"127.0.0.1:47356"}
7
+ {"time":"2024-12-07T01:07:41.270221077Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"bwwpk9vl","id":"127.0.0.1:47356"}
8
+ {"time":"2024-12-07T01:07:46.320004505Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"127.0.0.1:47356"}
9
+ {"time":"2024-12-07T01:07:46.320088721Z","level":"INFO","msg":"server is shutting down"}
10
+ {"time":"2024-12-07T01:07:46.320081333Z","level":"INFO","msg":"connection: Close: initiating connection closure","id":"127.0.0.1:47356"}
11
+ {"time":"2024-12-07T01:07:46.320187736Z","level":"INFO","msg":"connection: Close: connection successfully closed","id":"127.0.0.1:47356"}
12
+ {"time":"2024-12-07T01:07:47.027392524Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"127.0.0.1:47356"}
13
+ {"time":"2024-12-07T01:07:47.027414185Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"127.0.0.1:47356"}
14
+ {"time":"2024-12-07T01:07:47.027425094Z","level":"INFO","msg":"server is closed"}
wandb/run-20241207_010741-bwwpk9vl/logs/debug-internal.log ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-12-07T01:07:41.167467035Z","level":"INFO","msg":"using version","core version":"0.19.0"}
2
+ {"time":"2024-12-07T01:07:41.167480199Z","level":"INFO","msg":"created symlink","path":"outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug-core.log"}
3
+ {"time":"2024-12-07T01:07:41.270189094Z","level":"INFO","msg":"created new stream","id":"bwwpk9vl"}
4
+ {"time":"2024-12-07T01:07:41.270216139Z","level":"INFO","msg":"stream: started","id":"bwwpk9vl"}
5
+ {"time":"2024-12-07T01:07:41.270250461Z","level":"INFO","msg":"writer: Do: started","stream_id":"bwwpk9vl"}
6
+ {"time":"2024-12-07T01:07:41.270250342Z","level":"INFO","msg":"sender: started","stream_id":"bwwpk9vl"}
7
+ {"time":"2024-12-07T01:07:41.270317361Z","level":"INFO","msg":"handler: started","stream_id":"bwwpk9vl"}
8
+ {"time":"2024-12-07T01:07:41.601065068Z","level":"INFO","msg":"Starting system monitor"}
9
+ {"time":"2024-12-07T01:07:46.320070438Z","level":"INFO","msg":"stream: closing","id":"bwwpk9vl"}
10
+ {"time":"2024-12-07T01:07:46.320109578Z","level":"INFO","msg":"Stopping system monitor"}
11
+ {"time":"2024-12-07T01:07:46.320581424Z","level":"INFO","msg":"Stopped system monitor"}
12
+ {"time":"2024-12-07T01:07:46.890807441Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
13
+ {"time":"2024-12-07T01:07:47.027194656Z","level":"INFO","msg":"handler: closed","stream_id":"bwwpk9vl"}
14
+ {"time":"2024-12-07T01:07:47.027227034Z","level":"INFO","msg":"sender: closed","stream_id":"bwwpk9vl"}
15
+ {"time":"2024-12-07T01:07:47.027228216Z","level":"INFO","msg":"writer: Close: closed","stream_id":"bwwpk9vl"}
16
+ {"time":"2024-12-07T01:07:47.027338658Z","level":"INFO","msg":"stream: closed","id":"bwwpk9vl"}
wandb/run-20241207_010741-bwwpk9vl/logs/debug.log ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Current SDK version is 0.19.0
2
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Configure stats pid to 3507456
3
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/.config/wandb/settings
4
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from /home/ubuntu/lerobot-hackathon/wandb/settings
5
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] Loading settings from environment variables
6
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_setup.py:_flush():68] wandb: Using wandb-core as the SDK backend. Please refer to https://wandb.me/wandb-core for more information.
7
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:_log_setup():528] Logging user logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug.log
8
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:_log_setup():529] Logging internal logs to outputs/train/2024-12-06/22-28-29_real_world_act_default/wandb/run-20241207_010741-bwwpk9vl/logs/debug-internal.log
9
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():639] calling init triggers
10
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():645] wandb.init called with sweep_config: {}
11
+ config: {'resume': True, 'device': 'cuda', 'use_amp': False, 'seed': 1000, 'dataset_repo_id': 'ccop/aloha_stationary_replay_test_v2', 'video_backend': 'pyav', 'training': {'offline_steps': 5000, 'num_workers': 8, 'batch_size': 8, 'eval_freq': -1, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 10000, 'online_steps': 0, 'online_rollout_n_episodes': 1, 'online_rollout_batch_size': 1, 'online_steps_between_rollouts': 1, 'online_sampling_ratio': 0.5, 'online_env_seed': None, 'online_buffer_capacity': None, 'online_buffer_seed_size': 0, 'do_online_rollout_async': False, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'brightness': {'weight': 1, 'min_max': [0.8, 1.2]}, 'contrast': {'weight': 1, 'min_max': [0.8, 1.2]}, 'saturation': {'weight': 1, 'min_max': [0.5, 1.5]}, 'hue': {'weight': 1, 'min_max': [-0.05, 0.05]}, 'sharpness': {'weight': 1, 'min_max': [0.8, 1.2]}}, 'lr': 1e-05, 'lr_backbone': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10, 'delta_timestamps': {'action': [0.0, 0.03333333333333333, 0.06666666666666667, 0.1, 0.13333333333333333, 0.16666666666666666, 0.2, 0.23333333333333334, 0.26666666666666666, 0.3, 0.3333333333333333, 0.36666666666666664, 0.4, 0.43333333333333335, 0.4666666666666667, 0.5, 0.5333333333333333, 0.5666666666666667, 0.6, 0.6333333333333333, 0.6666666666666666, 0.7, 0.7333333333333333, 0.7666666666666667, 0.8, 0.8333333333333334, 0.8666666666666667, 0.9, 0.9333333333333333, 0.9666666666666667, 1.0, 1.0333333333333334, 1.0666666666666667, 1.1, 1.1333333333333333, 1.1666666666666667, 1.2, 1.2333333333333334, 1.2666666666666666, 1.3, 1.3333333333333333, 1.3666666666666667, 1.4, 1.4333333333333333, 1.4666666666666666, 1.5, 1.5333333333333334, 1.5666666666666667, 1.6, 1.6333333333333333, 1.6666666666666667, 1.7, 1.7333333333333334, 1.7666666666666666, 1.8, 1.8333333333333333, 1.8666666666666667, 1.9, 1.9333333333333333, 1.9666666666666666, 2.0, 2.033333333333333, 2.066666666666667, 2.1, 2.1333333333333333, 2.1666666666666665, 2.2, 2.2333333333333334, 2.2666666666666666, 2.3, 2.3333333333333335, 2.3666666666666667, 2.4, 2.433333333333333, 2.466666666666667, 2.5, 2.533333333333333, 2.566666666666667, 2.6, 2.6333333333333333, 2.6666666666666665, 2.7, 2.7333333333333334, 2.7666666666666666, 2.8, 2.8333333333333335, 2.8666666666666667, 2.9, 2.933333333333333, 2.966666666666667, 3.0, 3.033333333333333, 3.066666666666667, 3.1, 3.1333333333333333, 3.1666666666666665, 3.2, 3.2333333333333334, 3.2666666666666666, 3.3]}}, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot_real_aloha', 'notes': 'ws-lerobot-hackathon'}, 'fps': 30, 'env': {'name': 'real_world', 'task': None, 'state_dim': 14, 'action_dim': 14, 'fps': 30}, 'override_dataset_stats': {'observation.images.cam_right_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_left_wrist': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}, 'observation.images.cam_high': {'mean': [[[0.485]], [[0.456]], [[0.406]]], 'std': [[[0.229]], [[0.224]], [[0.225]]]}}, 'policy': {'name': 'act', 'n_obs_steps': 1, 'chunk_size': 100, 'n_action_steps': 100, 'input_shapes': {'observation.images.cam_right_wrist': [3, 480, 640], 'observation.images.cam_left_wrist': [3, 480, 640], 'observation.images.cam_high': [3, 480, 640], 'observation.state': [14]}, 'output_shapes': {'action': [14]}, 'input_normalization_modes': {'observation.images.cam_right_wrist': 'mean_std', 'observation.images.cam_left_wrist': 'mean_std', 'observation.images.cam_high': 'mean_std', 'observation.state': 'mean_std'}, 'output_normalization_modes': {'action': 'mean_std'}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_momentum': None, 'dropout': 0.1, 'kl_weight': 10.0}}
12
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():688] starting backend
13
+ 2024-12-07 01:07:41,161 INFO MainThread:3507456 [wandb_init.py:init():692] sending inform_init request
14
+ 2024-12-07 01:07:41,165 INFO MainThread:3507456 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
15
+ 2024-12-07 01:07:41,166 INFO MainThread:3507456 [wandb_init.py:init():705] backend started and connected
16
+ 2024-12-07 01:07:41,168 INFO MainThread:3507456 [wandb_init.py:init():798] updated telemetry
17
+ 2024-12-07 01:07:41,174 INFO MainThread:3507456 [wandb_init.py:init():830] communicating run to backend with 90.0 second timeout
18
+ 2024-12-07 01:07:41,592 INFO MainThread:3507456 [wandb_init.py:init():875] run resumed
19
+ 2024-12-07 01:07:41,597 INFO MainThread:3507456 [wandb_init.py:init():882] starting run threads in backend
20
+ 2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_console_start():2443] atexit reg
21
+ 2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2293] redirect: wrap_raw
22
+ 2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2358] Wrapping output streams.
23
+ 2024-12-07 01:07:41,711 INFO MainThread:3507456 [wandb_run.py:_redirect():2383] Redirects installed.
24
+ 2024-12-07 01:07:41,713 INFO MainThread:3507456 [wandb_init.py:init():925] run started, returning control to user process
25
+ 2024-12-07 01:07:46,320 WARNING MsgRouterThr:3507456 [router.py:message_loop():75] message_loop has been closed
wandb/run-20241207_010741-bwwpk9vl/run-bwwpk9vl.wandb ADDED
Binary file (10.5 kB). View file