LouisLi committed on
Commit
4bba054
·
verified ·
1 Parent(s): 590bb1e

Upload 7 files

Browse files
configs/instant-mesh-base.yaml ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_config:
2
+ target: src.models.lrm_mesh.InstantMesh
3
+ params:
4
+ encoder_feat_dim: 768
5
+ encoder_freeze: false
6
+ encoder_model_name: facebook/dino-vitb16
7
+ transformer_dim: 1024
8
+ transformer_layers: 12
9
+ transformer_heads: 16
10
+ triplane_low_res: 32
11
+ triplane_high_res: 64
12
+ triplane_dim: 40
13
+ rendering_samples_per_ray: 96
14
+ grid_res: 128
15
+ grid_scale: 2.1
16
+
17
+
18
+ infer_config:
19
+ unet_path: ckpts/diffusion_pytorch_model.bin
20
+ model_path: ckpts/instant_mesh_base.ckpt
21
+ texture_resolution: 1024
22
+ render_resolution: 512
configs/instant-mesh-large-train.yaml ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ base_learning_rate: 4.0e-05
3
+ target: src.model_mesh.MVRecon
4
+ params:
5
+ init_ckpt: logs/instant-nerf-large-train/checkpoints/last.ckpt
6
+ input_size: 320
7
+ render_size: 512
8
+
9
+ lrm_generator_config:
10
+ target: src.models.lrm_mesh.InstantMesh
11
+ params:
12
+ encoder_feat_dim: 768
13
+ encoder_freeze: false
14
+ encoder_model_name: facebook/dino-vitb16
15
+ transformer_dim: 1024
16
+ transformer_layers: 16
17
+ transformer_heads: 16
18
+ triplane_low_res: 32
19
+ triplane_high_res: 64
20
+ triplane_dim: 80
21
+ rendering_samples_per_ray: 128
22
+ grid_res: 128
23
+ grid_scale: 2.1
24
+
25
+
26
+ data:
27
+ target: src.data.objaverse.DataModuleFromConfig
28
+ params:
29
+ batch_size: 2
30
+ num_workers: 8
31
+ train:
32
+ target: src.data.objaverse.ObjaverseData
33
+ params:
34
+ root_dir: data/objaverse
35
+ meta_fname: filtered_obj_name.json
36
+ input_image_dir: rendering_random_32views
37
+ target_image_dir: rendering_random_32views
38
+ input_view_num: 6
39
+ target_view_num: 4
40
+ total_view_n: 32
41
+ fov: 50
42
+ camera_rotation: true
43
+ validation: false
44
+ validation:
45
+ target: src.data.objaverse.ValidationData
46
+ params:
47
+ root_dir: data/valid_samples
48
+ input_view_num: 6
49
+ input_image_size: 320
50
+ fov: 30
51
+
52
+
53
+ lightning:
54
+ modelcheckpoint:
55
+ params:
56
+ every_n_train_steps: 2000
57
+ save_top_k: -1
58
+ save_last: true
59
+ callbacks: {}
60
+
61
+ trainer:
62
+ benchmark: true
63
+ max_epochs: -1
64
+ val_check_interval: 1000
65
+ num_sanity_val_steps: 0
66
+ accumulate_grad_batches: 1
67
+ check_val_every_n_epoch: null # if this is not set, validation does not run
configs/instant-mesh-large.yaml ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_config:
2
+ target: src.models.lrm_mesh.InstantMesh
3
+ params:
4
+ encoder_feat_dim: 768
5
+ encoder_freeze: false
6
+ encoder_model_name: facebook/dino-vitb16
7
+ transformer_dim: 1024
8
+ transformer_layers: 16
9
+ transformer_heads: 16
10
+ triplane_low_res: 32
11
+ triplane_high_res: 64
12
+ triplane_dim: 80
13
+ rendering_samples_per_ray: 128
14
+ grid_res: 128
15
+ grid_scale: 2.1
16
+
17
+
18
+ infer_config:
19
+ unet_path: ckpts/diffusion_pytorch_model.bin
20
+ model_path: ckpts/instant_mesh_large.ckpt
21
+ texture_resolution: 1024
22
+ render_resolution: 512
configs/instant-nerf-base.yaml ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_config:
2
+ target: src.models.lrm.InstantNeRF
3
+ params:
4
+ encoder_feat_dim: 768
5
+ encoder_freeze: false
6
+ encoder_model_name: facebook/dino-vitb16
7
+ transformer_dim: 1024
8
+ transformer_layers: 12
9
+ transformer_heads: 16
10
+ triplane_low_res: 32
11
+ triplane_high_res: 64
12
+ triplane_dim: 40
13
+ rendering_samples_per_ray: 96
14
+
15
+
16
+ infer_config:
17
+ unet_path: ckpts/diffusion_pytorch_model.bin
18
+ model_path: ckpts/instant_nerf_base.ckpt
19
+ mesh_threshold: 10.0
20
+ mesh_resolution: 256
21
+ render_resolution: 384
configs/instant-nerf-large-train.yaml ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ base_learning_rate: 4.0e-04
3
+ target: src.model.MVRecon
4
+ params:
5
+ input_size: 320
6
+ render_size: 192
7
+
8
+ lrm_generator_config:
9
+ target: src.models.lrm.InstantNeRF
10
+ params:
11
+ encoder_feat_dim: 768
12
+ encoder_freeze: false
13
+ encoder_model_name: facebook/dino-vitb16
14
+ transformer_dim: 1024
15
+ transformer_layers: 16
16
+ transformer_heads: 16
17
+ triplane_low_res: 32
18
+ triplane_high_res: 64
19
+ triplane_dim: 80
20
+ rendering_samples_per_ray: 128
21
+
22
+
23
+ data:
24
+ target: src.data.objaverse.DataModuleFromConfig
25
+ params:
26
+ batch_size: 2
27
+ num_workers: 8
28
+ train:
29
+ target: src.data.objaverse.ObjaverseData
30
+ params:
31
+ root_dir: data/objaverse
32
+ meta_fname: filtered_obj_name.json
33
+ input_image_dir: rendering_random_32views
34
+ target_image_dir: rendering_random_32views
35
+ input_view_num: 6
36
+ target_view_num: 4
37
+ total_view_n: 32
38
+ fov: 50
39
+ camera_rotation: true
40
+ validation: false
41
+ validation:
42
+ target: src.data.objaverse.ValidationData
43
+ params:
44
+ root_dir: data/valid_samples
45
+ input_view_num: 6
46
+ input_image_size: 320
47
+ fov: 30
48
+
49
+
50
+ lightning:
51
+ modelcheckpoint:
52
+ params:
53
+ every_n_train_steps: 1000
54
+ save_top_k: -1
55
+ save_last: true
56
+ callbacks: {}
57
+
58
+ trainer:
59
+ benchmark: true
60
+ max_epochs: -1
61
+ gradient_clip_val: 1.0
62
+ val_check_interval: 1000
63
+ num_sanity_val_steps: 0
64
+ accumulate_grad_batches: 1
65
+ check_val_every_n_epoch: null # if this is not set, validation does not run
configs/instant-nerf-large.yaml ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model_config:
2
+ target: src.models.lrm.InstantNeRF
3
+ params:
4
+ encoder_feat_dim: 768
5
+ encoder_freeze: false
6
+ encoder_model_name: facebook/dino-vitb16
7
+ transformer_dim: 1024
8
+ transformer_layers: 16
9
+ transformer_heads: 16
10
+ triplane_low_res: 32
11
+ triplane_high_res: 64
12
+ triplane_dim: 80
13
+ rendering_samples_per_ray: 128
14
+
15
+
16
+ infer_config:
17
+ unet_path: ckpts/diffusion_pytorch_model.bin
18
+ model_path: ckpts/instant_nerf_large.ckpt
19
+ mesh_threshold: 10.0
20
+ mesh_resolution: 256
21
+ render_resolution: 384
configs/zero123plus-finetune.yaml ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ base_learning_rate: 1.0e-05
3
+ target: zero123plus.model.MVDiffusion
4
+ params:
5
+ drop_cond_prob: 0.1
6
+
7
+ stable_diffusion_config:
8
+ pretrained_model_name_or_path: sudo-ai/zero123plus-v1.2
9
+ custom_pipeline: ./zero123plus
10
+
11
+ data:
12
+ target: src.data.objaverse_zero123plus.DataModuleFromConfig
13
+ params:
14
+ batch_size: 6
15
+ num_workers: 8
16
+ train:
17
+ target: src.data.objaverse_zero123plus.ObjaverseData
18
+ params:
19
+ root_dir: data/objaverse
20
+ meta_fname: lvis-annotations.json
21
+ image_dir: rendering_zero123plus
22
+ validation: false
23
+ validation:
24
+ target: src.data.objaverse_zero123plus.ObjaverseData
25
+ params:
26
+ root_dir: data/objaverse
27
+ meta_fname: lvis-annotations.json
28
+ image_dir: rendering_zero123plus
29
+ validation: true
30
+
31
+
32
+ lightning:
33
+ modelcheckpoint:
34
+ params:
35
+ every_n_train_steps: 1000
36
+ save_top_k: -1
37
+ save_last: true
38
+ callbacks: {}
39
+
40
+ trainer:
41
+ benchmark: true
42
+ max_epochs: -1
43
+ gradient_clip_val: 1.0
44
+ val_check_interval: 1000
45
+ num_sanity_val_steps: 0
46
+ accumulate_grad_batches: 1
47
+ check_val_every_n_epoch: null # if this is not set, validation does not run