Zkli committed on
Commit
07ffde3
·
verified ·
1 Parent(s): 1952ac8

Upload args.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. args.yaml +168 -0
args.yaml ADDED
@@ -0,0 +1,168 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ M: 4
2
+ N: 2
3
+ aa: rand-m8-inc1-mstd101
4
+ amp: true
5
+ amp_dtype: float16
6
+ amp_impl: native
7
+ aug_repeats: 0
8
+ aug_splits: 0
9
+ batch_size: 128
10
+ bce_loss: false
11
+ bce_pos_weight: null
12
+ bce_sum: false
13
+ bce_target_thresh: null
14
+ bn_eps: null
15
+ bn_momentum: null
16
+ channels_last: false
17
+ checkpoint_hist: 10
18
+ class_map: ''
19
+ clip_grad: 2.0
20
+ clip_mode: norm
21
+ color_jitter: 0.4
22
+ color_jitter_prob: null
23
+ cooldown_epochs: 0
24
+ crop_pct: 0.9
25
+ cutmix: 1.0
26
+ cutmix_minmax: null
27
+ data: null
28
+ data_dir: data/imagenet
29
+ dataset: ''
30
+ dataset_download: false
31
+ decay_epochs: 90
32
+ decay_milestones:
33
+ - 90
34
+ - 180
35
+ - 270
36
+ decay_rate: 0.1
37
+ device: cuda
38
+ device_modules: null
39
+ dist_bn: reduce
40
+ drop: 0.0
41
+ drop_block: null
42
+ drop_connect: null
43
+ drop_path: 0.1
44
+ epoch_repeats: 0.0
45
+ epochs: 20
46
+ eval_metric: top1
47
+ experiment: MaskLLM-4V
48
+ fast_norm: false
49
+ finetune_classifier: false
50
+ fuser: ''
51
+ gaussian_blur_prob: null
52
+ gp: null
53
+ grad_accum_steps: 1
54
+ grad_checkpointing: false
55
+ grayscale_prob: null
56
+ hard: false
57
+ head_init_bias: null
58
+ head_init_scale: null
59
+ hflip: 0.5
60
+ img_size: null
61
+ in_chans: null
62
+ initial_checkpoint: ''
63
+ input_img_mode: null
64
+ input_key: null
65
+ input_size: null
66
+ interpolation: ''
67
+ jsd_loss: false
68
+ layer_decay: null
69
+ local_rank: 0
70
+ log_interval: 50
71
+ log_wandb: false
72
+ lr: 0.1
73
+ lr_base: 0.1
74
+ lr_base_scale: ''
75
+ lr_base_size: 256
76
+ lr_cycle_decay: 0.5
77
+ lr_cycle_limit: 1
78
+ lr_cycle_mul: 1.0
79
+ lr_k_decay: 1.0
80
+ lr_noise: null
81
+ lr_noise_pct: 0.67
82
+ lr_noise_std: 1.0
83
+ mask_only: true
84
+ mean:
85
+ - 0.5
86
+ - 0.5
87
+ - 0.5
88
+ min_lr: 1.0e-05
89
+ mixup: 0.8
90
+ mixup_mode: batch
91
+ mixup_off_epoch: 0
92
+ mixup_prob: 1.0
93
+ mixup_switch_prob: 0.5
94
+ model: vit_base_patch16_224.augreg_in1k
95
+ model_ema: false
96
+ model_ema_decay: 0.9998
97
+ model_ema_force_cpu: false
98
+ model_ema_warmup: false
99
+ model_kwargs: {}
100
+ momentum: 0.9
101
+ no_aug: false
102
+ no_ddp_bb: false
103
+ no_prefetcher: false
104
+ no_resume_opt: false
105
+ num_classes: null
106
+ opt: adamw
107
+ opt_betas: null
108
+ opt_eps: null
109
+ opt_kwargs: {}
110
+ output: output/lpermutation_vit_base_patch16_224.augreg_in1k_group_auxloss_biglr_less_iter
111
+ patience_epochs: 10
112
+ pin_mem: false
113
+ pretrained: true
114
+ pretrained_path: null
115
+ prior_strength: 3.0
116
+ ratio:
117
+ - 0.75
118
+ - 1.3333333333333333
119
+ recount: 1
120
+ recovery_interval: 0
121
+ remode: pixel
122
+ reprob: 0.3
123
+ resplit: false
124
+ resume: ''
125
+ save_images: false
126
+ scale:
127
+ - 0.08
128
+ - 1.0
129
+ scaling_range:
130
+ - 10.0
131
+ - 100.0
132
+ sched: cosine
133
+ sched_on_updates: false
134
+ seed: 42
135
+ smoothing: 0.1
136
+ sparse_checkpoint: null
137
+ sparse_weight_reg: 1.0e-05
138
+ sparsity_mode: permutation
139
+ split_bn: false
140
+ start_epoch: null
141
+ std:
142
+ - 0.5
143
+ - 0.5
144
+ - 0.5
145
+ sync_bn: false
146
+ synchronize_step: false
147
+ target_key: null
148
+ tau_range:
149
+ - 4.0
150
+ - 0.05
151
+ torchcompile: null
152
+ torchscript: false
153
+ train_crop_mode: null
154
+ train_interpolation: random
155
+ train_num_samples: null
156
+ train_split: train
157
+ tta: 0
158
+ use_multi_epochs_loader: false
159
+ val_num_samples: null
160
+ val_split: validation
161
+ validation_batch_size: null
162
+ vflip: 0.0
163
+ warmup_epochs: 0
164
+ warmup_lr: 1.0e-05
165
+ warmup_prefix: false
166
+ weight_decay: 0.01
167
+ worker_seeding: all
168
+ workers: 4