Upload lpermute_vit_base_patch16_224.augreg_in1k_group_auxloss_biglr_less_iter.sh with huggingface_hub
Browse files
lpermute_vit_base_patch16_224.augreg_in1k_group_auxloss_biglr_less_iter.sh
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Launch script: runs timm_permutation_train_group_auxloss_less_iters.py under
# torchrun on a single node with two worker processes.
#
# Both the training-script path and the --output path are relative, so run
# this from the directory that contains the training script.
#
# NOTE(review): the --output directory is prefixed "lpermutation_" while this
# script's file name is prefixed "lpermute_" -- confirm the difference is
# intentional.

# Expose HIP devices 0 and 1 to the job; keep the number of devices listed
# here in sync with --nproc_per_node below.
export HIP_VISIBLE_DEVICES=0,1

# One flag group per line. Every line except the last ends with a backslash
# continuation; the last line must NOT, otherwise a stray backslash (or any
# line appended later) would be folded into the argument list.
torchrun --nnodes=1 --nproc_per_node=2 --master_port 23419 timm_permutation_train_group_auxloss_less_iters.py \
  --model vit_base_patch16_224.augreg_in1k \
  --pretrained \
  --sparsity-mode permutation \
  --mask-only \
  -b 128 \
  --opt adamw \
  --lr 1e-1 \
  --weight-decay 0.01 \
  --epochs 20 \
  --warmup-epochs 0 \
  --mixup 0.8 \
  --cutmix 1.0 \
  --sched cosine \
  --smoothing 0.1 \
  --drop-path 0.1 \
  --aa rand-m8-inc1-mstd101 \
  --remode pixel --reprob 0.3 \
  --amp \
  --crop-pct 0.9 \
  --mean 0.5 0.5 0.5 \
  --std 0.5 0.5 0.5 \
  --output output/lpermutation_vit_base_patch16_224.augreg_in1k_group_auxloss_biglr_less_iter \
  --scaling-range 1e1 1e2 \
  --tau-range 4 0.05 \
  --sparse-weight-reg 1e-5 \
  --clip-grad 2.0 \
  --min-lr 1e-5 \
  --model-ema-decay 0.9998 \
  --prior-strength 3
|