forked from affjljoo3581/deit3-jax
-
Notifications
You must be signed in to change notification settings - Fork 0
/
deit-b16-224-in1k-300ep.sh
49 lines (49 loc) · 1.39 KB
/
deit-b16-224-in1k-300ep.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
# Launches src/main.py with the hyperparameters of this run. The run name
# passed to --name is this script's file name without the .sh suffix.
#
# Required environment:
#   GCS_MODEL_DIR    value passed to --output-dir
#   GCS_DATASET_DIR  prefix of the imagenet-1k-wds shard paths

# Fail fast: an unset/empty variable would otherwise drop an argument (so the
# next flag is consumed as its value) or produce a path rooted at "/".
: "${GCS_MODEL_DIR:?GCS_MODEL_DIR must be set}"
: "${GCS_DATASET_DIR:?GCS_DATASET_DIR must be set}"

# Single source of truth for the values the step counts are derived from.
# NOTE(review): 1281167 is presumably the ImageNet-1k train set size - confirm.
train_samples=1281167
train_batch_size=1024

# Resolved up front and passed quoted below, so an empty result (e.g. curl
# without network access) is still passed as one (empty) argument instead of
# disappearing from the command line.
run_name=$(basename -- "$0" .sh)
ipaddr=$(curl -s ifconfig.me)
host=$(hostname)

# The {0000..1023} / {00..63} patterns sit inside double quotes, so the shell
# does NOT brace-expand them; they reach src/main.py verbatim (presumably the
# data loader expands them itself - confirm against src/main.py).
#
# Step counts use integer arithmetic: train_samples * k / train_batch_size.
python3 src/main.py \
  --output-dir "$GCS_MODEL_DIR" \
  --train-dataset-shards "$GCS_DATASET_DIR/imagenet-1k-wds/imagenet1k-train-{0000..1023}.tar" \
  --valid-dataset-shards "$GCS_DATASET_DIR/imagenet-1k-wds/imagenet1k-validation-{00..63}.tar" \
  --train-batch-size "$train_batch_size" \
  --valid-batch-size 512 \
  --train-loader-workers 40 \
  --valid-loader-workers 10 \
  --random-crop rrc \
  --color-jitter 0.0 \
  --auto-augment rand-m9-mstd0.5-inc1 \
  --random-erasing 0.25 \
  --augment-repeats 3 \
  --test-crop-ratio 0.875 \
  --mixup 0.8 \
  --cutmix 1.0 \
  --criterion ce \
  --label-smoothing 0.1 \
  --layers 12 \
  --dim 768 \
  --heads 12 \
  --labels 1000 \
  --patch-size 16 \
  --image-size 224 \
  --posemb learnable \
  --pooling cls \
  --dropout 0.0 \
  --droppath 0.05 \
  --init-seed 1 \
  --mixup-seed 1 \
  --dropout-seed 1 \
  --shuffle-seed 1 \
  --optimizer adamw \
  --learning-rate 0.001 \
  --weight-decay 0.05 \
  --adam-b1 0.9 \
  --adam-b2 0.999 \
  --adam-eps 1e-8 \
  --lr-decay 1.0 \
  --clip-grad 0.0 \
  --grad-accum 1 \
  --warmup-steps "$((train_samples * 5 / train_batch_size))" \
  --training-steps "$((train_samples * 300 / train_batch_size))" \
  --log-interval 100 \
  --eval-interval "$((train_samples * 1 / train_batch_size))" \
  --project deit3-jax \
  --name "$run_name" \
  --ipaddr "$ipaddr" \
  --hostname "$host"