# divide.yml
# NOTE(review): text that preceded the configuration here (web-page navigation
# residue and a 1-90 line-number gutter) was not YAML and has been removed.
# Run configuration named "DOVER": run-level settings, two dataset entries
# (val-dividemaxwell / train-dividemaxwell), a model spec, optimizer settings,
# and a checkpoint path.
#
# NOTE(review): the nesting in this file was reconstructed from a copy in which
# all indentation had been stripped (every key at column 0, which leaves keys
# such as `type`, `args`, `clip_len`, and `num_clips` duplicated at one level).
# The hierarchy follows key order and the parallel layout of the two dataset
# entries -- confirm against the code that loads this file.

# --- Run-level settings ------------------------------------------------------
name: DOVER
num_epochs: 20
l_num_epochs: 10
# Fractional value is intentional in the original (2.5, not an integer).
warmup_epochs: 2.5
ema: true
save_model: true
batch_size: 16
num_workers: 8
split_seed: 42

wandb:
  project_name: DOVER

# --- Datasets ----------------------------------------------------------------
# Each entry names a dataset `type` and an `args` mapping. Both entries point
# at the same `data_prefix` and differ in annotation file, `phase`, `weight`,
# and the technical `num_clips` (3 for val, 1 for train).
data:
  val-dividemaxwell:
    type: ViewDecompositionDataset
    args:
      weight: 0.572
      phase: test
      anno_file: ./examplar_data_labels/DIVIDE_MaxWell/val_labels.txt
      data_prefix: ../datasets/DIVIDE_MaxWell/videos/
      # One sub-mapping per view; the view names match the keys used under
      # model.args.backbone and in model.args.backbone_preserve_keys.
      sample_types:
        technical:
          fragments_h: 7
          fragments_w: 7
          fsize_h: 32
          fsize_w: 32
          aligned: 32
          clip_len: 32
          frame_interval: 2
          num_clips: 3
        aesthetic:
          size_h: 224
          size_w: 224
          clip_len: 32
          frame_interval: 2
          t_frag: 32
          num_clips: 1

  train-dividemaxwell:
    type: ViewDecompositionDataset
    args:
      weight: 0.598
      phase: train
      # Canonical lowercase boolean (was `True`); loads to the same value.
      fully_supervised: true
      anno_file: ./examplar_data_labels/DIVIDE_MaxWell/train_labels.txt
      data_prefix: ../datasets/DIVIDE_MaxWell/videos/
      sample_types:
        technical:
          fragments_h: 7
          fragments_w: 7
          fsize_h: 32
          fsize_w: 32
          aligned: 32
          clip_len: 32
          frame_interval: 2
          num_clips: 1
        aesthetic:
          size_h: 224
          size_w: 224
          clip_len: 32
          frame_interval: 2
          t_frag: 32
          num_clips: 1

# --- Model -------------------------------------------------------------------
model:
  type: DOVER
  args:
    backbone:
      technical:
        type: swin_tiny_grpb
        checkpoint: true
        # Was a bare `pretrained:` (already null in YAML); written explicitly
        # so the empty value is clearly intentional.
        pretrained: null
      aesthetic:
        type: conv_tiny
    # A single comma-separated string, not a YAML list.
    # NOTE(review): placement of the next three keys under `args` (rather than
    # under `backbone`) is inferred -- confirm against the model constructor.
    backbone_preserve_keys: technical,aesthetic
    divide_head: true
    vqa_head:
      in_channels: 768
      hidden_channels: 64

# --- Optimizer ---------------------------------------------------------------
optimizer:
  # The explicit `!!float` tags are kept from the original: some YAML 1.1
  # loaders (e.g. PyYAML) resolve a bare `1e-3` without a decimal point as a
  # string rather than a float.
  lr: !!float 1e-3
  backbone_lr_mult: !!float 1e-1
  wd: 0.05

# --- Checkpoint --------------------------------------------------------------
# Relative path; resolved against whatever working directory the consumer uses.
test_load_path: ./pretrained_weights/DOVER.pth