# ctrl_trainval_tasks.yml
# Forked from e-bug/volta.
# TASK1 (task_id 1) — VQA, type VL-classifier with 3129 labels.
# Settings are nested under the task key so that each task keeps its own
# values instead of colliding with the other tasks at the top level.
TASK1:
  name: VQA
  type: VL-classifier
  num_labels: 3129
  # NOTE(review): spelled without the "s" of torch's BCEWithLogitsLoss —
  # presumably a lookup key in the consumer; confirm before renaming.
  loss: BCEWithLogitLoss
  process: normal
  task_id: 1
  dataroot: datasets/vqa/annotations
  features_h5path1: datasets/mscoco/resnet101_faster_rcnn_genome_imgfeats/volta/trainval_feat.lmdb
  # Explicit empty strings (not null): no second feature file and no
  # annotation files are configured for this task.
  features_h5path2: ''
  train_annotations_jsonpath: ''
  val_annotations_jsonpath: ''
  max_seq_length: 23
  max_region_num: 36
  batch_size: 256
  eval_batch_size: 1024
  train_split: train
  val_split: val
  lr: 0.0001
  num_epoch: 20
# TASK8 (task_id 8) — RetrievalFlickr30k, type VL-logit with a single label.
# Settings are nested under the task key so that each task keeps its own
# values instead of colliding with the other tasks at the top level.
TASK8:
  name: RetrievalFlickr30k
  type: VL-logit
  num_labels: 1
  loss: CrossEntropyLoss
  process: retrieval
  task_id: 8
  dataroot: datasets/flickr30k
  features_h5path1: datasets/flickr30k/resnet101_faster_rcnn_genome_imgfeats/volta/flickr30k_feat.lmdb
  # Explicit empty string (not null): no second feature file is configured.
  features_h5path2: ''
  train_annotations_jsonpath: datasets/flickr30k/annotations/train_ann.jsonl
  val_annotations_jsonpath: datasets/flickr30k/annotations/valid_ann.jsonl
  max_seq_length: 30
  max_region_num: 36
  # NOTE(review): no eval_batch_size is set for this task, unlike TASK1,
  # TASK10 and TASK12 — confirm the consumer supplies a default.
  batch_size: 64
  train_split: train
  val_split: val
  # Keep the decimal form: some YAML 1.1 loaders read "2e-5" as a string.
  lr: 0.00002
  num_epoch: 20
# TASK10 (task_id 10) — refcoco+, type V-logit.
# Settings are nested under the task key so that each task keeps its own
# values instead of colliding with the other tasks at the top level.
TASK10:
  name: refcoco+
  type: V-logit
  # NOTE(review): no num_labels is set for this task, unlike TASK1, TASK8
  # and TASK12 — confirm the consumer does not require it for V-logit.
  # NOTE(review): spelled without the "s" of torch's BCEWithLogitsLoss —
  # presumably a lookup key in the consumer; confirm before renaming.
  loss: BCEWithLogitLoss
  process: normal
  task_id: 10
  dataroot: datasets/refcoco+_unc/annotations
  features_h5path1: datasets/refcoco+_unc/resnet101_faster_rcnn_genome_imgfeats/volta/refcoco+_unc_dets36_feat.lmdb
  # Explicit empty strings (not null): no second feature file and no
  # annotation files are configured for this task.
  features_h5path2: ''
  train_annotations_jsonpath: ''
  val_annotations_jsonpath: ''
  max_seq_length: 20
  max_region_num: 36
  batch_size: 256
  eval_batch_size: 1024
  train_split: train
  val_split: val
  lr: 0.0001
  num_epoch: 20
# TASK12 (task_id 12) — NLVR2, type VL-binary-classifier with 2 labels.
# Settings are nested under the task key so that each task keeps its own
# values instead of colliding with the other tasks at the top level.
TASK12:
  name: NLVR2
  type: VL-binary-classifier
  num_labels: 2
  # NOTE(review): spelled without the "s" of torch's BCEWithLogitsLoss —
  # presumably a lookup key in the consumer; confirm before renaming.
  loss: BCEWithLogitLoss
  process: nlvr
  task_id: 12
  dataroot: datasets/nlvr2/annotations
  features_h5path1: datasets/nlvr2/resnet101_faster_rcnn_genome_imgfeats/volta/nlvr2_feat.lmdb
  # Explicit empty strings (not null): no second feature file and no
  # annotation files are configured for this task.
  features_h5path2: ''
  train_annotations_jsonpath: ''
  val_annotations_jsonpath: ''
  max_seq_length: 40
  max_region_num: 36
  batch_size: 64
  eval_batch_size: 512
  train_split: train
  # The validation split is named "dev" here, not "val" as in the other tasks.
  val_split: dev
  lr: 0.00001
  num_epoch: 20