# vlbert_tasks.yml — forked from jiasenlu/vilbert_beta.
# Per-task configuration: one top-level TASKn entry per task.
# TASK0 — settings for the VQA task (type VL-classifier).
# All settings are nested under TASK0; at column 0 they would be top-level
# keys that clash with the identically named keys of the other tasks.
TASK0:
  name: VQA
  type: VL-classifier
  # NOTE(review): spelled "BCEWithLogitLoss" (no "s"), unlike PyTorch's
  # BCEWithLogitsLoss. Presumably a lookup key in the consuming code, so it
  # is left unchanged — confirm before renaming.
  loss: BCEWithLogitLoss
  # task_id is independent of the TASKn index (TASK0 has task_id 1).
  task_id: 1
  dataroot: data/VQA
  features_h5path1: data/coco/coco_trainval_resnet101_faster_rcnn_genome.lmdb
  # Explicit empty strings: no second feature file and no annotation files
  # are configured for this task.
  features_h5path2: ''
  train_annotations_jsonpath: ''
  val_annotations_jsonpath: ''
  max_seq_length: 16
  max_region_num: 100
  batch_size: 256
  eval_batch_size: 1024
  train_split: trainval
  val_split: minval
  lr: 0.00004
  num_epoch: 20
# TASK1 — settings for the VCR_Q-A task (type VL-logit).
# All settings are nested under TASK1; at column 0 they would be top-level
# keys that clash with the identically named keys of the other tasks.
TASK1:
  name: VCR_Q-A
  type: VL-logit
  loss: CrossEntropyLoss
  # task_id is independent of the TASKn index (TASK1 has task_id 6).
  task_id: 6
  dataroot: data/VCR
  features_h5path1: data/VCR/VCR_resnet101_faster_rcnn_genome.lmdb
  features_h5path2: data/VCR/VCR_gt_resnet101_faster_rcnn_genome.lmdb
  train_annotations_jsonpath: data/VCR/train.jsonl
  val_annotations_jsonpath: data/VCR/val.jsonl
  max_seq_length: 60
  max_region_num: 100
  # NOTE(review): no eval_batch_size here, unlike TASK0 and TASK4 — confirm
  # the consumer does not require it for this task.
  batch_size: 64
  train_split: train
  val_split: val
  lr: 0.00002
  num_epoch: 20
# TASK2 — settings for the VCR_QA-R task (type VL-logit).
# All settings are nested under TASK2; at column 0 they would be top-level
# keys that clash with the identically named keys of the other tasks.
# Uses the same dataroot, feature files and annotation files as the VCR_Q-A
# entry, with a longer max_seq_length (80).
TASK2:
  name: VCR_QA-R
  type: VL-logit
  loss: CrossEntropyLoss
  # task_id is independent of the TASKn index (TASK2 has task_id 7).
  task_id: 7
  dataroot: data/VCR
  features_h5path1: data/VCR/VCR_resnet101_faster_rcnn_genome.lmdb
  features_h5path2: data/VCR/VCR_gt_resnet101_faster_rcnn_genome.lmdb
  train_annotations_jsonpath: data/VCR/train.jsonl
  val_annotations_jsonpath: data/VCR/val.jsonl
  max_seq_length: 80
  max_region_num: 100
  # NOTE(review): no eval_batch_size here, unlike TASK0 and TASK4 — confirm
  # the consumer does not require it for this task.
  batch_size: 64
  train_split: train
  val_split: val
  lr: 0.00002
  num_epoch: 20
# TASK3 — settings for the RetrievalFlickr30k task (type VL-logit).
# All settings are nested under TASK3; at column 0 they would be top-level
# keys that clash with the identically named keys of the other tasks.
TASK3:
  name: RetrievalFlickr30k
  type: VL-logit
  loss: CrossEntropyLoss
  # task_id is independent of the TASKn index (TASK3 has task_id 9).
  task_id: 9
  dataroot: data/flickr30k
  # NOTE(review): the only feature file is a "*_test_*" LMDB although
  # train_split and train_annotations_jsonpath are also set — confirm it
  # covers the images needed for training, or that this entry is eval-only.
  features_h5path1: data/flickr30k/flickr30k_test_resnet101_faster_rcnn_genome.lmdb
  # Explicit empty string: no second feature file is configured.
  features_h5path2: ''
  train_annotations_jsonpath: data/flickr30k/all_data_final_train_2014.jsonline
  # NOTE(review): validation annotations point at "test_set0" while
  # val_split is "val" — presumably intentional; verify against the loader.
  val_annotations_jsonpath: data/flickr30k/all_data_final_test_set0_2014.jsonline
  max_seq_length: 30
  max_region_num: 100
  # NOTE(review): no eval_batch_size here, unlike TASK0 and TASK4 — confirm
  # the consumer does not require it for this task.
  batch_size: 64
  train_split: train
  val_split: val
  lr: 0.00002
  num_epoch: 20
# TASK4 — settings for the refcoco+ task (type V-logit).
# All settings are nested under TASK4; at column 0 they would be top-level
# keys that clash with the identically named keys of the other tasks.
TASK4:
  name: refcoco+
  type: V-logit
  # NOTE(review): spelled "BCEWithLogitLoss" (no "s"), unlike PyTorch's
  # BCEWithLogitsLoss. Presumably a lookup key in the consuming code, so it
  # is left unchanged — confirm before renaming.
  loss: BCEWithLogitLoss
  # task_id is independent of the TASKn index (TASK4 has task_id 11).
  task_id: 11
  dataroot: data/referExpression
  features_h5path1: data/referExpression/refcoco+_resnet101_faster_rcnn_genome.lmdb
  features_h5path2: data/referExpression/refcoco+_gt_resnet101_faster_rcnn_genome.lmdb
  # Explicit empty strings: no annotation files are configured for this task.
  train_annotations_jsonpath: ''
  val_annotations_jsonpath: ''
  max_seq_length: 20
  max_region_num: 100
  batch_size: 256
  eval_batch_size: 1024
  train_split: train
  val_split: val
  lr: 0.00004
  num_epoch: 20