-
Notifications
You must be signed in to change notification settings - Fork 6
/
rva.yml
executable file
·40 lines (34 loc) · 914 Bytes
/
rva.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
# Dataset reader arguments
dataset:
  # Image feature files, one per split (train / val / test), in HDF5 (.h5).
  # NOTE(review): every path below is rooted at '/', which looks like a
  # missing data-directory prefix — confirm before running.
  image_features_train_h5: '/features_faster_rcnn_x101_train.h5'
  image_features_val_h5: '/features_faster_rcnn_x101_val.h5'
  image_features_test_h5: '/features_faster_rcnn_x101_test.h5'
  # Word-count JSON and GloVe .npy inputs.
  word_counts_json: '/visdial_1.0_word_counts_train.json'
  glove_npy: '/glove.npy'
  # NOTE(review): integer flag (1), presumably enables image-feature
  # normalization — verify against the dataset reader.
  img_norm: 1
  concat_history: false
  max_sequence_length: 20
  vocab_min_count: 5
# Model related arguments
model:
  # Encoder / decoder selectors, given by name.
  encoder: 'rva'
  decoder: 'disc'
  # Layer sizes.
  img_feature_size: 2048
  word_embedding_size: 300
  lstm_hidden_size: 512
  lstm_num_layers: 2
  # Dropout rates; `dropout_fc` is presumably applied to fully connected
  # layers — TODO confirm against the model code.
  dropout: 0.5
  dropout_fc: 0.3
  # Activation selected by name.
  relu: 'ReLU'
# Optimization related arguments
solver:
  batch_size: 24  # 32 x num_gpus is a good rule of thumb
  num_epochs: 15
  initial_lr: 0.01
  training_splits: 'train'  # or 'trainval'
  lr_gamma: 0.1
  lr_milestones:  # epochs when lr -> lr * lr_gamma
    - 5
    - 10
  # Learning-rate warmup settings.
  warmup_factor: 0.2
  warmup_epochs: 1