---
# nlvr.yaml
# Flat key/value configuration.
# NOTE(review): judging by the dataset path and checkpoint URL below, this
# looks like an NLVR2 fine-tuning config for a BLIP model — confirm against
# the script that loads it.

# Dataset locations.
# NOTE(review): image_root is an absolute, site-specific path; adjust it for
# your environment. ann_root is relative — presumably to the working
# directory of the consuming script; verify.
image_root: '/export/share/datasets/vision/NLVR2/'
ann_root: 'annotation'

# set pretrained as a file path or a URL
pretrained: 'https://storage.googleapis.com/sfr-vision-language-research/BLIP/models/model_base_nlvr.pth'

# size of ViT model; base or large
vit: 'base'
batch_size_train: 16
batch_size_test: 64
# Canonical lowercase boolean; same value as the former `False`.
vit_grad_ckpt: false
vit_ckpt_layer: 0
max_epoch: 15

image_size: 384

# optimizer
weight_decay: 0.05
# Written with an explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML)
# resolve a bare `3e-5` as the string '3e-5' rather than a float.
init_lr: 3.0e-5
min_lr: 0