---
# retrieval_msrvtt.yaml
# Settings for a video-retrieval run on MSRVTT (per the file name and data path).

# Directory containing the video files. This is a machine-specific absolute
# path; change it to match the local environment.
video_root: '/export/share/dongxuli/data/msrvtt_retrieval/videos'
# Annotation directory, given as a relative path.
# NOTE(review): the base directory it resolves against is not visible here.
ann_root: 'annotation'

# set pretrained as a file path or a URL
pretrained: 'https://storage.googleapis.com/sfr-vision-language-research/BLIP/models/model_base_retrieval_coco.pth'

# size of vit model; base or large
vit: 'base'

batch_size: 64
# NOTE(review): presumably the number of top-k candidates considered at test
# time; confirm against the consuming code.
k_test: 128
image_size: 384
# NOTE(review): presumably the number of frames sampled per video at test time;
# confirm against the consuming code.
num_frm_test: 8