# FuseCap-image-captioning / BLIP /configs /retrieval_msrvtt.yaml
# noamrot's picture
# demo fix commit
# 85e9f46
# raw
# history blame
# 354 Bytes
---
# Data locations.
# NOTE(review): video_root is an absolute, user-specific path; presumably it
# has to be pointed at a local copy of the videos before use — confirm.
video_root: '/export/share/dongxuli/data/msrvtt_retrieval/videos'
# Relative path; what it is resolved against is not visible here — TODO confirm.
ann_root: 'annotation'

# Pretrained weights: give either a local file path or a URL.
pretrained: 'https://storage.googleapis.com/sfr-vision-language-research/BLIP/models/model_base_retrieval_coco.pth'
# ViT model size: 'base' or 'large'.
# NOTE(review): the checkpoint file name above contains "base"; presumably the
# two settings must agree — confirm against the consuming script.
vit: 'base'

# Numeric settings. Their exact semantics are defined by the consuming script,
# which is not shown here; the notes below are assumptions to be verified.
batch_size: 64
# presumably the number of top-k candidates kept at test time — TODO confirm
k_test: 128
# presumably the input image/frame resolution in pixels — TODO confirm
image_size: 384
# presumably the number of frames sampled per video at test time — TODO confirm
num_frm_test: 8