# instructblip/lavis/configs/datasets/ocrvqa/defaults_instruct.yaml
# Thien Huynh
# Initialization
# be13417
# Copyright (c) 2022, salesforce.com, inc.
# All rights reserved.
# SPDX-License-Identifier: BSD-3-Clause
# For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause
# Dataset configuration for the OCR-VQA instruction-tuning dataset.
# The nesting below is significant: processors and build_info belong to the
# `ocr_vqa_instruct` entry, and each `train`/`eval` key belongs to the
# processor or annotation group directly above it.
datasets:
  ocr_vqa_instruct:  # 1002146 train examples
    # data_dir: ${env.data_dir}/datasets
    data_type: images  # [images|videos|features]

    # Image preprocessing.
    # NOTE(review): only a `train` entry is defined here, while
    # `text_processor` also defines `eval` - confirm this is intentional.
    vis_processor:
      train:
        name: "clip_image_train"
        image_size: 224

    # Text preprocessing, configured separately for training and evaluation.
    text_processor:
      train:
        name: blip_instruction
        modality: image
        task: qa
      eval:
        name: blip_question

    build_info:
      # Do not put a minus sign (-) before a split name such as `train`:
      # that would turn the split into a list item instead of a mapping key.
      annotations:
        train:
          # `url` and `storage` are lists with one entry each.
          url:
            - https://storage.googleapis.com/sfr-xinstructblip-data-research/data/ocrvqa/ocrvqa.json
            # - /export/video-language-dataset/ocrvqa/ocrvqa.json
          storage:
            - ocrvqa/annotations/ocrvqa.json
            # - /export/video-language-dataset/ocrvqa/ocrvqa.json
      images:
        # NOTE(review): absolute, site-specific path - confirm it exists in
        # the target environment or override it.
        storage: /export/video-language-dataset/ocrvqa/images/