From f976c7800f171fb71569762d3b3dc47f139356f2 Mon Sep 17 00:00:00 2001 From: junchen14 Date: Tue, 24 Oct 2023 23:49:23 +0300 Subject: [PATCH] update visual genome --- dataset/README_MINIGPTv2_FINETUNE.md | 8 +++++--- minigpt4/configs/datasets/gqa/balanced_val.yaml | 4 ++-- minigpt4/configs/datasets/llava/conversation.yaml | 2 +- minigpt4/configs/datasets/llava/detail.yaml | 2 +- minigpt4/configs/datasets/llava/reason.yaml | 2 +- .../configs/datasets/multitask_conversation/default.yaml | 2 +- minigpt4/configs/datasets/nlp/unnatural_instruction.yaml | 2 +- minigpt4/configs/datasets/ocrvqa/ocrvqa.yaml | 4 ++-- minigpt4/configs/datasets/okvqa/defaults.yaml | 2 +- minigpt4/configs/datasets/textcaps/caption.yaml | 4 ++-- minigpt4/configs/datasets/vg/ref.yaml | 2 +- 11 files changed, 18 insertions(+), 16 deletions(-) diff --git a/dataset/README_MINIGPTv2_FINETUNE.md b/dataset/README_MINIGPTv2_FINETUNE.md index 4056b1b..be99f23 100644 --- a/dataset/README_MINIGPTv2_FINETUNE.md +++ b/dataset/README_MINIGPTv2_FINETUNE.md @@ -7,16 +7,16 @@ Image source | Download path --- | :---: COCO 2014 images | images    captions COCO VQA | vqa train    vqa val -Visual Genome | images part1 images part2 +Visual Genome | images part1    images part2    image meta data TextCaps | images    annotations RefCOCO | annotations RefCOCO+ | annotations RefCOCOg | annotations OKVQA | annotations -AOK-VQA | annotations +AOK-VQA | annotations OCR-VQA | annotations GQA | images    annotations -Filtered Flickr-30k | annotations +Filtered flickr-30k | annotations Multi-task conversation | annotations Filtered unnatural instruction | annotations LLaVA | Compelex reasoning    Detailed description    Conversation @@ -65,6 +65,8 @@ ${MINIGPTv2_DATASET} │ ├── VG_100K │ ├── VG_100K_2 │ └── region_descriptions.json +│ └── image_data.json + ... ``` diff --git a/minigpt4/configs/datasets/gqa/balanced_val.yaml b/minigpt4/configs/datasets/gqa/balanced_val.yaml index 5a9e55c..2de8c21 100644 --- a/minigpt4/configs/datasets/gqa/balanced_val.yaml +++ b/minigpt4/configs/datasets/gqa/balanced_val.yaml @@ -28,6 +28,6 @@ datasets: url: - https://storage.googleapis.com/sfr-vision-language-research/LAVIS/datasets/gqa/train_balanced_questions.json storage: - - /ibex/project/c2133/minigpt4_v2_dataset/gqa/annotations/train_balanced_questions.json + - /ibex/project/c2090/minigptv2_dataset/gqa/train_balanced_questions.json images: - storage: /ibex/project/c2133/minigpt4_v2_dataset/gqa/images_copy/ \ No newline at end of file + storage: /ibex/project/c2090/minigptv2_dataset/gqa/images \ No newline at end of file diff --git a/minigpt4/configs/datasets/llava/conversation.yaml b/minigpt4/configs/datasets/llava/conversation.yaml index 6978069..c074de1 100755 --- a/minigpt4/configs/datasets/llava/conversation.yaml +++ b/minigpt4/configs/datasets/llava/conversation.yaml @@ -9,4 +9,4 @@ datasets: data_type: images build_info: image_path: /ibex/reference/CV/COCO/cocoapi/data/2014/images/jpeg/train - ann_path: /ibex/project/c2133/minigpt4_v2_dataset/llava/conversation_58k.json \ No newline at end of file + ann_path: /ibex/project/c2090/minigptv2_dataset/llava/conversation_58k.json \ No newline at end of file diff --git a/minigpt4/configs/datasets/llava/detail.yaml b/minigpt4/configs/datasets/llava/detail.yaml index f4d0f0a..324dd18 100755 --- a/minigpt4/configs/datasets/llava/detail.yaml +++ b/minigpt4/configs/datasets/llava/detail.yaml @@ -9,4 +9,4 @@ datasets: data_type: images build_info: image_path: /ibex/reference/CV/COCO/cocoapi/data/2014/images/jpeg/train - ann_path: /ibex/project/c2133/minigpt4_v2_dataset/llava/detail_23k.json \ No newline at end of file + ann_path: /ibex/project/c2090/minigptv2_dataset/llava/detail_23k.json \ No newline at end of file diff --git a/minigpt4/configs/datasets/llava/reason.yaml b/minigpt4/configs/datasets/llava/reason.yaml index ea6cb06..88deed6 100755 --- a/minigpt4/configs/datasets/llava/reason.yaml +++ b/minigpt4/configs/datasets/llava/reason.yaml @@ -9,4 +9,4 @@ datasets: data_type: images build_info: image_path: /ibex/reference/CV/COCO/cocoapi/data/2014/images/jpeg/train - ann_path: /ibex/project/c2133/minigpt4_v2_dataset/llava/complex_reasoning_77k.json \ No newline at end of file + ann_path: /ibex/project/c2090/minigptv2_dataset/llava/complex_reasoning_77k.json \ No newline at end of file diff --git a/minigpt4/configs/datasets/multitask_conversation/default.yaml b/minigpt4/configs/datasets/multitask_conversation/default.yaml index 29200ee..5f51a9b 100644 --- a/minigpt4/configs/datasets/multitask_conversation/default.yaml +++ b/minigpt4/configs/datasets/multitask_conversation/default.yaml @@ -11,4 +11,4 @@ datasets: build_info: image_path: /ibex/reference/CV/COCO/cocoapi/data/2014/images/jpeg/train - ann_path: /ibex/project/c2133/minigpt4_v2_dataset/multitask_conversation/multi_task_conversation.json \ No newline at end of file + ann_path: /ibex/project/c2090/minigptv2_dataset/multitask_conversation/multi_task_conversation.json \ No newline at end of file diff --git a/minigpt4/configs/datasets/nlp/unnatural_instruction.yaml b/minigpt4/configs/datasets/nlp/unnatural_instruction.yaml index d9f31de..cac939e 100644 --- a/minigpt4/configs/datasets/nlp/unnatural_instruction.yaml +++ b/minigpt4/configs/datasets/nlp/unnatural_instruction.yaml @@ -7,4 +7,4 @@ datasets: unnatural_instruction: data_type: text build_info: - ann_path: /ibex/project/c2133/minigpt4_v2_dataset/unnatural-instructions/data/unnatural_instruction_filer.json \ No newline at end of file + ann_path: /ibex/project/c2090/minigptv2_dataset/unnatural_instructions/unnatural_instruction_filer.json \ No newline at end of file diff --git a/minigpt4/configs/datasets/ocrvqa/ocrvqa.yaml b/minigpt4/configs/datasets/ocrvqa/ocrvqa.yaml index d2f6a94..605d80f 100755 --- a/minigpt4/configs/datasets/ocrvqa/ocrvqa.yaml +++ b/minigpt4/configs/datasets/ocrvqa/ocrvqa.yaml @@ -8,5 +8,5 @@ datasets: ocrvqa: data_type: images build_info: - image_path: /ibex/project/c2133/minigpt4_v2_dataset/ocrvqa/images - ann_path: /ibex/project/c2133/minigpt4_v2_dataset/ocrvqa/dataset.json \ No newline at end of file + image_path: /ibex/project/c2090/minigptv2_dataset/ocrvqa/images + ann_path: /ibex/project/c2090/minigptv2_dataset/ocrvqa/dataset.json \ No newline at end of file diff --git a/minigpt4/configs/datasets/okvqa/defaults.yaml b/minigpt4/configs/datasets/okvqa/defaults.yaml index 402212c..d98ccbf 100755 --- a/minigpt4/configs/datasets/okvqa/defaults.yaml +++ b/minigpt4/configs/datasets/okvqa/defaults.yaml @@ -31,6 +31,6 @@ datasets: # - https://storage.googleapis.com/sfr-vision-language-research/LAVIS/datasets/okvqa/OpenEnded_mscoco_train2014_questions.json # - https://storage.googleapis.com/sfr-vision-language-research/LAVIS/datasets/okvqa/mscoco_train2014_annotations.json storage: - - /ibex/project/c2133/minigpt4_v2_dataset/okvqa_v2/annotations/okvqa_train.json + - /ibex/project/c2090/minigptv2_dataset/okvqa/okvqa_train.json images: storage: /ibex/reference/CV/COCO/cocoapi/data/2014/images/jpeg \ No newline at end of file diff --git a/minigpt4/configs/datasets/textcaps/caption.yaml b/minigpt4/configs/datasets/textcaps/caption.yaml index 61a92c7..eee1d93 100755 --- a/minigpt4/configs/datasets/textcaps/caption.yaml +++ b/minigpt4/configs/datasets/textcaps/caption.yaml @@ -10,7 +10,7 @@ datasets: data_type: images build_info: - image_path: /ibex/project/c2133/minigpt4_v2_dataset/TextCaps/train_images - ann_path: /ibex/project/c2133/minigpt4_v2_dataset/TextCaps/TextCaps_0.1_train.json + image_path: /ibex/project/c2090/minigptv2_dataset/textcaps/train_images + ann_path: /ibex/project/c2090/minigptv2_dataset/textcaps/TextCaps_0.1_train.json diff --git a/minigpt4/configs/datasets/vg/ref.yaml b/minigpt4/configs/datasets/vg/ref.yaml index 8b793a2..ffd5d70 100755 --- a/minigpt4/configs/datasets/vg/ref.yaml +++ b/minigpt4/configs/datasets/vg/ref.yaml @@ -7,4 +7,4 @@ datasets: refvg: data_type: images build_info: - data_dir: /ibex/project/c2133/minigpt4_v2_dataset/visual_genome \ No newline at end of file + data_dir: /ibex/project/c2090/minigptv2_dataset/visual_genome \ No newline at end of file