MiniGPT-4/eval_scripts/eval_utils.py
Bingyi Kang 05220fe3c1
init audio data config (#2)
- Add audio datasets
- Add audio processors 
- Add audio support in bindgpt
- Add audio training config

---------

Co-authored-by: bingyikang <bingyikang@bytedance.com>
Co-authored-by: zhaoyang <913556700@qq.com>
2023-05-26 11:44:18 +08:00

26 lines
758 B
Python

import torch
import torchaudio
from PIL import Image
def load_image(image, image_processor):
    """Turn an image given as a path, PIL image, or tensor into a tensor.

    Args:
        image: One of
            * ``str`` - opened with ``Image.open`` and converted to RGB,
            * ``PIL.Image.Image`` - used as-is (no RGB conversion),
            * ``torch.Tensor`` - returned directly, gaining a leading
              dimension only when it has exactly three dimensions.
        image_processor: Callable applied to the PIL image. Its result must
            support ``.unsqueeze(0)`` (presumably a tensor - confirm against
            the processor in use).

    Returns:
        The processed image with a leading dimension added via
        ``unsqueeze(0)``. Inputs of any other type, and tensors that do not
        have three dimensions, are returned unchanged.
    """
    if isinstance(image, str):
        # A string is interpreted as an image path.
        pil_image = Image.open(image).convert('RGB')
        return image_processor(pil_image).unsqueeze(0)

    if isinstance(image, Image.Image):
        return image_processor(image).unsqueeze(0)

    if isinstance(image, torch.Tensor) and image.dim() == 3:
        return image.unsqueeze(0)

    # Everything else is handed back untouched.
    return image
def load_audio(audio, audio_processor):
    """Run the audio processor on an audio file given by its path.

    Args:
        audio: Path to an audio file, as a ``str``. No other input type is
            supported yet.
        audio_processor: Callable invoked with the path string.

    Returns:
        Whatever ``audio_processor`` returns for the given path.

    Raises:
        NotImplementedError: If ``audio`` is not a ``str``.
    """
    if not isinstance(audio, str):
        raise NotImplementedError(
            f"load_audio only supports audio file paths (str), "
            f"got {type(audio).__name__}"
        )

    # NOTE(review): the loaded result is never used - the processor receives
    # the original path, not this value. The call is kept so existing behavior
    # (including any error it raises for an unreadable file) is unchanged.
    # TODO: confirm whether the processor expects the path or the loaded audio.
    raw_audio = torchaudio.load(audio)  # noqa: F841

    # Return the processed audio; previously the result was assigned to a
    # local and dropped, so callers always received None.
    return audio_processor(audio)