# Mirror of https://github.com/modelscope/modelscope.git
# (synced 2025-12-18 01:07:44 +01:00; original file: 60 lines, 2.3 KiB, Python).
# Copyright (c) Alibaba, Inc. and its affiliates.
|
|
import unittest
|
|
|
|
from modelscope.models import Model
|
|
from modelscope.outputs import OutputKeys
|
|
from modelscope.pipelines import pipeline
|
|
from modelscope.utils.constant import Tasks
|
|
from modelscope.utils.test_utils import test_level
|
|
|
|
|
|
class HiTeATasksTest(unittest.TestCase):
    """Smoke tests for the HiTeA video captioning and video QA pipelines.

    Every test builds a pipeline, runs it once on the shared sample video and
    prints the result. No assertion is made on the content of the output; a
    test fails only if building or calling the pipeline raises (or, for the
    captioning tests, if the result lacks ``OutputKeys.CAPTION``).
    """

    # Identifiers and sample input shared by the tests below.
    CAPTION_MODEL_ID = 'damo/multi-modal_hitea_video-captioning_base_en'
    VQA_MODEL_ID = 'damo/multi-modal_hitea_video-question-answering_base_en'
    VIDEO_PATH = 'data/test/videos/video_caption_and_qa_test.mp4'

    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
    def test_run_with_video_captioning_with_model(self):
        """Caption the sample video using a pipeline built from a Model object."""
        model = Model.from_pretrained(self.CAPTION_MODEL_ID)
        pipeline_caption = pipeline(
            task=Tasks.video_captioning,
            model=model,
        )
        result = pipeline_caption(self.VIDEO_PATH)
        print(result[OutputKeys.CAPTION])

    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
    def test_run_with_video_captioning_with_name(self):
        """Caption the sample video using a pipeline built from the model id."""
        pipeline_caption = pipeline(
            Tasks.video_captioning,
            model=self.CAPTION_MODEL_ID,
        )
        result = pipeline_caption(self.VIDEO_PATH)
        print(result[OutputKeys.CAPTION])

    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
    def test_run_with_video_question_answering_with_model(self):
        """Ask a question about the sample video via a Model-object pipeline."""
        model = Model.from_pretrained(self.VQA_MODEL_ID)
        pipeline_vqa = pipeline(Tasks.video_question_answering, model=model)
        # Named `inputs` rather than `input` so the builtin is not shadowed.
        inputs = {
            'video': self.VIDEO_PATH,
            'text': 'How many people are there?',
        }
        result = pipeline_vqa(inputs)
        print(result)

    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
    def test_run_with_video_question_answering_with_name(self):
        """Ask a question about the sample video via a model-id pipeline."""
        pipeline_vqa = pipeline(
            Tasks.video_question_answering, model=self.VQA_MODEL_ID)
        # Named `inputs` rather than `input` so the builtin is not shadowed.
        inputs = {
            'video': self.VIDEO_PATH,
            'text': 'Who teaches a girl how to paint eggs?',
        }
        result = pipeline_vqa(inputs)
        print(result)
|
|
|
|
|
|
if __name__ == '__main__':
    # Run this module's tests through unittest when executed as a script.
    unittest.main()
|