tests/pipelines/test_text_to_360panorama_image.py

# Copyright (c) Alibaba, Inc. and its affiliates.
import subprocess
import sys
import tempfile
import unittest

import cv2

from modelscope.hub.snapshot_download import snapshot_download
from modelscope.outputs import OutputKeys
from modelscope.pipelines import pipeline
from modelscope.utils.constant import Tasks
from modelscope.utils.logger import get_logger
from modelscope.utils.test_utils import test_level

logger = get_logger()


@unittest.skip('For need realesrgan')
class Text2360PanoramaImageTest(unittest.TestCase):

    def setUp(self) -> None:
        logger.info('start install xformers')
        cmd = [
            sys.executable, '-m', 'pip', 'install', 'xformers', '-f',
            'https://modelscope.oss-cn-beijing.aliyuncs.com/releases/repo.html'
        ]
        subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)

        logger.info('install xformers finished')

        self.task = Tasks.text_to_360panorama_image
        self.model_id = 'damo/cv_diffusion_text-to-360panorama-image_generation'
        self.prompt = 'The living room'
        self.upscale = False
        self.refinement = False

        self.input = {
            'prompt': self.prompt,
            'upscale': self.upscale,
            'refinement': self.refinement,
        }

    @unittest.skipUnless(test_level() >= 3, 'skip test due to gpu oom')
    def test_run_by_direct_model_download(self):
        from modelscope.pipelines.cv import Text2360PanoramaImagePipeline
        output_image_path = tempfile.NamedTemporaryFile(suffix='.png').name
        cache_path = snapshot_download(self.model_id)
        pipeline = Text2360PanoramaImagePipeline(cache_path)
        pipeline.group_key = self.task
        output = pipeline(inputs=self.input)[OutputKeys.OUTPUT_IMG]
        cv2.imwrite(output_image_path, output)
        print(
            'pipeline: the output image path is {}'.format(output_image_path))

    @unittest.skipUnless(test_level() >= 3, 'skip test due to gpu oom')
    def test_run_with_model_from_modelhub(self):
        from modelscope.pipelines.cv import Text2360PanoramaImagePipeline
        output_image_path = tempfile.NamedTemporaryFile(suffix='.png').name
        pipeline_ins = pipeline(
            task=Tasks.text_to_360panorama_image,
            model=self.model_id,
            model_revision='v1.0.0')
        output = pipeline_ins(inputs=self.input)[OutputKeys.OUTPUT_IMG]
        cv2.imwrite(output_image_path, output)
        print(
            'pipeline: the output image path is {}'.format(output_image_path))


if __name__ == '__main__':
    unittest.main()
add text-to-360pano-image pipeline, mod cv requirements 7月份计划上线的360全景图生成模型，自研模型权重文件地址https://www.modelscope.cn/models/damo/cv_diffusion_text-to-360panorama-image_generation/summary #### 依赖项说明 ##### 由于要使用xformers，torch版本最好使用1.13.1 ``` pip install torch==1.13.1+cu116 torchvision==0.14.1+cu116 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu116 ``` ##### 对应的diffusers和xformers版本如下 ``` pip install -U diffusers==0.18.0 pip install xformers==0.0.16 pip install triton, accelerate, transformers ``` ##### ModelScope Library 需要使用cv ``` pip install modelscope pip install "modelscope[cv]" -f https://modelscope.oss-cn-beijing.aliyuncs.com/releases/repo.html ``` ##### 此外，还需要安装第三方的一个库，Real-ESRGAN，安装方法如下 ``` # Install basicsr - https://github.com/xinntao/BasicSR # We use BasicSR for both training and inference pip install basicsr # facexlib and gfpgan are for face enhancement pip install facexlib pip install gfpgan pip install Pillow pip install tqdm pip install realesrgan==0.3.0 ``` Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13346430 * add text-to-360pano-image pipeline * add text-to-360pano-image pipeline, mod cv requirements * rm redundant files and cv requirements; add standard input and output definations * fix diffusers==0.18.0 and run test * fix diffusers==0.18.0 in multi-modal and run test again * add model_revision='v1.0.0' * fix yapf * add trycatch for enabling xformers * fix key error * add install xformers in test/setup * skip highres.fix in ci * feat: Fix conflict, auto commit by WebIDE 2023-07-27 11:33:39 +08:00			`# Copyright (c) Alibaba, Inc. and its affiliates.`
			`import subprocess`
			`import sys`
			`import tempfile`
			`import unittest`

			`import cv2`

			`from modelscope.hub.snapshot_download import snapshot_download`
			`from modelscope.outputs import OutputKeys`
			`from modelscope.pipelines import pipeline`
			`from modelscope.utils.constant import Tasks`
			`from modelscope.utils.logger import get_logger`
			`from modelscope.utils.test_utils import test_level`

			`logger = get_logger()`


fix numpy pandas compatible issue 明确受影响的模型(damo)： ONE-PEACE-4B ModuleNotFoundError: MyCustomPipeline: MyCustomModel: No module named 'one_peace'，缺少依赖。 cv_resnet50_face-reconstruction 不兼容tf2 nlp_automatic_post_editing_for_translation_en2de tf2.0兼容性问题，tf1.x需要 cv_resnet18_ocr-detection-word-level_damo tf2.x兼容性问题 cv_resnet18_ocr-detection-line-level_damo tf兼容性问题 cv_resnet101_detection_fewshot-defrcn 模型限制必须detection0.3+torch1.11.0" speech_dfsmn_ans_psm_48k_causal "librosa， numpy兼容性问题 cv_mdm_motion-generation "依赖numpy版本兼容性问题： File ""/opt/conda/lib/python3.8/site-packages/smplx/body_models.py"", cv_resnet50_ocr-detection-vlpt numpy兼容性问题 cv_clip-it_video-summarization_language-guided_en tf兼容性问题 Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13744636 * numpy and pandas no version * modify compatible issue * fix numpy compatible issue * modify ci * fix lint issue * replace Image.ANTIALIAS to Image.Resampling.LANCZOS pillow compatible * skip uncompatible cases * fix numpy compatible issue, skip cases that can not compatbile numpy or tensorflow2.x * skip compatible cases * fix clip model issue * fix body 3d keypoints compatible issue 2023-08-22 23:04:31 +08:00			`@unittest.skip('For need realesrgan')`
add text-to-360pano-image pipeline, mod cv requirements 7月份计划上线的360全景图生成模型，自研模型权重文件地址https://www.modelscope.cn/models/damo/cv_diffusion_text-to-360panorama-image_generation/summary #### 依赖项说明 ##### 由于要使用xformers，torch版本最好使用1.13.1 ``` pip install torch==1.13.1+cu116 torchvision==0.14.1+cu116 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu116 ``` ##### 对应的diffusers和xformers版本如下 ``` pip install -U diffusers==0.18.0 pip install xformers==0.0.16 pip install triton, accelerate, transformers ``` ##### ModelScope Library 需要使用cv ``` pip install modelscope pip install "modelscope[cv]" -f https://modelscope.oss-cn-beijing.aliyuncs.com/releases/repo.html ``` ##### 此外，还需要安装第三方的一个库，Real-ESRGAN，安装方法如下 ``` # Install basicsr - https://github.com/xinntao/BasicSR # We use BasicSR for both training and inference pip install basicsr # facexlib and gfpgan are for face enhancement pip install facexlib pip install gfpgan pip install Pillow pip install tqdm pip install realesrgan==0.3.0 ``` Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13346430 * add text-to-360pano-image pipeline * add text-to-360pano-image pipeline, mod cv requirements * rm redundant files and cv requirements; add standard input and output definations * fix diffusers==0.18.0 and run test * fix diffusers==0.18.0 in multi-modal and run test again * add model_revision='v1.0.0' * fix yapf * add trycatch for enabling xformers * fix key error * add install xformers in test/setup * skip highres.fix in ci * feat: Fix conflict, auto commit by WebIDE 2023-07-27 11:33:39 +08:00			`class Text2360PanoramaImageTest(unittest.TestCase):`

			`def setUp(self) -> None:`
			`logger.info('start install xformers')`
			`cmd = [`
			`sys.executable, '-m', 'pip', 'install', 'xformers', '-f',`
			`'https://modelscope.oss-cn-beijing.aliyuncs.com/releases/repo.html'`
			`]`
			`subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)`

			`logger.info('install xformers finished')`

			`self.task = Tasks.text_to_360panorama_image`
			`self.model_id = 'damo/cv_diffusion_text-to-360panorama-image_generation'`
			`self.prompt = 'The living room'`
			`self.upscale = False`
			`self.refinement = False`

			`self.input = {`
			`'prompt': self.prompt,`
			`'upscale': self.upscale,`
			`'refinement': self.refinement,`
			`}`

fix ut error Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13716099 * fix ut error 2023-08-19 21:16:07 +08:00			`@unittest.skipUnless(test_level() >= 3, 'skip test due to gpu oom')`
add text-to-360pano-image pipeline, mod cv requirements 7月份计划上线的360全景图生成模型，自研模型权重文件地址https://www.modelscope.cn/models/damo/cv_diffusion_text-to-360panorama-image_generation/summary #### 依赖项说明 ##### 由于要使用xformers，torch版本最好使用1.13.1 ``` pip install torch==1.13.1+cu116 torchvision==0.14.1+cu116 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu116 ``` ##### 对应的diffusers和xformers版本如下 ``` pip install -U diffusers==0.18.0 pip install xformers==0.0.16 pip install triton, accelerate, transformers ``` ##### ModelScope Library 需要使用cv ``` pip install modelscope pip install "modelscope[cv]" -f https://modelscope.oss-cn-beijing.aliyuncs.com/releases/repo.html ``` ##### 此外，还需要安装第三方的一个库，Real-ESRGAN，安装方法如下 ``` # Install basicsr - https://github.com/xinntao/BasicSR # We use BasicSR for both training and inference pip install basicsr # facexlib and gfpgan are for face enhancement pip install facexlib pip install gfpgan pip install Pillow pip install tqdm pip install realesrgan==0.3.0 ``` Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13346430 * add text-to-360pano-image pipeline * add text-to-360pano-image pipeline, mod cv requirements * rm redundant files and cv requirements; add standard input and output definations * fix diffusers==0.18.0 and run test * fix diffusers==0.18.0 in multi-modal and run test again * add model_revision='v1.0.0' * fix yapf * add trycatch for enabling xformers * fix key error * add install xformers in test/setup * skip highres.fix in ci * feat: Fix conflict, auto commit by WebIDE 2023-07-27 11:33:39 +08:00			`def test_run_by_direct_model_download(self):`
fix ut error Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13716099 * fix ut error 2023-08-19 21:16:07 +08:00			`from modelscope.pipelines.cv import Text2360PanoramaImagePipeline`
add text-to-360pano-image pipeline, mod cv requirements 7月份计划上线的360全景图生成模型，自研模型权重文件地址https://www.modelscope.cn/models/damo/cv_diffusion_text-to-360panorama-image_generation/summary #### 依赖项说明 ##### 由于要使用xformers，torch版本最好使用1.13.1 ``` pip install torch==1.13.1+cu116 torchvision==0.14.1+cu116 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu116 ``` ##### 对应的diffusers和xformers版本如下 ``` pip install -U diffusers==0.18.0 pip install xformers==0.0.16 pip install triton, accelerate, transformers ``` ##### ModelScope Library 需要使用cv ``` pip install modelscope pip install "modelscope[cv]" -f https://modelscope.oss-cn-beijing.aliyuncs.com/releases/repo.html ``` ##### 此外，还需要安装第三方的一个库，Real-ESRGAN，安装方法如下 ``` # Install basicsr - https://github.com/xinntao/BasicSR # We use BasicSR for both training and inference pip install basicsr # facexlib and gfpgan are for face enhancement pip install facexlib pip install gfpgan pip install Pillow pip install tqdm pip install realesrgan==0.3.0 ``` Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13346430 * add text-to-360pano-image pipeline * add text-to-360pano-image pipeline, mod cv requirements * rm redundant files and cv requirements; add standard input and output definations * fix diffusers==0.18.0 and run test * fix diffusers==0.18.0 in multi-modal and run test again * add model_revision='v1.0.0' * fix yapf * add trycatch for enabling xformers * fix key error * add install xformers in test/setup * skip highres.fix in ci * feat: Fix conflict, auto commit by WebIDE 2023-07-27 11:33:39 +08:00			`output_image_path = tempfile.NamedTemporaryFile(suffix='.png').name`
			`cache_path = snapshot_download(self.model_id)`
			`pipeline = Text2360PanoramaImagePipeline(cache_path)`
			`pipeline.group_key = self.task`
			`output = pipeline(inputs=self.input)[OutputKeys.OUTPUT_IMG]`
			`cv2.imwrite(output_image_path, output)`
			`print(`
			`'pipeline: the output image path is {}'.format(output_image_path))`

fix ut error Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13716099 * fix ut error 2023-08-19 21:16:07 +08:00			`@unittest.skipUnless(test_level() >= 3, 'skip test due to gpu oom')`
add text-to-360pano-image pipeline, mod cv requirements 7月份计划上线的360全景图生成模型，自研模型权重文件地址https://www.modelscope.cn/models/damo/cv_diffusion_text-to-360panorama-image_generation/summary #### 依赖项说明 ##### 由于要使用xformers，torch版本最好使用1.13.1 ``` pip install torch==1.13.1+cu116 torchvision==0.14.1+cu116 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu116 ``` ##### 对应的diffusers和xformers版本如下 ``` pip install -U diffusers==0.18.0 pip install xformers==0.0.16 pip install triton, accelerate, transformers ``` ##### ModelScope Library 需要使用cv ``` pip install modelscope pip install "modelscope[cv]" -f https://modelscope.oss-cn-beijing.aliyuncs.com/releases/repo.html ``` ##### 此外，还需要安装第三方的一个库，Real-ESRGAN，安装方法如下 ``` # Install basicsr - https://github.com/xinntao/BasicSR # We use BasicSR for both training and inference pip install basicsr # facexlib and gfpgan are for face enhancement pip install facexlib pip install gfpgan pip install Pillow pip install tqdm pip install realesrgan==0.3.0 ``` Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13346430 * add text-to-360pano-image pipeline * add text-to-360pano-image pipeline, mod cv requirements * rm redundant files and cv requirements; add standard input and output definations * fix diffusers==0.18.0 and run test * fix diffusers==0.18.0 in multi-modal and run test again * add model_revision='v1.0.0' * fix yapf * add trycatch for enabling xformers * fix key error * add install xformers in test/setup * skip highres.fix in ci * feat: Fix conflict, auto commit by WebIDE 2023-07-27 11:33:39 +08:00			`def test_run_with_model_from_modelhub(self):`
fix ut error Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13716099 * fix ut error 2023-08-19 21:16:07 +08:00			`from modelscope.pipelines.cv import Text2360PanoramaImagePipeline`
add text-to-360pano-image pipeline, mod cv requirements 7月份计划上线的360全景图生成模型，自研模型权重文件地址https://www.modelscope.cn/models/damo/cv_diffusion_text-to-360panorama-image_generation/summary #### 依赖项说明 ##### 由于要使用xformers，torch版本最好使用1.13.1 ``` pip install torch==1.13.1+cu116 torchvision==0.14.1+cu116 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu116 ``` ##### 对应的diffusers和xformers版本如下 ``` pip install -U diffusers==0.18.0 pip install xformers==0.0.16 pip install triton, accelerate, transformers ``` ##### ModelScope Library 需要使用cv ``` pip install modelscope pip install "modelscope[cv]" -f https://modelscope.oss-cn-beijing.aliyuncs.com/releases/repo.html ``` ##### 此外，还需要安装第三方的一个库，Real-ESRGAN，安装方法如下 ``` # Install basicsr - https://github.com/xinntao/BasicSR # We use BasicSR for both training and inference pip install basicsr # facexlib and gfpgan are for face enhancement pip install facexlib pip install gfpgan pip install Pillow pip install tqdm pip install realesrgan==0.3.0 ``` Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13346430 * add text-to-360pano-image pipeline * add text-to-360pano-image pipeline, mod cv requirements * rm redundant files and cv requirements; add standard input and output definations * fix diffusers==0.18.0 and run test * fix diffusers==0.18.0 in multi-modal and run test again * add model_revision='v1.0.0' * fix yapf * add trycatch for enabling xformers * fix key error * add install xformers in test/setup * skip highres.fix in ci * feat: Fix conflict, auto commit by WebIDE 2023-07-27 11:33:39 +08:00			`output_image_path = tempfile.NamedTemporaryFile(suffix='.png').name`
			`pipeline_ins = pipeline(`
			`task=Tasks.text_to_360panorama_image,`
			`model=self.model_id,`
			`model_revision='v1.0.0')`
			`output = pipeline_ins(inputs=self.input)[OutputKeys.OUTPUT_IMG]`
			`cv2.imwrite(output_image_path, output)`
			`print(`
			`'pipeline: the output image path is {}'.format(output_image_path))`


			`if __name__ == '__main__':`
			`unittest.main()`