From 8db088d2cb45fe64e3855d98ed88f22e55fea58b Mon Sep 17 00:00:00 2001
From: "wenmeng.zwm" <wenmeng.zwm@alibaba-inc.com>
Date: Tue, 15 Aug 2023 16:47:52 +0800
Subject: [PATCH 01/22] fix virtual try-on unit test error

---
 modelscope/pipeline_inputs.py          | 9 ++++++++-
 tests/pipelines/test_virtual_try_on.py | 6 +++++-
 2 files changed, 13 insertions(+), 2 deletions(-)

diff --git a/modelscope/pipeline_inputs.py b/modelscope/pipeline_inputs.py
index b18e0979..8c7d3780 100644
--- a/modelscope/pipeline_inputs.py
+++ b/modelscope/pipeline_inputs.py
@@ -204,7 +204,14 @@ TASK_INPUTS = {
     InputType.IMAGE,
     Tasks.video_embedding:
     InputType.VIDEO,
-    Tasks.virtual_try_on: (InputType.IMAGE, InputType.IMAGE, InputType.IMAGE),
+    Tasks.virtual_try_on: [
+        (InputType.IMAGE, InputType.IMAGE, InputType.IMAGE),
+        {
+            'masked_model': InputType.IMAGE,
+            'pose': InputType.IMAGE,
+            'cloth': InputType.IMAGE,
+        }
+    ],
     Tasks.text_driven_segmentation: {
         InputKeys.IMAGE: InputType.IMAGE,
         InputKeys.TEXT: InputType.TEXT
diff --git a/tests/pipelines/test_virtual_try_on.py b/tests/pipelines/test_virtual_try_on.py
index c8a55f79..2e399d8f 100644
--- a/tests/pipelines/test_virtual_try_on.py
+++ b/tests/pipelines/test_virtual_try_on.py
@@ -20,7 +20,11 @@ class VirtualTryonTest(unittest.TestCase):
     masked_model = Image.open('data/test/images/virtual_tryon_model.jpg')
     pose = Image.open('data/test/images/virtual_tryon_pose.jpg')
     cloth = Image.open('data/test/images/virtual_tryon_cloth.jpg')
-    input_imgs = (masked_model, pose, cloth)
+    input_imgs = {
+        'masked_model': masked_model,
+        'pose': pose,
+        'cloth': cloth,
+    }
 
     @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
     def test_run_with_model_name(self):

From 1ec8fe4a961759f8889db1b8b11fe9dca9327beb Mon Sep 17 00:00:00 2001
From: ccyhxg <103231034+ccyhxg@users.noreply.github.com>
Date: Tue, 29 Aug 2023 20:53:26 +0800
Subject: [PATCH 02/22] damo/nlp_seqgpt-560m pipeline bugfix (#511)

Co-authored-by: chengchen.cc <chengchen.cc@MacBook-Pro-7.local>
---
 modelscope/pipelines/nlp/text_generation_pipeline.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/modelscope/pipelines/nlp/text_generation_pipeline.py b/modelscope/pipelines/nlp/text_generation_pipeline.py
index ee747444..b26b84b1 100644
--- a/modelscope/pipelines/nlp/text_generation_pipeline.py
+++ b/modelscope/pipelines/nlp/text_generation_pipeline.py
@@ -445,9 +445,9 @@ class SeqGPTPipeline(Pipeline):
     # define the forward pass
     def forward(self, prompt: str, **forward_params) -> Dict[str, Any]:
         # gen & decode
-        prompt += '[GEN]'
+        # prompt += '[GEN]'
         input_ids = self.tokenizer(
-            prompt,
+            prompt + '[GEN]',
             return_tensors='pt',
             padding=True,
             truncation=True,

From 0405fc95a9c6e3c554b56366f2b7eb50f4461f5f Mon Sep 17 00:00:00 2001
From: Wang Qiang <37444407+XDUWQ@users.noreply.github.com>
Date: Wed, 30 Aug 2023 13:34:29 +0800
Subject: [PATCH 03/22] support a10 video to video model (#512)

---
 .../multi_modal/video_to_video/video_to_video_model.py      | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/modelscope/models/multi_modal/video_to_video/video_to_video_model.py b/modelscope/models/multi_modal/video_to_video/video_to_video_model.py
index bd485da5..1a13a3fc 100755
--- a/modelscope/models/multi_modal/video_to_video/video_to_video_model.py
+++ b/modelscope/models/multi_modal/video_to_video/video_to_video_model.py
@@ -112,7 +112,7 @@ class VideoToVideo(TorchModel):
         generator.eval()
         load_dict = torch.load(cfg.model_path, map_location='cpu')
         ret = generator.load_state_dict(load_dict['state_dict'], strict=True)
-        self.generator = generator
+        self.generator = generator.half()
         logger.info('Load model {} path {}, with local status {}'.format(
             cfg.UNet.type, cfg.model_path, ret))
 
@@ -175,7 +175,7 @@ class VideoToVideo(TorchModel):
         video_data = rearrange(video_data, 'b f c h w -> (b f) c h w')
 
         video_data_list = torch.chunk(
-            video_data, video_data.shape[0] // 2, dim=0)
+            video_data, video_data.shape[0] // 1, dim=0)
         with torch.no_grad():
             decode_data = []
             for vd_data in video_data_list:
@@ -185,6 +185,7 @@ class VideoToVideo(TorchModel):
             video_data_feature = torch.cat(decode_data, dim=0)
             video_data_feature = rearrange(
                 video_data_feature, '(b f) c h w -> b c f h w', b=batch_size)
+        torch.cuda.empty_cache()
 
         with amp.autocast(enabled=True):
             total_noise_levels = 600
@@ -209,6 +210,7 @@ class VideoToVideo(TorchModel):
                 t_min=0,
                 discretization='trailing')
 
+            torch.cuda.empty_cache()
             scale_factor = 0.18215
             vid_tensor_feature = 1. / scale_factor * gen_vid
 

From d1478db172cbb1ffdccdbda73837b0fcf350238b Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 10:11:48 +0800
Subject: [PATCH 04/22] fix crossattention of diffusers

---
 .../efficient_diffusion_tuning/efficient_stable_diffusion.py  | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
index 901c44d9..e9f136ce 100644
--- a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
+++ b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
@@ -11,7 +11,7 @@ import torch.nn.functional as F
 from diffusers import (AutoencoderKL, DDPMScheduler, DiffusionPipeline,
                        DPMSolverMultistepScheduler, UNet2DConditionModel,
                        utils)
-from diffusers.models import cross_attention
+from diffusers.models import attention
 from diffusers.utils import deprecation_utils
 from swift import AdapterConfig, LoRAConfig, PromptConfig, Swift
 from transformers import CLIPTextModel, CLIPTokenizer
@@ -30,7 +30,7 @@ from .control_sd_lora import ControlLoRATuner
 
 utils.deprecate = lambda *arg, **kwargs: None
 deprecation_utils.deprecate = lambda *arg, **kwargs: None
-cross_attention.deprecate = lambda *arg, **kwargs: None
+attention.deprecate = lambda *arg, **kwargs: None
 
 __tuner_MAP__ = {'lora': LoRATuner, 'control_lora': ControlLoRATuner}
 

From c217d293096bfa52822055bd160efd0388d0fe48 Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 10:40:59 +0800
Subject: [PATCH 05/22] fix bugs

---
 .../efficient_diffusion_tuning/control_sd_lora.py          | 7 ++++---
 .../multi_modal/efficient_diffusion_tuning/sd_lora.py      | 5 +++--
 2 files changed, 7 insertions(+), 5 deletions(-)

diff --git a/modelscope/models/multi_modal/efficient_diffusion_tuning/control_sd_lora.py b/modelscope/models/multi_modal/efficient_diffusion_tuning/control_sd_lora.py
index a2c53e24..aaa588d3 100644
--- a/modelscope/models/multi_modal/efficient_diffusion_tuning/control_sd_lora.py
+++ b/modelscope/models/multi_modal/efficient_diffusion_tuning/control_sd_lora.py
@@ -10,7 +10,8 @@ import torch
 import torch.nn as nn
 import torch.nn.functional as F
 from diffusers.configuration_utils import ConfigMixin, register_to_config
-from diffusers.models.cross_attention import CrossAttention, LoRALinearLayer
+from diffusers.models.attention_processor import Attention
+from diffusers.models.lora import LoRALinearLayer
 from diffusers.models.modeling_utils import ModelMixin
 from diffusers.models.resnet import (Downsample2D, Upsample2D, downsample_2d,
                                      partial, upsample_2d)
@@ -467,7 +468,7 @@ class ControlLoRACrossAttnProcessor(LoRACrossAttnProcessor):
         return control_states
 
     def __call__(self,
-                 attn: CrossAttention,
+                 attn: Attention,
                  hidden_states,
                  encoder_hidden_states=None,
                  attention_mask=None,
@@ -619,7 +620,7 @@ class ControlLoRACrossAttnProcessorV2(LoRACrossAttnProcessor):
         return control_states
 
     def __call__(self,
-                 attn: CrossAttention,
+                 attn: Attention,
                  hidden_states,
                  encoder_hidden_states=None,
                  attention_mask=None,
diff --git a/modelscope/models/multi_modal/efficient_diffusion_tuning/sd_lora.py b/modelscope/models/multi_modal/efficient_diffusion_tuning/sd_lora.py
index feff05f4..306ca2b0 100644
--- a/modelscope/models/multi_modal/efficient_diffusion_tuning/sd_lora.py
+++ b/modelscope/models/multi_modal/efficient_diffusion_tuning/sd_lora.py
@@ -8,7 +8,8 @@ from typing import List, Tuple, Union
 import torch
 import torch.nn as nn
 from diffusers.configuration_utils import ConfigMixin, register_to_config
-from diffusers.models.cross_attention import CrossAttention, LoRALinearLayer
+from diffusers.models.attention_processor import Attention
+from diffusers.models.lora import LoRALinearLayer
 from diffusers.models.modeling_utils import ModelMixin
 from diffusers.utils.outputs import BaseOutput
 
@@ -84,7 +85,7 @@ class LoRACrossAttnProcessor(nn.Module):
         self.output_states_skipped = is_skipped
 
     def __call__(self,
-                 attn: CrossAttention,
+                 attn: Attention,
                  hidden_states,
                  encoder_hidden_states=None,
                  attention_mask=None,

From 6d13b58eae7e4447f5b3077d7ec2172bfb7e733d Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 12:05:04 +0800
Subject: [PATCH 06/22] fix bugs: rename module_layer_name kwarg to target_modules

---
 .../efficient_diffusion_tuning/efficient_stable_diffusion.py    | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
index e9f136ce..583d5ac0 100644
--- a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
+++ b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
@@ -139,7 +139,7 @@ class EfficientStableDiffusion(TorchModel):
                     320, 320, 640, 640, 1280, 1280, 1280, 1280, 1280, 640, 640,
                     640, 320, 320, 320
                 ],
-                module_layer_name=
+                target_modules=
                 r'.*[down_blocks|up_blocks|mid_block]\.\d+\.attentions\.\d+\.transformer_blocks\.\d+$',
                 embedding_pos=0,
                 prompt_length=prompt_length,

From a9de26f683f58b4e18f9b74e9500e5ff665a6559 Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 12:56:30 +0800
Subject: [PATCH 07/22] fix bugs

---
 .../efficient_diffusion_tuning/efficient_stable_diffusion.py | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
index 583d5ac0..7a989070 100644
--- a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
+++ b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
@@ -113,7 +113,7 @@ class EfficientStableDiffusion(TorchModel):
             rank = tuner_config[
                 'rank'] if tuner_config and 'rank' in tuner_config else 4
             lora_config = LoRAConfig(
-                rank=rank,
+                r=rank,
                 replace_modules=['to_q', 'to_k', 'to_v', 'to_out.0'],
                 merge_weights=False,
                 only_lora_trainable=False,
@@ -126,7 +126,7 @@ class EfficientStableDiffusion(TorchModel):
             adapter_config = AdapterConfig(
                 dim=-1,
                 hidden_pos=0,
-                module_name=r'.*ff\.net\.2$',
+                target_modules=r'.*ff\.net\.2$',
                 adapter_length=adapter_length,
                 only_adapter_trainable=False,
                 pretrained_weights=pretrained_tuner)
@@ -143,7 +143,6 @@ class EfficientStableDiffusion(TorchModel):
                 r'.*[down_blocks|up_blocks|mid_block]\.\d+\.attentions\.\d+\.transformer_blocks\.\d+$',
                 embedding_pos=0,
                 prompt_length=prompt_length,
-                only_prompt_trainable=False,
                 attach_front=False,
                 pretrained_weights=pretrained_tuner,
                 extract_embedding=True)

From 7715050047840d46814e333840aa788f974bffe8 Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 16:59:18 +0800
Subject: [PATCH 08/22] fix bugs

---
 .../efficient_stable_diffusion.py                        | 9 +++------
 1 file changed, 3 insertions(+), 6 deletions(-)

diff --git a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
index 7a989070..d3919166 100644
--- a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
+++ b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
@@ -114,11 +114,10 @@ class EfficientStableDiffusion(TorchModel):
                 'rank'] if tuner_config and 'rank' in tuner_config else 4
             lora_config = LoRAConfig(
                 r=rank,
-                replace_modules=['to_q', 'to_k', 'to_v', 'to_out.0'],
+                target_modules=['to_q', 'to_k', 'to_v', 'to_out.0'],
                 merge_weights=False,
                 only_lora_trainable=False,
-                use_merged_linear=False,
-                pretrained_weights=pretrained_tuner)
+                use_merged_linear=False)
             self.unet = Swift.prepare_model(self.unet, lora_config)
         elif tuner_name == 'swift-adapter':
             adapter_length = tuner_config[
@@ -127,9 +126,7 @@ class EfficientStableDiffusion(TorchModel):
                 dim=-1,
                 hidden_pos=0,
                 target_modules=r'.*ff\.net\.2$',
-                adapter_length=adapter_length,
-                only_adapter_trainable=False,
-                pretrained_weights=pretrained_tuner)
+                adapter_length=adapter_length)
             self.unet = Swift.prepare_model(self.unet, adapter_config)
         elif tuner_name == 'swift-prompt':
             prompt_length = tuner_config[

From 83ee5b9d111b1b516c44ff99394147fa728c8c61 Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 19:12:49 +0800
Subject: [PATCH 09/22] fix bugs

---
 .../efficient_diffusion_tuning/efficient_stable_diffusion.py     | 1 -
 1 file changed, 1 deletion(-)

diff --git a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
index d3919166..c4f46cbf 100644
--- a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
+++ b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
@@ -141,7 +141,6 @@ class EfficientStableDiffusion(TorchModel):
                 embedding_pos=0,
                 prompt_length=prompt_length,
                 attach_front=False,
-                pretrained_weights=pretrained_tuner,
                 extract_embedding=True)
             self.unet = Swift.prepare_model(self.unet, prompt_config)
         elif tuner_name in ('lora', 'control_lora'):

From da58f397e1acc115d56bd739c6daa3e4b4e3b099 Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 19:24:17 +0800
Subject: [PATCH 10/22] fix bugs

---
 .../efficient_diffusion_tuning/efficient_stable_diffusion.py   | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
index c4f46cbf..18f655c2 100644
--- a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
+++ b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
@@ -140,8 +140,7 @@ class EfficientStableDiffusion(TorchModel):
                 r'.*[down_blocks|up_blocks|mid_block]\.\d+\.attentions\.\d+\.transformer_blocks\.\d+$',
                 embedding_pos=0,
                 prompt_length=prompt_length,
-                attach_front=False,
-                extract_embedding=True)
+                attach_front=False)
             self.unet = Swift.prepare_model(self.unet, prompt_config)
         elif tuner_name in ('lora', 'control_lora'):
             # if not set the config of control-tuner, we add the lora tuner directly to the original framework,

From bb7a1c497e655be8b41794b2ee155afc1209bf90 Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 20:17:29 +0800
Subject: [PATCH 11/22] fix bugs

---
 .../efficient_diffusion_tuning/efficient_stable_diffusion.py     | 1 -
 1 file changed, 1 deletion(-)

diff --git a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
index 18f655c2..2fcd1df8 100644
--- a/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
+++ b/modelscope/models/multi_modal/efficient_diffusion_tuning/efficient_stable_diffusion.py
@@ -116,7 +116,6 @@ class EfficientStableDiffusion(TorchModel):
                 r=rank,
                 target_modules=['to_q', 'to_k', 'to_v', 'to_out.0'],
                 merge_weights=False,
-                only_lora_trainable=False,
                 use_merged_linear=False)
             self.unet = Swift.prepare_model(self.unet, lora_config)
         elif tuner_name == 'swift-adapter':

From 3b0006f52c3cd4e049c9da01a185d58e07df354a Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 20:46:41 +0800
Subject: [PATCH 12/22] skip tests

---
 .../test_efficient_diffusion_tuning_trainer_swift.py        | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/trainers/test_efficient_diffusion_tuning_trainer_swift.py b/tests/trainers/test_efficient_diffusion_tuning_trainer_swift.py
index 9e12335e..c661b8ee 100644
--- a/tests/trainers/test_efficient_diffusion_tuning_trainer_swift.py
+++ b/tests/trainers/test_efficient_diffusion_tuning_trainer_swift.py
@@ -33,7 +33,7 @@ class TestEfficientDiffusionTuningTrainerSwift(unittest.TestCase):
         shutil.rmtree(self.tmp_dir)
         super().tearDown()
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_efficient_diffusion_tuning_swift_lora_train(self):
         model_id = 'damo/multi-modal_efficient-diffusion-tuning-swift-lora'
         model_revision = 'v1.0.2'
@@ -62,7 +62,7 @@ class TestEfficientDiffusionTuningTrainerSwift(unittest.TestCase):
         self.assertIn(f'{trainer.timestamp}.log.json', results_files)
         self.assertIn(f'epoch_{self.max_epochs}.pth', results_files)
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_efficient_diffusion_tuning_swift_adapter_train(self):
         model_id = 'damo/multi-modal_efficient-diffusion-tuning-swift-adapter'
         model_revision = 'v1.0.2'
@@ -91,7 +91,7 @@ class TestEfficientDiffusionTuningTrainerSwift(unittest.TestCase):
         self.assertIn(f'{trainer.timestamp}.log.json', results_files)
         self.assertIn(f'epoch_{self.max_epochs}.pth', results_files)
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_efficient_diffusion_tuning_swift_prompt_train(self):
         model_id = 'damo/multi-modal_efficient-diffusion-tuning-swift-prompt'
         model_revision = 'v1.0.2'

From c89de1a825be958029f08878a3162ef20c6cda9d Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 21:46:12 +0800
Subject: [PATCH 13/22] skip tests

---
 .../test_efficient_diffusion_tuning_swift.py         | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/tests/pipelines/test_efficient_diffusion_tuning_swift.py b/tests/pipelines/test_efficient_diffusion_tuning_swift.py
index 09b739a0..a2af7dec 100644
--- a/tests/pipelines/test_efficient_diffusion_tuning_swift.py
+++ b/tests/pipelines/test_efficient_diffusion_tuning_swift.py
@@ -16,7 +16,7 @@ class EfficientDiffusionTuningTestSwift(unittest.TestCase):
     def setUp(self) -> None:
         self.task = Tasks.efficient_diffusion_tuning
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_efficient_diffusion_tuning_swift_lora_run_pipeline(self):
         model_id = 'damo/multi-modal_efficient-diffusion-tuning-swift-lora'
         model_revision = 'v1.0.2'
@@ -33,7 +33,7 @@ class EfficientDiffusionTuningTestSwift(unittest.TestCase):
             f'Efficient-diffusion-tuning-swift-lora output: {output_image_path}'
         )
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_efficient_diffusion_tuning_swift_lora_load_model_from_pretrained(
             self):
         model_id = 'damo/multi-modal_efficient-diffusion-tuning-swift-lora'
@@ -41,7 +41,7 @@ class EfficientDiffusionTuningTestSwift(unittest.TestCase):
         model = Model.from_pretrained(model_id, model_revision=model_revision)
         self.assertTrue(model.__class__ == EfficientStableDiffusion)
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_efficient_diffusion_tuning_swift_adapter_run_pipeline(self):
         model_id = 'damo/multi-modal_efficient-diffusion-tuning-swift-adapter'
         model_revision = 'v1.0.2'
@@ -58,7 +58,7 @@ class EfficientDiffusionTuningTestSwift(unittest.TestCase):
             f'Efficient-diffusion-tuning-swift-adapter output: {output_image_path}'
         )
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_efficient_diffusion_tuning_swift_adapter_load_model_from_pretrained(
             self):
         model_id = 'damo/multi-modal_efficient-diffusion-tuning-swift-adapter'
@@ -66,7 +66,7 @@ class EfficientDiffusionTuningTestSwift(unittest.TestCase):
         model = Model.from_pretrained(model_id, model_revision=model_revision)
         self.assertTrue(model.__class__ == EfficientStableDiffusion)
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_efficient_diffusion_tuning_swift_prompt_run_pipeline(self):
         model_id = 'damo/multi-modal_efficient-diffusion-tuning-swift-prompt'
         model_revision = 'v1.0.2'
@@ -83,7 +83,7 @@ class EfficientDiffusionTuningTestSwift(unittest.TestCase):
             f'Efficient-diffusion-tuning-swift-prompt output: {output_image_path}'
         )
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_efficient_diffusion_tuning_swift_prompt_load_model_from_pretrained(
             self):
         model_id = 'damo/multi-modal_efficient-diffusion-tuning-swift-prompt'

From cf43991981efbb45c5a95f8a90459ed66eec4f22 Mon Sep 17 00:00:00 2001
From: XDUWQ <1300964705@qq.com>
Date: Thu, 31 Aug 2023 23:42:01 +0800
Subject: [PATCH 14/22] skip tests

---
 tests/export/test_export_stable_diffusion.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/export/test_export_stable_diffusion.py b/tests/export/test_export_stable_diffusion.py
index a2e20198..91a877da 100644
--- a/tests/export/test_export_stable_diffusion.py
+++ b/tests/export/test_export_stable_diffusion.py
@@ -20,7 +20,7 @@ class TestExportStableDiffusion(unittest.TestCase):
             os.makedirs(self.tmp_dir)
         self.model_id = 'AI-ModelScope/stable-diffusion-v1-5'
 
-    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
+    @unittest.skipUnless(test_level() >= 1, 'skip test in current test level')
     def test_export_stable_diffusion(self):
         model = Model.from_pretrained(self.model_id)
         Exporter.from_model(model).export_onnx(

From 8c139ea437eb6b8a673d53a1e5bc6a483e779eee Mon Sep 17 00:00:00 2001
From: "mulin.lyh" <mulin.lyh@taobao.com>
Date: Wed, 30 Aug 2023 10:13:41 +0800
Subject: [PATCH 15/22] version to 1.9.0rc0

---
 modelscope/version.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/modelscope/version.py b/modelscope/version.py
index bb262e90..0a98fac3 100644
--- a/modelscope/version.py
+++ b/modelscope/version.py
@@ -1,5 +1,5 @@
 # Make sure to modify __release_datetime__ to release time when making official release.
-__version__ = '1.8.1'
+__version__ = '1.9.0rc0'
 # default release datetime for branches under active development is set
 # to be a time far-far-away-into-the-future
-__release_datetime__ = '2099-10-13 08:56:12'
+__release_datetime__ = '2023-09-03 00:00:00'

From 550e8954527e92b61189153923abcbab03747977 Mon Sep 17 00:00:00 2001
From: "mulin.lyh" <mulin.lyh@taobao.com>
Date: Fri, 1 Sep 2023 18:05:11 +0800
Subject: [PATCH 16/22] fix docker file bug

---
 docker/Dockerfile.ubuntu | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/docker/Dockerfile.ubuntu b/docker/Dockerfile.ubuntu
index c4669dfc..0c9c15c4 100644
--- a/docker/Dockerfile.ubuntu
+++ b/docker/Dockerfile.ubuntu
@@ -48,10 +48,10 @@ ENV SETUPTOOLS_USE_DISTUTILS=stdlib
 RUN CUDA_HOME=/usr/local/cuda TORCH_CUDA_ARCH_LIST="6.0 6.1 7.0 7.5 8.0 8.6" pip install --no-cache-dir  'git+https://github.com/facebookresearch/detectron2.git'
 
 # torchmetrics==0.11.4 for ofa
-RUN pip install --no-cache-dir tiktoken torchmetrics==0.11.4 'protobuf<=3.20.0' bitsandbytes basicsr && \
-    git clone -b v1.0.8 https://github.com/Dao-AILab/flash-attention && \
-    cd flash-attention && pip install . && \
-    pip install csrc/layer_norm && \
-    pip install csrc/rotary && \
-    cd .. && \
-    rm -rf flash-attention
+RUN pip install --no-cache-dir tiktoken torchmetrics==0.11.4 'transformers<4.31.0' transformers_stream_generator 'protobuf<=3.20.0' bitsandbytes basicsr
+COPY docker/scripts/install_flash_attension.sh /tmp/install_flash_attension.sh
+RUN if [ "$USE_GPU" = "True" ] ; then \
+        bash /tmp/install_flash_attension.sh; \
+    else \
+        echo 'cpu unsupport flash attention'; \
+    fi

From 84647801c1898cdb4eeb444d65858b12f95a7a89 Mon Sep 17 00:00:00 2001
From: "mulin.lyh" <mulin.lyh@taobao.com>
Date: Fri, 1 Sep 2023 18:02:50 +0800
Subject: [PATCH 17/22] fix pipeline and image build issue

Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13884178
* fix pipeline and image build issue

---
 docker/scripts/install_flash_attension.sh                   | 6 ++++++
 .../pipelines/cv/face_human_hand_detection_pipeline.py      | 2 +-
 modelscope/pipelines/cv/product_segmentation_pipeline.py    | 3 ++-
 tests/pipelines/test_face_human_hand_detection.py           | 4 +---
 tests/pipelines/test_product_segmentation.py                | 4 +---
 5 files changed, 11 insertions(+), 8 deletions(-)
 create mode 100644 docker/scripts/install_flash_attension.sh

diff --git a/docker/scripts/install_flash_attension.sh b/docker/scripts/install_flash_attension.sh
new file mode 100644
index 00000000..6a3301c2
--- /dev/null
+++ b/docker/scripts/install_flash_attension.sh
@@ -0,0 +1,6 @@
+    git clone -b v1.0.8 https://github.com/Dao-AILab/flash-attention && \
+    cd flash-attention && pip install . && \
+    pip install csrc/layer_norm && \
+    pip install csrc/rotary && \
+    cd .. && \
+    rm -rf flash-attention
diff --git a/modelscope/pipelines/cv/face_human_hand_detection_pipeline.py b/modelscope/pipelines/cv/face_human_hand_detection_pipeline.py
index d41a14dd..a387703c 100644
--- a/modelscope/pipelines/cv/face_human_hand_detection_pipeline.py
+++ b/modelscope/pipelines/cv/face_human_hand_detection_pipeline.py
@@ -32,7 +32,7 @@ class NanoDettForFaceHumanHandDetectionPipeline(Pipeline):
         logger.info('load model done')
 
     def preprocess(self, input: Input) -> Dict[str, Any]:
-        img = LoadImage.convert_to_ndarray(input['input_path'])
+        img = LoadImage.convert_to_ndarray(input)
         return img
 
     def forward(self, input: Dict[str, Any]) -> Dict[str, Any]:
diff --git a/modelscope/pipelines/cv/product_segmentation_pipeline.py b/modelscope/pipelines/cv/product_segmentation_pipeline.py
index 3b1b2381..d5cf2eab 100644
--- a/modelscope/pipelines/cv/product_segmentation_pipeline.py
+++ b/modelscope/pipelines/cv/product_segmentation_pipeline.py
@@ -31,7 +31,8 @@ class F3NetForProductSegmentationPipeline(Pipeline):
         logger.info('load model done')
 
     def preprocess(self, input: Input) -> Dict[str, Any]:
-        img = LoadImage.convert_to_ndarray(input['input_path'])
+        img = LoadImage.convert_to_ndarray(input)
+
         img = img.astype(np.float32)
         return img
 
diff --git a/tests/pipelines/test_face_human_hand_detection.py b/tests/pipelines/test_face_human_hand_detection.py
index 7aaa67e7..d2237e52 100644
--- a/tests/pipelines/test_face_human_hand_detection.py
+++ b/tests/pipelines/test_face_human_hand_detection.py
@@ -14,9 +14,7 @@ class FaceHumanHandTest(unittest.TestCase):
 
     def setUp(self) -> None:
         self.model_id = 'damo/cv_nanodet_face-human-hand-detection'
-        self.input = {
-            'input_path': 'data/test/images/face_human_hand_detection.jpg',
-        }
+        self.input = 'data/test/images/face_human_hand_detection.jpg'
 
     def pipeline_inference(self, pipeline: Pipeline, input: str):
         result = pipeline(input)
diff --git a/tests/pipelines/test_product_segmentation.py b/tests/pipelines/test_product_segmentation.py
index 8f41c13c..90137dea 100644
--- a/tests/pipelines/test_product_segmentation.py
+++ b/tests/pipelines/test_product_segmentation.py
@@ -17,9 +17,7 @@ class ProductSegmentationTest(unittest.TestCase):
 
     def setUp(self) -> None:
         self.model_id = 'damo/cv_F3Net_product-segmentation'
-        self.input = {
-            'input_path': 'data/test/images/product_segmentation.jpg'
-        }
+        self.input = 'data/test/images/product_segmentation.jpg'
 
     def pipeline_inference(self, pipeline: Pipeline, input: str):
         result = pipeline(input)

From 4780b5fb2f35d03f313dd5832f2f2f23dba406ab Mon Sep 17 00:00:00 2001
From: zsl01670416 <zsl01670416@alibaba-inc.com>
Date: Sat, 2 Sep 2023 08:04:54 +0800
Subject: [PATCH 18/22] modify parameter model_id to model

Fix stable_diffusion_cones2: the parameter model_id was renamed to model. The following file was changed:
1. examples/pytorch/stable_diffusion/cones2/finetune_stable_diffusion_cones2.py
Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13886743
* modify parameter model_id to model
---
 .../stable_diffusion/cones2/finetune_stable_diffusion_cones2.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/examples/pytorch/stable_diffusion/cones2/finetune_stable_diffusion_cones2.py b/examples/pytorch/stable_diffusion/cones2/finetune_stable_diffusion_cones2.py
index de97b3c9..135a5c7d 100644
--- a/examples/pytorch/stable_diffusion/cones2/finetune_stable_diffusion_cones2.py
+++ b/examples/pytorch/stable_diffusion/cones2/finetune_stable_diffusion_cones2.py
@@ -77,7 +77,7 @@ def cfg_modify_fn(cfg):
 
 
 kwargs = dict(
-    model=training_args.model_id,
+    model=training_args.model,
     model_revision=args.model_revision,
     work_dir=training_args.work_dir,
     train_dataset=train_dataset,

From db8ec462c2a9cd009b062061a496ac8672616b07 Mon Sep 17 00:00:00 2001
From: "mulin.lyh" <mulin.lyh@taobao.com>
Date: Mon, 4 Sep 2023 11:16:28 +0800
Subject: [PATCH 19/22] fix select case error Link:
 https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13889257 * fix
 select case error

---
 .dev_scripts/dockerci.sh | 2 +-
 tests/run_analysis.py    | 3 ++-
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/.dev_scripts/dockerci.sh b/.dev_scripts/dockerci.sh
index b4332f39..0278a785 100644
--- a/.dev_scripts/dockerci.sh
+++ b/.dev_scripts/dockerci.sh
@@ -9,7 +9,7 @@ cpu_sets_arr=($cpu_sets)
 is_get_file_lock=false
 CI_COMMAND=${CI_COMMAND:-bash .dev_scripts/ci_container_test.sh python tests/run.py --parallel 2 --run_config tests/run_config.yaml}
 echo "ci command: $CI_COMMAND"
-PR_CHANGED_FILES="${PR_CHANGED_FILES:-''}"
+PR_CHANGED_FILES="${PR_CHANGED_FILES:-}"
 echo "PR modified files: $PR_CHANGED_FILES"
 PR_CHANGED_FILES=${PR_CHANGED_FILES//[ ]/#}
 echo "PR_CHANGED_FILES: $PR_CHANGED_FILES"
diff --git a/tests/run_analysis.py b/tests/run_analysis.py
index 95c24698..1fb12ff6 100644
--- a/tests/run_analysis.py
+++ b/tests/run_analysis.py
@@ -126,11 +126,12 @@ def get_current_branch():
 
 def get_modified_files():
     if 'PR_CHANGED_FILES' in os.environ and os.environ[
-            'PR_CHANGED_FILES'] != '':
+            'PR_CHANGED_FILES'].strip() != '':
         logger.info('Getting PR modified files.')
         # get modify file from environment
         diff_files = os.environ['PR_CHANGED_FILES'].replace('#', '\n')
     else:
+        logger.info('Getting diff of branch.')
         cmd = ['git', 'diff', '--name-only', 'origin/master...']
         diff_files = run_command_get_output(cmd)
     logger.info('Diff files: ')

From bb63a8d4650d2e23cee6b4765897e8f6edd6eb77 Mon Sep 17 00:00:00 2001
From: "mulin.lyh" <mulin.lyh@taobao.com>
Date: Mon, 4 Sep 2023 13:30:38 +0800
Subject: [PATCH 20/22] remove error log Link:
 https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13891446

---
 .../models/cv/referring_video_object_segmentation/utils/mttr.py | 1 +
 modelscope/pipelines/cv/face_emotion_pipeline.py                | 2 +-
 modelscope/pipelines/cv/face_human_hand_detection_pipeline.py   | 1 -
 modelscope/pipelines/cv/hand_static_pipeline.py                 | 2 +-
 4 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/modelscope/models/cv/referring_video_object_segmentation/utils/mttr.py b/modelscope/models/cv/referring_video_object_segmentation/utils/mttr.py
index 48d4bf70..136208cd 100644
--- a/modelscope/models/cv/referring_video_object_segmentation/utils/mttr.py
+++ b/modelscope/models/cv/referring_video_object_segmentation/utils/mttr.py
@@ -65,6 +65,7 @@ class MTTR(nn.Module):
         # keep only the valid frames (frames which are annotated):
         # (for example, in a2d-sentences only the center frame in each window is annotated).
         for layer_out in backbone_out:
+            valid_indices = valid_indices.to(layer_out.tensors.device)
             layer_out.tensors = layer_out.tensors.index_select(
                 0, valid_indices)
             layer_out.mask = layer_out.mask.index_select(0, valid_indices)
diff --git a/modelscope/pipelines/cv/face_emotion_pipeline.py b/modelscope/pipelines/cv/face_emotion_pipeline.py
index 9d9aa6ee..f7882969 100644
--- a/modelscope/pipelines/cv/face_emotion_pipeline.py
+++ b/modelscope/pipelines/cv/face_emotion_pipeline.py
@@ -31,7 +31,7 @@ class FaceEmotionPipeline(Pipeline):
         logger.info('load model done')
 
     def preprocess(self, input: Input) -> Dict[str, Any]:
-        img = LoadImage.convert_to_ndarray(input['img_path'])
+        img = LoadImage.convert_to_ndarray(input)
         return img
 
     def forward(self, input: Dict[str, Any]) -> Dict[str, Any]:
diff --git a/modelscope/pipelines/cv/face_human_hand_detection_pipeline.py b/modelscope/pipelines/cv/face_human_hand_detection_pipeline.py
index a387703c..5fc70821 100644
--- a/modelscope/pipelines/cv/face_human_hand_detection_pipeline.py
+++ b/modelscope/pipelines/cv/face_human_hand_detection_pipeline.py
@@ -39,7 +39,6 @@ class NanoDettForFaceHumanHandDetectionPipeline(Pipeline):
 
         cls_list, bbox_list, score_list = det_infer.inference(
             self.model, self.device, input)
-        logger.info(cls_list, bbox_list, score_list)
         return {
             OutputKeys.LABELS: cls_list,
             OutputKeys.BOXES: bbox_list,
diff --git a/modelscope/pipelines/cv/hand_static_pipeline.py b/modelscope/pipelines/cv/hand_static_pipeline.py
index c020b7aa..ea908ed0 100644
--- a/modelscope/pipelines/cv/hand_static_pipeline.py
+++ b/modelscope/pipelines/cv/hand_static_pipeline.py
@@ -30,7 +30,7 @@ class HandStaticPipeline(Pipeline):
         logger.info('load model done')
 
     def preprocess(self, input: Input) -> Dict[str, Any]:
-        img = LoadImage.convert_to_ndarray(input['img_path'])
+        img = LoadImage.convert_to_ndarray(input)
         return img
 
     def forward(self, input: Dict[str, Any]) -> Dict[str, Any]:

From 797dda70bb14819692488d6d8d58757e45c180da Mon Sep 17 00:00:00 2001
From: "mulin.lyh" <mulin.lyh@taobao.com>
Date: Tue, 5 Sep 2023 10:42:43 +0800
Subject: [PATCH 21/22] merge github pull #519

Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/13900895
* merge github pull #519

* fix bug

* fix case issue

* merge github #519
---
 .../multi_modal/custom_diffusion/custom_diffusion_trainer.py   | 3 ++-
 tests/pipelines/test_face_emotion.py                           | 2 +-
 tests/pipelines/test_hand_static.py                            | 2 +-
 3 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/modelscope/trainers/multi_modal/custom_diffusion/custom_diffusion_trainer.py b/modelscope/trainers/multi_modal/custom_diffusion/custom_diffusion_trainer.py
index 1183c167..a18b546e 100644
--- a/modelscope/trainers/multi_modal/custom_diffusion/custom_diffusion_trainer.py
+++ b/modelscope/trainers/multi_modal/custom_diffusion/custom_diffusion_trainer.py
@@ -40,7 +40,8 @@ class CustomCheckpointProcessor(CheckpointProcessor):
     def __init__(self,
                  modifier_token,
                  modifier_token_id,
-                 torch_type=torch.float32):
+                 torch_type=torch.float32,
+                 safe_serialization=False):
         """Checkpoint processor for custom diffusion.
 
         Args:
diff --git a/tests/pipelines/test_face_emotion.py b/tests/pipelines/test_face_emotion.py
index 96fe51a7..b0070edc 100644
--- a/tests/pipelines/test_face_emotion.py
+++ b/tests/pipelines/test_face_emotion.py
@@ -11,7 +11,7 @@ class FaceEmotionTest(unittest.TestCase):
 
     def setUp(self) -> None:
         self.model = 'damo/cv_face-emotion'
-        self.img = {'img_path': 'data/test/images/face_emotion.jpg'}
+        self.img = 'data/test/images/face_emotion.jpg'
 
     def pipeline_inference(self, pipeline: Pipeline, input: str):
         result = pipeline(input)
diff --git a/tests/pipelines/test_hand_static.py b/tests/pipelines/test_hand_static.py
index 37181899..ae18c1d7 100644
--- a/tests/pipelines/test_hand_static.py
+++ b/tests/pipelines/test_hand_static.py
@@ -11,7 +11,7 @@ class HandStaticTest(unittest.TestCase):
 
     def setUp(self) -> None:
         self.model = 'damo/cv_mobileface_hand-static'
-        self.input = {'img_path': 'data/test/images/hand_static.jpg'}
+        self.input = 'data/test/images/hand_static.jpg'
 
     def pipeline_inference(self, pipeline: Pipeline, input: str):
         result = pipeline(input)

From f1629afd70e9024f1ef993841ce716a02c7d8c93 Mon Sep 17 00:00:00 2001
From: "mulin.lyh" <mulin.lyh@taobao.com>
Date: Tue, 5 Sep 2023 10:49:28 +0800
Subject: [PATCH 22/22] version to 1.9.0

---
 modelscope/version.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/modelscope/version.py b/modelscope/version.py
index 0a98fac3..46db9e93 100644
--- a/modelscope/version.py
+++ b/modelscope/version.py
@@ -1,5 +1,5 @@
 # Make sure to modify __release_datetime__ to release time when making official release.
-__version__ = '1.9.0rc0'
+__version__ = '1.9.0'
 # default release datetime for branches under active development is set
 # to be a time far-far-away-into-the-future
-__release_datetime__ = '2023-09-03 00:00:00'
+__release_datetime__ = '2023-09-06 00:00:00'