From ffa7975ba2d2fa2ba23bad6ff7c23e133f3f0f30 Mon Sep 17 00:00:00 2001 From: shuaigezhu Date: Fri, 17 Mar 2023 14:05:58 +0800 Subject: [PATCH] init --- modelscope/metainfo.py | 2 + modelscope/models/nlp/__init__.py | 2 + modelscope/models/nlp/chatglm_6b/__init__.py | 22 +++++++++ .../chatglm6b_for_text_generation.py | 46 +++++++++++++++++++ modelscope/pipelines/nlp/__init__.py | 2 + .../nlp/chatglm6b_text_generation_pipeline.py | 39 ++++++++++++++++ 6 files changed, 113 insertions(+) create mode 100644 modelscope/models/nlp/chatglm_6b/__init__.py create mode 100644 modelscope/models/nlp/chatglm_6b/chatglm6b_for_text_generation.py create mode 100644 modelscope/pipelines/nlp/chatglm6b_text_generation_pipeline.py diff --git a/modelscope/metainfo.py b/modelscope/metainfo.py index 197999bb..f1edca9c 100644 --- a/modelscope/metainfo.py +++ b/modelscope/metainfo.py @@ -147,6 +147,7 @@ class Models(object): T5 = 'T5' mglm = 'mglm' codegeex = 'codegeex' + chatglm6b = 'chatglm6b' bloom = 'bloom' unite = 'unite' megatron_bert = 'megatron-bert' @@ -424,6 +425,7 @@ class Pipelines(object): feature_extraction = 'feature-extraction' mglm_text_summarization = 'mglm-text-summarization' codegeex_code_translation = 'codegeex-code-translation' + chatglm6b_text_generation = 'chatglm6b-text-generation' codegeex_code_generation = 'codegeex-code-generation' translation_en_to_de = 'translation_en_to_de' # keep it underscore translation_en_to_ro = 'translation_en_to_ro' # keep it underscore diff --git a/modelscope/models/nlp/__init__.py b/modelscope/models/nlp/__init__.py index 66a53a00..723bc586 100644 --- a/modelscope/models/nlp/__init__.py +++ b/modelscope/models/nlp/__init__.py @@ -18,6 +18,7 @@ if TYPE_CHECKING: ) from .bloom import BloomModel from .codegeex import CodeGeeXForCodeTranslation, CodeGeeXForCodeGeneration + from .chatglm_6b import ChatGLM6bForTextGeneration from .csanmt import CsanmtForTranslation from .deberta_v2 import DebertaV2ForMaskedLM, DebertaV2Model from .gpt_neo 
# Copyright (c) 2022 Zhipu.AI
from typing import Any, Dict

import torch
from transformers import AutoModel, AutoTokenizer

from modelscope.metainfo import Models
from modelscope.models.base import TorchModel
from modelscope.models.builder import MODELS
from modelscope.outputs import OutputKeys
from modelscope.utils.constant import Tasks
from modelscope.utils.logger import get_logger


@MODELS.register_module(Tasks.text_generation, module_name=Models.chatglm6b)
class ChatGLM6bForTextGeneration(TorchModel):
    """ChatGLM-6B chat model wrapped as a ModelScope text-generation model.

    The tokenizer and model are loaded with the transformers Auto* classes.
    ``trust_remote_code=True`` is required because the ChatGLM checkpoint
    ships its own modeling code.
    """

    def __init__(self, model_dir: str, *args, **kwargs):
        """Initialize the ChatGLM-6B model from the `model_dir` path.

        Args:
            model_dir (str): local directory holding the checkpoint.
        """
        super().__init__(model_dir, *args, **kwargs)
        self.logger = get_logger()
        # Loading tokenizer (checkpoint ships custom tokenizer code).
        self.tokenizer = AutoTokenizer.from_pretrained(
            model_dir, trust_remote_code=True)
        # Loading model in half precision; fall back to CPU when no GPU is
        # available instead of crashing on an unconditional .cuda() call.
        model = AutoModel.from_pretrained(
            model_dir, trust_remote_code=True).half()
        self.model = model.cuda() if torch.cuda.is_available() else model

    def forward(self, input: Dict) -> Dict:
        """Run one chat turn.

        Delegates to :meth:`chat`, which already returns a dict keyed by
        ``OutputKeys.TEXT``; the previous implementation wrapped that dict
        in a second ``{OutputKeys.TEXT: ...}`` layer, yielding an accidental
        doubly nested payload.

        Args:
            input (Dict): ``{'text': str, 'history': list}`` conversation
                state (schema taken from :meth:`chat`'s reads).

        Returns:
            Dict: ``{OutputKeys.TEXT: {'response': ..., 'history': ...}}``.
        """
        return self.chat(input)

    def chat(self, input: Dict) -> Dict:
        """Generate a response for ``input['text']`` given ``input['history']``.

        Args:
            input (Dict): must contain ``'text'`` (the user utterance) and
                ``'history'`` (prior turns, passed through to the model).

        Returns:
            Dict: ``{OutputKeys.TEXT: {'response': str, 'history': list}}``
            where ``history`` is the updated conversation returned by the
            underlying ``model.chat`` call.
        """
        text = input['text']
        history = input['history']
        response, history = self.model.chat(self.tokenizer, text, history)
        self.logger.info('Generation finished.')
        res = {'response': response, 'history': history}
        return {OutputKeys.TEXT: res}

    def quantize(self, bits: int):
        """Quantize the underlying model to `bits` bits in place.

        Returns self so calls can be chained (fluent API).
        """
        self.model = self.model.quantize(bits)
        return self
# Copyright (c) 2022 Zhipu.AI

from typing import Any, Dict, Optional, Union

from modelscope.metainfo import Pipelines
from modelscope.models.nlp import ChatGLM6bForTextGeneration
from modelscope.pipelines.base import Pipeline
from modelscope.pipelines.builder import PIPELINES
from modelscope.preprocessors import Preprocessor
from modelscope.utils.constant import Tasks


@PIPELINES.register_module(
    group_key=Tasks.text_generation,
    module_name=Pipelines.chatglm6b_text_generation)
class ChatGLM6bTextGenerationPipeline(Pipeline):
    """Text-generation pipeline backed by :class:`ChatGLM6bForTextGeneration`.

    Inputs are passed through to the model unchanged and the model's output
    dict is returned as-is; no preprocessor is applied.
    """

    def __init__(self,
                 model: Union[ChatGLM6bForTextGeneration, str],
                 preprocessor: Optional[Preprocessor] = None,
                 *args,
                 **kwargs):
        """Build the pipeline.

        Args:
            model: a ready ``ChatGLM6bForTextGeneration`` instance, or a
                model-directory string from which one is constructed.
            preprocessor: accepted for interface compatibility with other
                pipelines but currently unused — the raw input dict goes
                straight to the model. (Original annotation ``[Preprocessor]``
                was a list literal, not a type; fixed to ``Optional``.)
        """
        if isinstance(model, str):
            model = ChatGLM6bForTextGeneration(model)
        self.model = model
        # Inference only: disable dropout etc.
        self.model.eval()

        super().__init__(model=model, **kwargs)

    def preprocess(self, inputs, **preprocess_params) -> Dict[str, Any]:
        """No-op: the model consumes the raw input dict directly."""
        return inputs

    def forward(self, inputs: Dict, **forward_params) -> Dict[str, Any]:
        """Delegate the forward pass to the wrapped model."""
        return self.model(inputs)

    def postprocess(self, input, **kwargs) -> Dict[str, Any]:
        """No-op: the model's output dict is already the pipeline result."""
        return input