Files
modelscope/tests/pipelines/test_text_classification.py

64 lines
2.3 KiB
Python
Raw Normal View History

# Copyright (c) Alibaba, Inc. and its affiliates.
import tempfile
import unittest
import zipfile
from pathlib import Path
from maas_lib.fileio import File
from maas_lib.models import Model
from maas_lib.models.nlp import SequenceClassificationModel
from maas_lib.pipelines import SequenceClassificationPipeline, pipeline
from maas_lib.preprocessors import SequenceClassificationPreprocessor
class SequenceClassificationTest(unittest.TestCase):
    """Smoke tests for the sequence (text) classification pipeline.

    The tests build the pipeline both from a locally cached model archive
    and from a model-hub identifier, then run it on a few sentences and
    print the outputs.
    """

    def predict(self, pipeline_ins: SequenceClassificationPipeline):
        """Run ``pipeline_ins`` on sample sentences and print the results.

        Loads the ``'glue'`` / ``'sst2'`` dataset through easynlp, takes the
        first three sentences of its ``'test'`` split, feeds the first two
        to the pipeline one at a time, and finally prints the sampled
        sentences.

        Args:
            pipeline_ins: The pipeline instance to exercise.
        """
        # Imported lazily so easynlp is only required when a test runs.
        from easynlp.appzoo import load_dataset

        # Named `dataset` rather than `set` to avoid shadowing the builtin.
        dataset = load_dataset('glue', 'sst2')
        sentences = dataset['test']['sentence'][:3]

        for sentence in sentences[:2]:
            print(pipeline_ins(sentence))

        print(sentences)

    def test_run(self):
        """Build the pipeline from a downloaded model archive and run it.

        The archive is downloaded to ``.cache/easynlp`` when it is not
        already present, extracted next to itself, and the extracted
        directory is used to create the model and the preprocessor. The
        pipeline is then created both directly and through the ``pipeline``
        factory.
        """
        model_url = 'https://atp-modelzoo-sh.oss-cn-shanghai.aliyuncs.com' \
                    '/release/easynlp_modelzoo/alibaba-pai/bert-base-sst2.zip'
        cache_path_str = r'.cache/easynlp/bert-base-sst2.zip'
        cache_path = Path(cache_path_str)

        if not cache_path.exists():
            cache_path.parent.mkdir(parents=True, exist_ok=True)
            # Stage the download in a side file and rename it into place, so
            # a failed or interrupted download never leaves an empty or
            # truncated archive that later runs would treat as a valid cache.
            partial_path = cache_path.with_name(cache_path.name + '.part')
            partial_path.write_bytes(File.read(model_url))
            partial_path.replace(cache_path)

        # Extraction runs on every invocation; it overwrites in place.
        with zipfile.ZipFile(cache_path_str, 'r') as zipf:
            zipf.extractall(cache_path.parent)

        path = r'.cache/easynlp/bert-base-sst2'
        model = SequenceClassificationModel(path)
        preprocessor = SequenceClassificationPreprocessor(
            path, first_sequence='sentence', second_sequence=None)

        # Pipeline constructed directly from its class.
        pipeline1 = SequenceClassificationPipeline(model, preprocessor)
        self.predict(pipeline1)

        # Same components, resolved through the task-name factory.
        pipeline2 = pipeline(
            'text-classification', model=model, preprocessor=preprocessor)
        print(pipeline2('Hello world!'))

    def test_run_modelhub(self):
        """Build the pipeline from a model-hub identifier and run it."""
        model = Model.from_pretrained('damo/bert-base-sst2')
        preprocessor = SequenceClassificationPreprocessor(
            model.model_dir, first_sequence='sentence', second_sequence=None)
        pipeline_ins = pipeline(
            task='text-classification', model=model, preprocessor=preprocessor)
        self.predict(pipeline_ins)
if __name__ == '__main__':
    # Run the tests in this module when the file is executed as a script.
    unittest.main()