wip

2025-12-17 00:37:43 +01:00 · 2024-12-29 14:41:36 +08:00
parent 225d1058e3
commit c42a0aca1f
5 changed files with 474 additions and 543 deletions
--- a/modelscope/utils/hf_util.py
+++ b/modelscope/utils/hf_util.py
@@ -1,543 +0,0 @@
-# Copyright (c) Alibaba, Inc. and its affiliates.
-import os
-from functools import partial
-from pathlib import Path
-from types import MethodType
-from typing import BinaryIO, Dict, List, Optional, Union
-
-from huggingface_hub.hf_api import CommitInfo, future_compatible
-from transformers import AutoConfig as AutoConfigHF
-from transformers import AutoFeatureExtractor as AutoFeatureExtractorHF
-from transformers import AutoImageProcessor as AutoImageProcessorHF
-from transformers import AutoModel as AutoModelHF
-from transformers import \
-    AutoModelForAudioClassification as AutoModelForAudioClassificationHF
-from transformers import AutoModelForCausalLM as AutoModelForCausalLMHF
-from transformers import \
-    AutoModelForDocumentQuestionAnswering as \
-    AutoModelForDocumentQuestionAnsweringHF
-from transformers import \
-    AutoModelForImageClassification as AutoModelForImageClassificationHF
-from transformers import \
-    AutoModelForImageSegmentation as AutoModelForImageSegmentationHF
-from transformers import \
-    AutoModelForInstanceSegmentation as AutoModelForInstanceSegmentationHF
-from transformers import \
-    AutoModelForMaskedImageModeling as AutoModelForMaskedImageModelingHF
-from transformers import AutoModelForMaskedLM as AutoModelForMaskedLMHF
-from transformers import \
-    AutoModelForMaskGeneration as AutoModelForMaskGenerationHF
-from transformers import \
-    AutoModelForObjectDetection as AutoModelForObjectDetectionHF
-from transformers import AutoModelForPreTraining as AutoModelForPreTrainingHF
-from transformers import \
-    AutoModelForQuestionAnswering as AutoModelForQuestionAnsweringHF
-from transformers import \
-    AutoModelForSemanticSegmentation as AutoModelForSemanticSegmentationHF
-from transformers import AutoModelForSeq2SeqLM as AutoModelForSeq2SeqLMHF
-from transformers import \
-    AutoModelForSequenceClassification as AutoModelForSequenceClassificationHF
-from transformers import \
-    AutoModelForSpeechSeq2Seq as AutoModelForSpeechSeq2SeqHF
-from transformers import \
-    AutoModelForTableQuestionAnswering as AutoModelForTableQuestionAnsweringHF
-from transformers import AutoModelForTextEncoding as AutoModelForTextEncodingHF
-from transformers import \
-    AutoModelForTokenClassification as AutoModelForTokenClassificationHF
-from transformers import \
-    AutoModelForUniversalSegmentation as AutoModelForUniversalSegmentationHF
-from transformers import AutoModelForVision2Seq as AutoModelForVision2SeqHF
-from transformers import \
-    AutoModelForVisualQuestionAnswering as \
-    AutoModelForVisualQuestionAnsweringHF
-from transformers import \
-    AutoModelForZeroShotImageClassification as \
-    AutoModelForZeroShotImageClassificationHF
-from transformers import \
-    AutoModelForZeroShotObjectDetection as \
-    AutoModelForZeroShotObjectDetectionHF
-from transformers import AutoProcessor as AutoProcessorHF
-from transformers import AutoTokenizer as AutoTokenizerHF
-from transformers import BatchFeature as BatchFeatureHF
-from transformers import BitsAndBytesConfig as BitsAndBytesConfigHF
-from transformers import GenerationConfig as GenerationConfigHF
-from transformers import (PretrainedConfig, PreTrainedModel,
-                          PreTrainedTokenizerBase)
-from transformers import T5EncoderModel as T5EncoderModelHF
-from transformers import __version__ as transformers_version
-
-from modelscope import snapshot_download
-from modelscope.utils.constant import DEFAULT_MODEL_REVISION, Invoke
-from .logger import get_logger
-
-try:
-    from transformers import GPTQConfig as GPTQConfigHF
-    from transformers import AwqConfig as AwqConfigHF
-except ImportError:
-    GPTQConfigHF = None
-    AwqConfigHF = None
-
-try:
-    from peft import (
-        PeftConfig as PeftConfigHF,
-        PeftModel as PeftModelHF,
-        PeftModelForCausalLM as PeftModelForCausalLMHF,
-        PeftModelForSequenceClassification as
-        PeftModelForSequenceClassificationHF,
-        PeftMixedModel as PeftMixedModelHF,
-    )
-except ImportError:
-    PeftConfigHF = None
-    PeftModelHF = None
-    PeftModelForCausalLMHF = None
-    PeftModelForSequenceClassificationHF = None
-    PeftMixedModelHF = None
-
-logger = get_logger()
-
-
-class UnsupportedAutoClass:
-
-    def __init__(self, name: str):
-        self.error_msg = \
-            f'{name} is not supported with your installed Transformers version {transformers_version}. ' + \
-            'Please update your Transformers by "pip install transformers -U".'
-
-    def from_pretrained(self, pretrained_model_name_or_path, *model_args,
-                        **kwargs):
-        raise ImportError(self.error_msg)
-
-    def from_config(self, cls, config):
-        raise ImportError(self.error_msg)
-
-
-def user_agent(invoked_by=None):
-    if invoked_by is None:
-        invoked_by = Invoke.PRETRAINED
-    uagent = '%s/%s' % (Invoke.KEY, invoked_by)
-    return uagent
-
-
-def _file_exists(
-    self,
-    repo_id: str,
-    filename: str,
-    *,
-    repo_type: Optional[str] = None,
-    revision: Optional[str] = None,
-    token: Union[str, bool, None] = None,
-):
-    """Patch huggingface_hub.file_exists"""
-    if repo_type is not None:
-        logger.warning(
-            'The passed in repo_type will not be used in modelscope. Now only model repo can be queried.'
-        )
-    from modelscope.hub.api import HubApi
-    api = HubApi()
-    api.try_login(token)
-    return api.file_exists(repo_id, filename, revision=revision)
-
-
-def _file_download(repo_id: str,
-                   filename: str,
-                   *,
-                   subfolder: Optional[str] = None,
-                   repo_type: Optional[str] = None,
-                   revision: Optional[str] = None,
-                   cache_dir: Union[str, Path, None] = None,
-                   local_dir: Union[str, Path, None] = None,
-                   token: Union[bool, str, None] = None,
-                   local_files_only: bool = False,
-                   **kwargs):
-    """Patch huggingface_hub.hf_hub_download"""
-    if len(kwargs) > 0:
-        logger.warning(
-            'The passed in library_name,library_version,user_agent,force_download,proxies'
-            'etag_timeout,headers,endpoint '
-            'will not be used in modelscope.')
-    assert repo_type in (
-        None, 'model',
-        'dataset'), f'repo_type={repo_type} is not supported in ModelScope'
-    if repo_type in (None, 'model'):
-        from modelscope.hub.file_download import model_file_download as file_download
-    else:
-        from modelscope.hub.file_download import dataset_file_download as file_download
-    from modelscope import HubApi
-    api = HubApi()
-    api.try_login(token)
-    return file_download(
-        repo_id,
-        file_path=os.path.join(subfolder, filename) if subfolder else filename,
-        cache_dir=cache_dir,
-        local_dir=local_dir,
-        local_files_only=local_files_only,
-        revision=revision)
-
-
-def _whoami(self, token: Union[bool, str, None] = None) -> Dict:
-    from modelscope.hub.api import ModelScopeConfig
-    return {'name': ModelScopeConfig.get_user_info()[0] or 'unknown'}
-
-
-def _patch_pretrained_class():
-
-    def get_model_dir(pretrained_model_name_or_path, ignore_file_pattern,
-                      **kwargs):
-        if not os.path.exists(pretrained_model_name_or_path):
-            revision = kwargs.pop('revision', None)
-            model_dir = snapshot_download(
-                pretrained_model_name_or_path,
-                revision=revision,
-                ignore_file_pattern=ignore_file_pattern)
-        else:
-            model_dir = pretrained_model_name_or_path
-        return model_dir
-
-    ignore_file_pattern = [
-        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt'
-    ]
-
-    def patch_pretrained_model_name_or_path(cls, pretrained_model_name_or_path,
-                                            *model_args, **kwargs):
-        model_dir = get_model_dir(pretrained_model_name_or_path,
-                                  kwargs.pop('ignore_file_pattern', None),
-                                  **kwargs)
-        return kwargs.pop('ori_func')(cls, model_dir, *model_args, **kwargs)
-
-    PreTrainedTokenizerBase.from_pretrained = partial(
-        patch_pretrained_model_name_or_path,
-        ori_func=PreTrainedTokenizerBase.from_pretrained,
-        ignore_file_pattern=ignore_file_pattern)
-    PretrainedConfig.from_pretrained = partial(
-        patch_pretrained_model_name_or_path,
-        ori_func=PretrainedConfig.from_pretrained,
-        ignore_file_pattern=ignore_file_pattern)
-    PretrainedConfig.get_config_dict = partial(
-        patch_pretrained_model_name_or_path,
-        ori_func=PretrainedConfig.get_config_dict,
-        ignore_file_pattern=ignore_file_pattern)
-    PreTrainedModel.from_pretrained = partial(
-        patch_pretrained_model_name_or_path,
-        ori_func=PreTrainedModel.from_pretrained)
-    AutoImageProcessorHF.from_pretrained = partial(
-        patch_pretrained_model_name_or_path,
-        ori_func=PreTrainedModel.from_pretrained)
-    AutoProcessorHF.from_pretrained = partial(
-        patch_pretrained_model_name_or_path,
-        ori_func=AutoProcessorHF.from_pretrained)
-    AutoFeatureExtractorHF.from_pretrained = partial(
-        patch_pretrained_model_name_or_path,
-        ori_func=AutoFeatureExtractorHF.from_pretrained)
-    if PeftConfigHF is not None:
-        PeftConfigHF.from_pretrained = partial(
-            patch_pretrained_model_name_or_path,
-            ori_func=PeftConfigHF.from_pretrained,
-            ignore_file_pattern=ignore_file_pattern)
-
-    def patch_peft_model_id(cls, model, model_id, *model_args, **kwargs):
-        model_dir = get_model_dir(model_id,
-                                  kwargs.pop('ignore_file_pattern', None),
-                                  **kwargs)
-        return kwargs.pop('ori_func')(cls, model, model_dir, *model_args,
-                                      **kwargs)
-
-    if PeftModelHF is not None:
-        PeftModelHF.from_pretrained = partial(
-            patch_peft_model_id, ori_func=PeftModelHF.from_pretrained)
-        PeftModelForCausalLMHF.from_pretrained = partial(
-            patch_peft_model_id,
-            ori_func=PeftModelForCausalLMHF.from_pretrained)
-        PeftModelForSequenceClassificationHF.from_pretrained = partial(
-            patch_peft_model_id,
-            ori_func=PeftModelForSequenceClassificationHF.from_pretrained)
-        PeftMixedModelHF.from_pretrained = partial(
-            patch_peft_model_id, ori_func=PeftMixedModelHF.from_pretrained)
-
-    def _get_peft_type(cls, model_id, **kwargs):
-        model_dir = get_model_dir(model_id, ignore_file_pattern, **kwargs)
-        return kwargs.pop('ori_func')(cls, model_dir, **kwargs)
-
-    if PeftConfigHF is not None:
-        PeftConfigHF._get_peft_type = partial(
-            _get_peft_type,
-            ori_func=PeftConfigHF._get_peft_type,
-            ignore_file_pattern=ignore_file_pattern)
-
-
-def patch_hub():
-    """Patch hf hub, which to make users can download models from modelscope to speed up.
-    """
-    import huggingface_hub
-    from huggingface_hub import hf_api
-    from huggingface_hub.hf_api import api
-
-    # Patch hf_hub_download
-    huggingface_hub.hf_hub_download = _file_download
-    huggingface_hub.file_download.hf_hub_download = _file_download
-
-    # Patch file_exists
-    hf_api.file_exists = MethodType(_file_exists, api)
-    huggingface_hub.file_exists = hf_api.file_exists
-    huggingface_hub.hf_api.file_exists = hf_api.file_exists
-
-    # Patch whoami
-    hf_api.whoami = MethodType(_whoami, api)
-    huggingface_hub.whoami = hf_api.whoami
-    huggingface_hub.hf_api.whoami = hf_api.whoami
-
-    # Patch repocard.validate
-    from huggingface_hub import repocard
-    repocard.RepoCard.validate = lambda *args, **kwargs: None
-
-    def create_repo(self,
-                    repo_id: str,
-                    *,
-                    token: Union[str, bool, None] = None,
-                    private: bool = False,
-                    **kwargs) -> 'RepoUrl':
-        """
-        Create a new repository on the hub.
-
-        Args:
-            repo_id: The ID of the repository to create.
-            token: The authentication token to use.
-            private: Whether the repository should be private.
-            **kwargs: Additional arguments.
-
-        Returns:
-            RepoUrl: The URL of the created repository.
-        """
-        from modelscope.hub.create_model import create_model_repo
-        hub_model_id = create_model_repo(repo_id, token, private)
-        from huggingface_hub import RepoUrl
-        return RepoUrl(url=hub_model_id, )
-
-    @future_compatible
-    def upload_folder(
-        *,
-        repo_id: str,
-        folder_path: Union[str, Path],
-        path_in_repo: Optional[str] = None,
-        commit_message: Optional[str] = None,
-        commit_description: Optional[str] = None,
-        token: Union[str, bool, None] = None,
-        revision: Optional[str] = 'master',
-        ignore_patterns: Optional[Union[List[str], str]] = None,
-        **kwargs,
-    ):
-        from modelscope.hub.push_to_hub import push_model_to_hub
-        push_model_to_hub(repo_id, folder_path, path_in_repo, commit_message,
-                          commit_description, token, True, revision,
-                          ignore_patterns)
-        return CommitInfo(
-            commit_url=f'https://www.modelscope.cn/models/{repo_id}/files',
-            commit_message=commit_message,
-            commit_description=commit_description,
-            oid=None,
-        )
-
-    @future_compatible
-    def upload_file(
-        self,
-        *,
-        path_or_fileobj: Union[str, Path, bytes, BinaryIO],
-        path_in_repo: str,
-        repo_id: str,
-        token: Union[str, bool, None] = None,
-        revision: Optional[str] = None,
-        commit_message: Optional[str] = None,
-        commit_description: Optional[str] = None,
-        **kwargs,
-    ):
-        from modelscope.hub.push_to_hub import push_files_to_hub
-        push_files_to_hub(path_or_fileobj, path_in_repo, repo_id, token,
-                          revision, commit_message, commit_description)
-
-    # Patch create_repo
-    from transformers.utils import hub
-    hf_api.create_repo = MethodType(create_repo, api)
-    huggingface_hub.create_repo = hf_api.create_repo
-    huggingface_hub.hf_api.create_repo = hf_api.create_repo
-    hub.create_repo = create_repo
-
-    # Patch upload_folder
-    hf_api.upload_folder = MethodType(upload_folder, api)
-    huggingface_hub.upload_folder = hf_api.upload_folder
-    huggingface_hub.hf_api.upload_folder = hf_api.upload_folder
-
-    # Patch upload_file
-    hf_api.upload_file = MethodType(upload_file, api)
-    huggingface_hub.upload_file = hf_api.upload_file
-    huggingface_hub.hf_api.upload_file = hf_api.upload_file
-    repocard.upload_file = hf_api.upload_file
-
-    _patch_pretrained_class()
-
-
-def get_wrapped_class(module_class,
-                      ignore_file_pattern=[],
-                      file_filter=None,
-                      **kwargs):
-    """Get a custom wrapper class for  auto classes to download the models from the ModelScope hub
-    Args:
-        module_class: The actual module class
-        ignore_file_pattern (`str` or `List`, *optional*, default to `None`):
-            Any file pattern to be ignored in downloading, like exact file names or file extensions.
-    Returns:
-        The wrapper
-    """
-    default_ignore_file_pattern = ignore_file_pattern
-    default_file_filter = file_filter
-
-    class ClassWrapper(module_class):
-
-        @classmethod
-        def from_pretrained(cls, pretrained_model_name_or_path, *model_args,
-                            **kwargs):
-            ignore_file_pattern = kwargs.pop('ignore_file_pattern',
-                                             default_ignore_file_pattern)
-            subfolder = kwargs.pop('subfolder', default_file_filter)
-            file_filter = None
-            if subfolder:
-                file_filter = f'{subfolder}/*'
-            if not os.path.exists(pretrained_model_name_or_path):
-                revision = kwargs.pop('revision', DEFAULT_MODEL_REVISION)
-                if file_filter is None:
-                    model_dir = snapshot_download(
-                        pretrained_model_name_or_path,
-                        revision=revision,
-                        ignore_file_pattern=ignore_file_pattern,
-                        user_agent=user_agent())
-                else:
-                    model_dir = os.path.join(
-                        snapshot_download(
-                            pretrained_model_name_or_path,
-                            revision=revision,
-                            ignore_file_pattern=ignore_file_pattern,
-                            allow_file_pattern=file_filter,
-                            user_agent=user_agent()), subfolder)
-            else:
-                model_dir = pretrained_model_name_or_path
-
-            module_obj = module_class.from_pretrained(model_dir, *model_args,
-                                                      **kwargs)
-
-            if module_class.__name__.startswith('AutoModel'):
-                module_obj.model_dir = model_dir
-            return module_obj
-
-    ClassWrapper.__name__ = module_class.__name__
-    ClassWrapper.__qualname__ = module_class.__qualname__
-    return ClassWrapper
-
-
-AutoModel = get_wrapped_class(AutoModelHF)
-AutoModelForCausalLM = get_wrapped_class(AutoModelForCausalLMHF)
-AutoModelForSeq2SeqLM = get_wrapped_class(AutoModelForSeq2SeqLMHF)
-AutoModelForVision2Seq = get_wrapped_class(AutoModelForVision2SeqHF)
-AutoModelForSequenceClassification = get_wrapped_class(
-    AutoModelForSequenceClassificationHF)
-AutoModelForTokenClassification = get_wrapped_class(
-    AutoModelForTokenClassificationHF)
-AutoModelForImageSegmentation = get_wrapped_class(
-    AutoModelForImageSegmentationHF)
-AutoModelForImageClassification = get_wrapped_class(
-    AutoModelForImageClassificationHF)
-AutoModelForZeroShotImageClassification = get_wrapped_class(
-    AutoModelForZeroShotImageClassificationHF)
-try:
-    from transformers import AutoModelForImageToImage as AutoModelForImageToImageHF
-
-    AutoModelForImageToImage = get_wrapped_class(AutoModelForImageToImageHF)
-except ImportError:
-    AutoModelForImageToImage = UnsupportedAutoClass('AutoModelForImageToImage')
-
-try:
-    from transformers import AutoModelForImageTextToText as AutoModelForImageTextToTextHF
-
-    AutoModelForImageTextToText = get_wrapped_class(
-        AutoModelForImageTextToTextHF)
-except ImportError:
-    AutoModelForImageTextToText = UnsupportedAutoClass(
-        'AutoModelForImageTextToText')
-
-try:
-    from transformers import AutoModelForKeypointDetection as AutoModelForKeypointDetectionHF
-
-    AutoModelForKeypointDetection = get_wrapped_class(
-        AutoModelForKeypointDetectionHF)
-except ImportError:
-    AutoModelForKeypointDetection = UnsupportedAutoClass(
-        'AutoModelForKeypointDetection')
-
-AutoModelForQuestionAnswering = get_wrapped_class(
-    AutoModelForQuestionAnsweringHF)
-AutoModelForTableQuestionAnswering = get_wrapped_class(
-    AutoModelForTableQuestionAnsweringHF)
-AutoModelForVisualQuestionAnswering = get_wrapped_class(
-    AutoModelForVisualQuestionAnsweringHF)
-AutoModelForDocumentQuestionAnswering = get_wrapped_class(
-    AutoModelForDocumentQuestionAnsweringHF)
-AutoModelForSemanticSegmentation = get_wrapped_class(
-    AutoModelForSemanticSegmentationHF)
-AutoModelForUniversalSegmentation = get_wrapped_class(
-    AutoModelForUniversalSegmentationHF)
-AutoModelForInstanceSegmentation = get_wrapped_class(
-    AutoModelForInstanceSegmentationHF)
-AutoModelForObjectDetection = get_wrapped_class(AutoModelForObjectDetectionHF)
-AutoModelForZeroShotObjectDetection = get_wrapped_class(
-    AutoModelForZeroShotObjectDetectionHF)
-AutoModelForAudioClassification = get_wrapped_class(
-    AutoModelForAudioClassificationHF)
-AutoModelForSpeechSeq2Seq = get_wrapped_class(AutoModelForSpeechSeq2SeqHF)
-AutoModelForMaskedImageModeling = get_wrapped_class(
-    AutoModelForMaskedImageModelingHF)
-AutoModelForMaskedLM = get_wrapped_class(AutoModelForMaskedLMHF)
-AutoModelForMaskGeneration = get_wrapped_class(AutoModelForMaskGenerationHF)
-AutoModelForPreTraining = get_wrapped_class(AutoModelForPreTrainingHF)
-AutoModelForTextEncoding = get_wrapped_class(AutoModelForTextEncodingHF)
-T5EncoderModel = get_wrapped_class(T5EncoderModelHF)
-try:
-    from transformers import \
-        Qwen2VLForConditionalGeneration as Qwen2VLForConditionalGenerationHF
-
-    Qwen2VLForConditionalGeneration = get_wrapped_class(
-        Qwen2VLForConditionalGenerationHF)
-except ImportError:
-    Qwen2VLForConditionalGeneration = UnsupportedAutoClass(
-        'Qwen2VLForConditionalGeneration')
-
-AutoTokenizer = get_wrapped_class(
-    AutoTokenizerHF,
-    ignore_file_pattern=[
-        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
-    ])
-AutoProcessor = get_wrapped_class(
-    AutoProcessorHF,
-    ignore_file_pattern=[
-        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
-    ])
-AutoConfig = get_wrapped_class(
-    AutoConfigHF,
-    ignore_file_pattern=[
-        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
-    ])
-GenerationConfig = get_wrapped_class(
-    GenerationConfigHF,
-    ignore_file_pattern=[
-        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
-    ])
-BitsAndBytesConfig = get_wrapped_class(
-    BitsAndBytesConfigHF,
-    ignore_file_pattern=[
-        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
-    ])
-AutoImageProcessor = get_wrapped_class(
-    AutoImageProcessorHF,
-    ignore_file_pattern=[
-        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
-    ])
-
-GPTQConfig = GPTQConfigHF
-AwqConfig = AwqConfigHF
-BatchFeature = get_wrapped_class(BatchFeatureHF)
--- a/modelscope/utils/hf_util/init.py
+++ b/modelscope/utils/hf_util/init.py
--- a/modelscope/utils/hf_util/auto_class.py
+++ b/modelscope/utils/hf_util/auto_class.py
@@ -0,0 +1,187 @@
+# Copyright (c) Alibaba, Inc. and its affiliates.
+import inspect
+import os
+import sys
+from functools import partial
+from pathlib import Path
+import importlib
+from types import MethodType
+from typing import BinaryIO, Dict, List, Optional, Union
+
+from huggingface_hub.hf_api import CommitInfo, future_compatible
+from modelscope import snapshot_download
+from modelscope.utils.constant import DEFAULT_MODEL_REVISION, Invoke
+from modelscope.utils.logger import get_logger
+
+try:
+    from transformers import AutoModelForImageToImage as AutoModelForImageToImageHF
+
+    AutoModelForImageToImage = get_wrapped_class(AutoModelForImageToImageHF)
+except ImportError:
+    AutoModelForImageToImage = UnsupportedAutoClass('AutoModelForImageToImage')
+
+try:
+    from transformers import AutoModelForImageTextToText as AutoModelForImageTextToTextHF
+
+    AutoModelForImageTextToText = get_wrapped_class(
+        AutoModelForImageTextToTextHF)
+except ImportError:
+    AutoModelForImageTextToText = UnsupportedAutoClass(
+        'AutoModelForImageTextToText')
+
+try:
+    from transformers import AutoModelForKeypointDetection as AutoModelForKeypointDetectionHF
+
+    AutoModelForKeypointDetection = get_wrapped_class(
+        AutoModelForKeypointDetectionHF)
+except ImportError:
+    AutoModelForKeypointDetection = UnsupportedAutoClass(
+        'AutoModelForKeypointDetection')
+
+try:
+    from transformers import \
+        Qwen2VLForConditionalGeneration as Qwen2VLForConditionalGenerationHF
+
+    Qwen2VLForConditionalGeneration = get_wrapped_class(
+        Qwen2VLForConditionalGenerationHF)
+except ImportError:
+    Qwen2VLForConditionalGeneration = UnsupportedAutoClass(
+        'Qwen2VLForConditionalGeneration')
+
+    
+logger = get_logger()
+
+
+def get_wrapped_class(module_class,
+                      ignore_file_pattern=[],
+                      file_filter=None,
+                      **kwargs):
+    """Get a custom wrapper class for  auto classes to download the models from the ModelScope hub
+    Args:
+        module_class: The actual module class
+        ignore_file_pattern (`str` or `List`, *optional*, default to `None`):
+            Any file pattern to be ignored in downloading, like exact file names or file extensions.
+    Returns:
+        The wrapper
+    """
+    default_ignore_file_pattern = ignore_file_pattern
+    default_file_filter = file_filter
+
+    class ClassWrapper(module_class):
+
+        @classmethod
+        def from_pretrained(cls, pretrained_model_name_or_path, *model_args,
+                            **kwargs):
+            ignore_file_pattern = kwargs.pop('ignore_file_pattern',
+                                             default_ignore_file_pattern)
+            subfolder = kwargs.pop('subfolder', default_file_filter)
+            file_filter = None
+            if subfolder:
+                file_filter = f'{subfolder}/*'
+            if not os.path.exists(pretrained_model_name_or_path):
+                revision = kwargs.pop('revision', DEFAULT_MODEL_REVISION)
+                if file_filter is None:
+                    model_dir = snapshot_download(
+                        pretrained_model_name_or_path,
+                        revision=revision,
+                        ignore_file_pattern=ignore_file_pattern,
+                        user_agent=user_agent())
+                else:
+                    model_dir = os.path.join(
+                        snapshot_download(
+                            pretrained_model_name_or_path,
+                            revision=revision,
+                            ignore_file_pattern=ignore_file_pattern,
+                            allow_file_pattern=file_filter,
+                            user_agent=user_agent()), subfolder)
+            else:
+                model_dir = pretrained_model_name_or_path
+
+            module_obj = module_class.from_pretrained(model_dir, *model_args,
+                                                      **kwargs)
+
+            if module_class.__name__.startswith('AutoModel'):
+                module_obj.model_dir = model_dir
+            return module_obj
+
+    ClassWrapper.__name__ = module_class.__name__
+    ClassWrapper.__qualname__ = module_class.__qualname__
+    return ClassWrapper
+
+
+AutoModel = get_wrapped_class(AutoModelHF)
+AutoModelForCausalLM = get_wrapped_class(AutoModelForCausalLMHF)
+AutoModelForSeq2SeqLM = get_wrapped_class(AutoModelForSeq2SeqLMHF)
+AutoModelForVision2Seq = get_wrapped_class(AutoModelForVision2SeqHF)
+AutoModelForSequenceClassification = get_wrapped_class(
+    AutoModelForSequenceClassificationHF)
+AutoModelForTokenClassification = get_wrapped_class(
+    AutoModelForTokenClassificationHF)
+AutoModelForImageSegmentation = get_wrapped_class(
+    AutoModelForImageSegmentationHF)
+AutoModelForImageClassification = get_wrapped_class(
+    AutoModelForImageClassificationHF)
+AutoModelForZeroShotImageClassification = get_wrapped_class(
+    AutoModelForZeroShotImageClassificationHF)
+AutoModelForQuestionAnswering = get_wrapped_class(
+    AutoModelForQuestionAnsweringHF)
+AutoModelForTableQuestionAnswering = get_wrapped_class(
+    AutoModelForTableQuestionAnsweringHF)
+AutoModelForVisualQuestionAnswering = get_wrapped_class(
+    AutoModelForVisualQuestionAnsweringHF)
+AutoModelForDocumentQuestionAnswering = get_wrapped_class(
+    AutoModelForDocumentQuestionAnsweringHF)
+AutoModelForSemanticSegmentation = get_wrapped_class(
+    AutoModelForSemanticSegmentationHF)
+AutoModelForUniversalSegmentation = get_wrapped_class(
+    AutoModelForUniversalSegmentationHF)
+AutoModelForInstanceSegmentation = get_wrapped_class(
+    AutoModelForInstanceSegmentationHF)
+AutoModelForObjectDetection = get_wrapped_class(AutoModelForObjectDetectionHF)
+AutoModelForZeroShotObjectDetection = get_wrapped_class(
+    AutoModelForZeroShotObjectDetectionHF)
+AutoModelForAudioClassification = get_wrapped_class(
+    AutoModelForAudioClassificationHF)
+AutoModelForSpeechSeq2Seq = get_wrapped_class(AutoModelForSpeechSeq2SeqHF)
+AutoModelForMaskedImageModeling = get_wrapped_class(
+    AutoModelForMaskedImageModelingHF)
+AutoModelForMaskedLM = get_wrapped_class(AutoModelForMaskedLMHF)
+AutoModelForMaskGeneration = get_wrapped_class(AutoModelForMaskGenerationHF)
+AutoModelForPreTraining = get_wrapped_class(AutoModelForPreTrainingHF)
+AutoModelForTextEncoding = get_wrapped_class(AutoModelForTextEncodingHF)
+T5EncoderModel = get_wrapped_class(T5EncoderModelHF)
+
+AutoTokenizer = get_wrapped_class(
+    AutoTokenizerHF,
+    ignore_file_pattern=[
+        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
+    ])
+AutoProcessor = get_wrapped_class(
+    AutoProcessorHF,
+    ignore_file_pattern=[
+        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
+    ])
+AutoConfig = get_wrapped_class(
+    AutoConfigHF,
+    ignore_file_pattern=[
+        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
+    ])
+GenerationConfig = get_wrapped_class(
+    GenerationConfigHF,
+    ignore_file_pattern=[
+        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
+    ])
+BitsAndBytesConfig = get_wrapped_class(
+    BitsAndBytesConfigHF,
+    ignore_file_pattern=[
+        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
+    ])
+AutoImageProcessor = get_wrapped_class(
+    AutoImageProcessorHF,
+    ignore_file_pattern=[
+        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt', r'\w+\.h5'
+    ])
+
+GPTQConfig = GPTQConfigHF
+AwqConfig = AwqConfigHF
+BatchFeature = get_wrapped_class(BatchFeatureHF)
--- a/modelscope/utils/hf_util/patcher.py
+++ b/modelscope/utils/hf_util/patcher.py
@@ -0,0 +1,268 @@
+# Copyright (c) Alibaba, Inc. and its affiliates.
+import inspect
+import os
+import sys
+from functools import partial
+from pathlib import Path
+import importlib
+from types import MethodType
+from typing import BinaryIO, Dict, List, Optional, Union
+
+from huggingface_hub.hf_api import CommitInfo, future_compatible
+from modelscope import snapshot_download
+from modelscope.utils.constant import Invoke
+from modelscope.utils.logger import get_logger
+
+
+logger = get_logger()
+
+
+extra_modules = ['T5']
+lazy_module = sys.modules['transformers']
+all_modules = lazy_module._modules
+all_imported_modules = []
+for module in all_modules:
+    if 'auto' in module.lower() or any(m in module for m in extra_modules):
+        all_imported_modules.append(importlib.import_module(f'transformers.{module}'))
+
+
+def user_agent(invoked_by=None):
+    if invoked_by is None:
+        invoked_by = Invoke.PRETRAINED
+    uagent = '%s/%s' % (Invoke.KEY, invoked_by)
+    return uagent
+
+
+def _patch_pretrained_class():
+
+    def get_model_dir(pretrained_model_name_or_path, ignore_file_pattern,
+                      **kwargs):
+        if not os.path.exists(pretrained_model_name_or_path):
+            revision = kwargs.pop('revision', None)
+            model_dir = snapshot_download(
+                pretrained_model_name_or_path,
+                revision=revision,
+                ignore_file_pattern=ignore_file_pattern)
+        else:
+            model_dir = pretrained_model_name_or_path
+        return model_dir
+
+    ignore_file_pattern = [
+        r'\w+\.bin', r'\w+\.safetensors', r'\w+\.pth', r'\w+\.pt'
+    ]
+
+    def patch_pretrained_model_name_or_path(cls, pretrained_model_name_or_path,
+                                            *model_args, **kwargs):
+        model_dir = get_model_dir(pretrained_model_name_or_path,
+                                  kwargs.pop('ignore_file_pattern', None),
+                                  **kwargs)
+        return kwargs.pop('ori_func')(cls, model_dir, *model_args, **kwargs)
+
+    def patch_peft_model_id(cls, model, model_id, *model_args, **kwargs):
+        model_dir = get_model_dir(model_id,
+                                  kwargs.pop('ignore_file_pattern', None),
+                                  **kwargs)
+        return kwargs.pop('ori_func')(cls, model, model_dir, *model_args,
+                                      **kwargs)
+
+    def _get_peft_type(cls, model_id, **kwargs):
+        model_dir = get_model_dir(model_id, ignore_file_pattern, **kwargs)
+        return kwargs.pop('ori_func')(cls, model_dir, **kwargs)
+
+    for var in all_imported_modules:
+        if var is None:
+            continue
+        name = var.__name__
+        need_model = 'model' in name.lower() or 'processor' in name.lower() or 'extractor' in name.lower()
+        if need_model:
+            ignore_file_pattern_kwargs = {}
+        else:
+            ignore_file_pattern_kwargs = {'ignore_file_pattern': ignore_file_pattern}
+
+        if name.endswith('HF'):
+            has_from_pretrained = hasattr(var, 'from_pretrained')
+            has_get_peft_type = hasattr(var, '_get_peft_type')
+            parameters = inspect.signature(var.from_pretrained).parameters
+            is_peft = 'model' in parameters and 'model_id' in parameters
+            if has_from_pretrained:
+                if not is_peft:
+                    var.from_pretrained = partial(patch_pretrained_model_name_or_path,
+                                                  ori_func=var.from_pretrained,
+                                                  **ignore_file_pattern_kwargs)
+                else:
+                    var.from_pretrained = partial(patch_peft_model_id,
+                                                  ori_func=var.from_pretrained,
+                                                  **ignore_file_pattern_kwargs)
+            if has_get_peft_type:
+                var._get_peft_type = partial(_get_peft_type,
+                                              ori_func=var._get_peft_type,
+                                              **ignore_file_pattern_kwargs)
+
+
+def _patch_hub():
+    import huggingface_hub
+    from huggingface_hub import hf_api
+    from huggingface_hub.hf_api import api
+
+    def _file_exists(
+            self,
+            repo_id: str,
+            filename: str,
+            *,
+            repo_type: Optional[str] = None,
+            revision: Optional[str] = None,
+            token: Union[str, bool, None] = None,
+    ):
+        """Patch huggingface_hub.file_exists"""
+        if repo_type is not None:
+            logger.warning(
+                'The passed in repo_type will not be used in modelscope. Now only model repo can be queried.'
+            )
+        from modelscope.hub.api import HubApi
+        api = HubApi()
+        api.try_login(token)
+        return api.file_exists(repo_id, filename, revision=revision)
+
+    def _file_download(repo_id: str,
+                       filename: str,
+                       *,
+                       subfolder: Optional[str] = None,
+                       repo_type: Optional[str] = None,
+                       revision: Optional[str] = None,
+                       cache_dir: Union[str, Path, None] = None,
+                       local_dir: Union[str, Path, None] = None,
+                       token: Union[bool, str, None] = None,
+                       local_files_only: bool = False,
+                       **kwargs):
+        """Patch huggingface_hub.hf_hub_download"""
+        if len(kwargs) > 0:
+            logger.warning(
+                'The passed in library_name,library_version,user_agent,force_download,proxies'
+                'etag_timeout,headers,endpoint '
+                'will not be used in modelscope.')
+        assert repo_type in (
+            None, 'model',
+            'dataset'), f'repo_type={repo_type} is not supported in ModelScope'
+        if repo_type in (None, 'model'):
+            from modelscope.hub.file_download import model_file_download as file_download
+        else:
+            from modelscope.hub.file_download import dataset_file_download as file_download
+        from modelscope import HubApi
+        api = HubApi()
+        api.try_login(token)
+        return file_download(
+            repo_id,
+            file_path=os.path.join(subfolder, filename) if subfolder else filename,
+            cache_dir=cache_dir,
+            local_dir=local_dir,
+            local_files_only=local_files_only,
+            revision=revision)
+
+    def _whoami(self, token: Union[bool, str, None] = None) -> Dict:
+        from modelscope.hub.api import ModelScopeConfig
+        return {'name': ModelScopeConfig.get_user_info()[0] or 'unknown'}
+
+    # Patch hf_hub_download
+    huggingface_hub.hf_hub_download = _file_download
+    huggingface_hub.file_download.hf_hub_download = _file_download
+
+    # Patch file_exists
+    hf_api.file_exists = MethodType(_file_exists, api)
+    huggingface_hub.file_exists = hf_api.file_exists
+    huggingface_hub.hf_api.file_exists = hf_api.file_exists
+
+    # Patch whoami
+    hf_api.whoami = MethodType(_whoami, api)
+    huggingface_hub.whoami = hf_api.whoami
+    huggingface_hub.hf_api.whoami = hf_api.whoami
+
+    # Patch repocard.validate
+    from huggingface_hub import repocard
+    repocard.RepoCard.validate = lambda *args, **kwargs: None
+
+    def create_repo(self,
+                    repo_id: str,
+                    *,
+                    token: Union[str, bool, None] = None,
+                    private: bool = False,
+                    **kwargs) -> 'RepoUrl':
+        """
+        Create a new repository on the hub.
+
+        Args:
+            repo_id: The ID of the repository to create.
+            token: The authentication token to use.
+            private: Whether the repository should be private.
+            **kwargs: Additional arguments.
+
+        Returns:
+            RepoUrl: The URL of the created repository.
+        """
+        from modelscope.hub.create_model import create_model_repo
+        hub_model_id = create_model_repo(repo_id, token, private)
+        from huggingface_hub import RepoUrl
+        return RepoUrl(url=hub_model_id, )
+
+    @future_compatible
+    def upload_folder(
+            *,
+            repo_id: str,
+            folder_path: Union[str, Path],
+            path_in_repo: Optional[str] = None,
+            commit_message: Optional[str] = None,
+            commit_description: Optional[str] = None,
+            token: Union[str, bool, None] = None,
+            revision: Optional[str] = 'master',
+            ignore_patterns: Optional[Union[List[str], str]] = None,
+            **kwargs,
+    ):
+        from modelscope.hub.push_to_hub import push_model_to_hub
+        push_model_to_hub(repo_id, folder_path, path_in_repo, commit_message,
+                          commit_description, token, True, revision,
+                          ignore_patterns)
+        return CommitInfo(
+            commit_url=f'https://www.modelscope.cn/models/{repo_id}/files',
+            commit_message=commit_message,
+            commit_description=commit_description,
+            oid=None,
+        )
+
+    @future_compatible
+    def upload_file(
+            self,
+            *,
+            path_or_fileobj: Union[str, Path, bytes, BinaryIO],
+            path_in_repo: str,
+            repo_id: str,
+            token: Union[str, bool, None] = None,
+            revision: Optional[str] = None,
+            commit_message: Optional[str] = None,
+            commit_description: Optional[str] = None,
+            **kwargs,
+    ):
+        from modelscope.hub.push_to_hub import push_files_to_hub
+        push_files_to_hub(path_or_fileobj, path_in_repo, repo_id, token,
+                          revision, commit_message, commit_description)
+
+    # Patch create_repo
+    from transformers.utils import hub
+    hf_api.create_repo = MethodType(create_repo, api)
+    huggingface_hub.create_repo = hf_api.create_repo
+    huggingface_hub.hf_api.create_repo = hf_api.create_repo
+    hub.create_repo = create_repo
+
+    # Patch upload_folder
+    hf_api.upload_folder = MethodType(upload_folder, api)
+    huggingface_hub.upload_folder = hf_api.upload_folder
+    huggingface_hub.hf_api.upload_folder = hf_api.upload_folder
+
+    # Patch upload_file
+    hf_api.upload_file = MethodType(upload_file, api)
+    huggingface_hub.upload_file = hf_api.upload_file
+    huggingface_hub.hf_api.upload_file = hf_api.upload_file
+    repocard.upload_file = hf_api.upload_file
+
+
+def patch_hub():
+    _patch_hub()
+    _patch_pretrained_class()
--- a/tests/hub/test_patch_hf.py
+++ b/tests/hub/test_patch_hf.py
@@ -0,0 +1,19 @@
+import unittest
+
+from modelscope.msdatasets import MsDataset
+from modelscope.utils.test_utils import test_level
+
+
+class DownloadDatasetTest(unittest.TestCase):
+
+    def setUp(self):
+        from modelscope.utils.hf_util import patch_hub
+        patch_hub()
+
+    def test_automodel_download(self):
+        from transformers import AutoModel
+        model = AutoModel.from_pretrained('AI-ModelScope/bert-base-uncased')
+        self.assertTrue(model is not None)
+
+
+