mirror of
https://github.com/modelscope/modelscope.git
synced 2026-02-24 12:10:09 +01:00
feat: deepseek-r1, olmo2, command-r7b, deepseek-v3
This commit is contained in:
@@ -470,6 +470,12 @@ template_info = [
|
||||
modelfile_prefix=
|
||||
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/command-r-plus',
|
||||
),
|
||||
TemplateInfo(
|
||||
template_regex=
|
||||
f'.*{cases("command-r7b")}.*',
|
||||
modelfile_prefix=
|
||||
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/command-r7b',
|
||||
),
|
||||
TemplateInfo(
|
||||
template_regex=
|
||||
f'.*{cases("command-r")}.*',
|
||||
@@ -592,10 +598,8 @@ template_info = [
|
||||
TemplateInfo(
|
||||
template=TemplateType.deepseek,
|
||||
template_regex=
|
||||
f'.*{cases("deepseek")}{no("v2", "v2.5", "coder")}{no_multi_modal()}.*{chat_suffix}.*'
|
||||
f'.*{cases("deepseek")}{no("v2", "v2.5", "v3", "r1", "coder")}{no_multi_modal()}.*{chat_suffix}.*'
|
||||
),
|
||||
|
||||
# deepseek2
|
||||
TemplateInfo(
|
||||
template=TemplateType.deepseek2,
|
||||
template_regex=
|
||||
@@ -603,19 +607,27 @@ template_info = [
|
||||
modelfile_prefix=
|
||||
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/deepseek-v2',
|
||||
),
|
||||
|
||||
# deepseek_coder
|
||||
TemplateInfo(
|
||||
template=TemplateType.deepseek_coder,
|
||||
template_regex=
|
||||
f'.*{cases("deepseek")}{no("v2", "v2.5")}.*{cases("coder")}.*{chat_suffix}.*'
|
||||
),
|
||||
|
||||
# deepseek v2.5
|
||||
TemplateInfo(
|
||||
template=TemplateType.deepseek2_5,
|
||||
template_regex=
|
||||
f'.*{cases("deepseek")}.*{cases("v2.5")}{no_multi_modal()}.*'),
|
||||
TemplateInfo(
|
||||
template_regex=
|
||||
f'.*{cases("deepseek")}.*{cases("v3")}.*',
|
||||
modelfile_prefix=
|
||||
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/deepseek-v3',
|
||||
),
|
||||
TemplateInfo(
|
||||
template_regex=
|
||||
f'.*{cases("deepseek")}.*{cases("r1")}.*',
|
||||
modelfile_prefix=
|
||||
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/deepseek-r1',
|
||||
),
|
||||
|
||||
# orion
|
||||
TemplateInfo(
|
||||
@@ -721,6 +733,13 @@ template_info = [
|
||||
modelfile_prefix=
|
||||
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/smallthinker'),
|
||||
|
||||
TemplateInfo(
|
||||
template_regex=
|
||||
f'.*{cases("olmo2", "olmo-2")}.*',
|
||||
modelfile_prefix=
|
||||
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/olmo2',
|
||||
),
|
||||
|
||||
TemplateInfo(
|
||||
template_regex=f'.*{cases("nomic-embed-text")}.*',
|
||||
modelfile_prefix=
|
||||
@@ -870,6 +889,7 @@ template_info = [
|
||||
modelfile_prefix=
|
||||
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/exaone3.5'),
|
||||
|
||||
|
||||
]
|
||||
|
||||
|
||||
|
||||
@@ -16,7 +16,7 @@ def _test_check_tmpl_type(model, tmpl_type, gguf_meta={}):
|
||||
|
||||
class TestToOllama(unittest.TestCase):
|
||||
|
||||
@unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
|
||||
@unittest.skip#Unless(test_level() >= 0, 'skip test in current test level')
|
||||
def test_load_template(self):
|
||||
template = TemplateLoader.load_by_model_id(
|
||||
'LLM-Research/Meta-Llama-3-8B-Instruct')
|
||||
@@ -86,7 +86,7 @@ class TestToOllama(unittest.TestCase):
|
||||
'LLM-Research/Phi-3-128k-instruct-GGUF')
|
||||
self.assertTrue(template.template_type == TemplateType.phi3)
|
||||
|
||||
@unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
|
||||
@unittest.skip#Unless(test_level() >= 0, 'skip test in current test level')
|
||||
def test_load_ollama(self):
|
||||
ollama = TemplateLoader.to_ollama(
|
||||
'LLM-Research/Meta-Llama-3.1-8B-Instruct-GGUF')
|
||||
@@ -365,7 +365,16 @@ class TestToOllama(unittest.TestCase):
|
||||
gguf_meta={'general.name': 'Dolphin 3.0 Llama 3.1 8B'})
|
||||
_test_check_tmpl_type(
|
||||
'AI-ModelScope/phi-4', 'phi4', gguf_meta={'general.name': 'Phi 4'})
|
||||
|
||||
_test_check_tmpl_type(
|
||||
'yasserrmd/DeepSeek-R1-Distill-Qwen-1.5B-gguf', 'deepseek-r1', gguf_meta={'general.name': 'DeepSeek R1 Distill Qwen 1.5B'})
|
||||
_test_check_tmpl_type(
|
||||
'allenai/OLMo-2-1124-7B-Instruct-GGUF', 'olmo2', gguf_meta={'general.name': 'Open_Instruct_Dev'})
|
||||
_test_check_tmpl_type(
|
||||
'bartowski/OLMo-2-1124-7B-Instruct-GGUF', 'olmo2', gguf_meta={'general.name': 'OLMo 2 1124 7B Instruct'})
|
||||
_test_check_tmpl_type(
|
||||
'bartowski/c4ai-command-r7b-12-2024-abliterated-GGUF', 'command-r7b', gguf_meta={'general.name': 'C4Ai Command R7B 12 2024'})
|
||||
_test_check_tmpl_type(
|
||||
'okwinds/DeepSeek-V3-GGUF-V3-LOT', 'deepseek-v3', gguf_meta={'general.name': 'DeepSeek V3 Bf16D'})
|
||||
|
||||
if __name__ == '__main__':
|
||||
unittest.main()
|
||||
|
||||
Reference in New Issue
Block a user