feat: new ollama template (#1199)

* feat: deepseek-r1, olmo2, command-r7b, deepseek-v3

---------

Co-authored-by: suluyan <suluyan.sly@alibaba-inc.com>
This commit is contained in:
suluyana
2025-01-21 17:49:54 +08:00
committed by GitHub
parent 58c90dee2c
commit dc7e22ebeb
2 changed files with 47 additions and 7 deletions

View File

@@ -470,6 +470,12 @@ template_info = [
modelfile_prefix=
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/command-r-plus',
),
TemplateInfo(
template_regex=
f'.*{cases("command-r7b")}.*',
modelfile_prefix=
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/command-r7b',
),
TemplateInfo(
template_regex=
f'.*{cases("command-r")}.*',
@@ -592,10 +598,8 @@ template_info = [
TemplateInfo(
template=TemplateType.deepseek,
template_regex=
-f'.*{cases("deepseek")}{no("v2", "v2.5", "coder")}{no_multi_modal()}.*{chat_suffix}.*'
+f'.*{cases("deepseek")}{no("v2", "v2.5", "v3", "r1", "coder")}{no_multi_modal()}.*{chat_suffix}.*'
),
# deepseek2
TemplateInfo(
template=TemplateType.deepseek2,
template_regex=
@@ -603,19 +607,27 @@ template_info = [
modelfile_prefix=
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/deepseek-v2',
),
# deepseek_coder
TemplateInfo(
template=TemplateType.deepseek_coder,
template_regex=
f'.*{cases("deepseek")}{no("v2", "v2.5")}.*{cases("coder")}.*{chat_suffix}.*'
),
# deepseek v2.5
TemplateInfo(
template=TemplateType.deepseek2_5,
template_regex=
f'.*{cases("deepseek")}.*{cases("v2.5")}{no_multi_modal()}.*'),
TemplateInfo(
template_regex=
f'.*{cases("deepseek")}.*{cases("v3")}.*',
modelfile_prefix=
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/deepseek-v3',
),
TemplateInfo(
template_regex=
f'.*{cases("deepseek")}.*{cases("r1")}.*',
modelfile_prefix=
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/deepseek-r1',
),
# orion
TemplateInfo(
@@ -721,6 +733,13 @@ template_info = [
modelfile_prefix=
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/smallthinker'),
TemplateInfo(
template_regex=
f'.*{cases("olmo2", "olmo-2")}.*',
modelfile_prefix=
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/olmo2',
),
TemplateInfo(
template_regex=f'.*{cases("nomic-embed-text")}.*',
modelfile_prefix=
@@ -870,6 +889,7 @@ template_info = [
modelfile_prefix=
'https://modelscope.oss-cn-beijing.aliyuncs.com/llm_template/ollama/exaone3.5'),
]

View File

@@ -365,6 +365,26 @@ class TestToOllama(unittest.TestCase):
gguf_meta={'general.name': 'Dolphin 3.0 Llama 3.1 8B'})
_test_check_tmpl_type(
'AI-ModelScope/phi-4', 'phi4', gguf_meta={'general.name': 'Phi 4'})
_test_check_tmpl_type(
'yasserrmd/DeepSeek-R1-Distill-Qwen-1.5B-gguf',
'deepseek-r1',
gguf_meta={'general.name': 'DeepSeek R1 Distill Qwen 1.5B'})
_test_check_tmpl_type(
'allenai/OLMo-2-1124-7B-Instruct-GGUF',
'olmo2',
gguf_meta={'general.name': 'Open_Instruct_Dev'})
_test_check_tmpl_type(
'bartowski/OLMo-2-1124-7B-Instruct-GGUF',
'olmo2',
gguf_meta={'general.name': 'OLMo 2 1124 7B Instruct'})
_test_check_tmpl_type(
'bartowski/c4ai-command-r7b-12-2024-abliterated-GGUF',
'command-r7b',
gguf_meta={'general.name': 'C4Ai Command R7B 12 2024'})
_test_check_tmpl_type(
'okwinds/DeepSeek-V3-GGUF-V3-LOT',
'deepseek-v3',
gguf_meta={'general.name': 'DeepSeek V3 Bf16D'})
if __name__ == '__main__':