diff --git a/README.md b/README.md index 93b64a41..23d06ae8 100644 --- a/README.md +++ b/README.md @@ -283,7 +283,7 @@ Choose your path: | [GPT-OSS](https://huggingface.co/openai) | 20B/120B | gpt | | [Granite 3.0-3.3](https://huggingface.co/ibm-granite) | 1B/2B/3B/8B | granite3 | | [Granite 4](https://huggingface.co/ibm-granite) | 7B | granite4 | -| [Hunyuan](https://huggingface.co/tencent/) | 7B | hunyuan | +| [Hunyuan (MT)](https://huggingface.co/tencent/) | 7B | hunyuan | | [Index](https://huggingface.co/IndexTeam) | 1.9B | index | | [InternLM 2-3](https://huggingface.co/internlm) | 7B/8B/20B | intern2 | | [InternVL 2.5-3.5](https://huggingface.co/OpenGVLab) | 1B/2B/4B/8B/14B/30B/38B/78B/241B | intern_vl | diff --git a/README_zh.md b/README_zh.md index bd4351d2..4679663b 100644 --- a/README_zh.md +++ b/README_zh.md @@ -285,7 +285,7 @@ https://github.com/user-attachments/assets/43b700c6-a178-41db-b1f8-8190a5d3fcfc | [GPT-OSS](https://huggingface.co/openai) | 20B/120B | gpt | | [Granite 3.0-3.3](https://huggingface.co/ibm-granite) | 1B/2B/3B/8B | granite3 | | [Granite 4](https://huggingface.co/ibm-granite) | 7B | granite4 | -| [Hunyuan](https://huggingface.co/tencent/) | 7B | hunyuan | +| [Hunyuan (MT)](https://huggingface.co/tencent/) | 7B | hunyuan | | [Index](https://huggingface.co/IndexTeam) | 1.9B | index | | [InternLM 2-3](https://huggingface.co/internlm) | 7B/8B/20B | intern2 | | [InternVL 2.5-3.5](https://huggingface.co/OpenGVLab) | 1B/2B/4B/8B/14B/30B/38B/78B/241B | intern_vl | diff --git a/src/llamafactory/data/template.py b/src/llamafactory/data/template.py index cf607589..444064f5 100644 --- a/src/llamafactory/data/template.py +++ b/src/llamafactory/data/template.py @@ -1201,10 +1201,10 @@ register_template( register_template( name="hunyuan", - format_user=StringFormatter(slots=["<|bos|>user\n{{content}}<|eos|>\n<|bos|>assistant\n"]), - format_assistant=StringFormatter(slots=["{{content}}<|eos|>\n"]), - format_system=StringFormatter(slots=["<|bos|>system\n{{content}}<|eos|>\n"]), - format_prefix=EmptyFormatter(slots=["<|bos|>"]), + format_user=StringFormatter(slots=["{{content}}<|extra_0|>"]), + format_assistant=StringFormatter(slots=["{{content}}<|eos|>"]), + format_system=StringFormatter(slots=["{{content}}<|extra_4|>"]), + format_prefix=EmptyFormatter(slots=["<|startoftext|>"]), stop_words=["<|eos|>"], ) diff --git a/src/llamafactory/extras/constants.py b/src/llamafactory/extras/constants.py index 03587c53..a5e05119 100644 --- a/src/llamafactory/extras/constants.py +++ b/src/llamafactory/extras/constants.py @@ -1152,6 +1152,10 @@ register_model_group( DownloadSource.DEFAULT: "tencent/Hunyuan-7B-Instruct", DownloadSource.MODELSCOPE: "AI-ModelScope/Hunyuan-7B-Instruct", }, + "Hunyuan-MT-7B-Instruct": { + DownloadSource.DEFAULT: "tencent/Hunyuan-MT-7B", + DownloadSource.MODELSCOPE: "Tencent-Hunyuan/Hunyuan-MT-7B", + }, }, template="hunyuan", )