File tree Expand file tree Collapse file tree 6 files changed +31
-0
lines changed Expand file tree Collapse file tree 6 files changed +31
-0
lines changed Original file line number Diff line number Diff line change 547
547
| [XiaomiMiMo/MiMo-7B-RL-Zero](https://modelscope.cn/models/XiaomiMiMo/MiMo-7B-RL-Zero) | mimo | qwen | transformers>=4.37 | &#x2718; | - | [XiaomiMiMo/MiMo-7B-RL-Zero](https://huggingface.co/XiaomiMiMo/MiMo-7B-RL-Zero) |
548
548
| [XiaomiMiMo/MiMo-7B-RL](https://modelscope.cn/models/XiaomiMiMo/MiMo-7B-RL) | mimo | qwen | transformers>=4.37 | &#x2718; | - | [XiaomiMiMo/MiMo-7B-RL](https://huggingface.co/XiaomiMiMo/MiMo-7B-RL) |
549
549
| [XiaomiMiMo/MiMo-7B-RL-0530](https://modelscope.cn/models/XiaomiMiMo/MiMo-7B-RL-0530) | mimo_rl | mimo_rl | transformers>=4.37 | &#x2718; | - | [XiaomiMiMo/MiMo-7B-RL-0530](https://huggingface.co/XiaomiMiMo/MiMo-7B-RL-0530) |
550
+ | [rednote-hilab/dots.llm1.base](https://modelscope.cn/models/rednote-hilab/dots.llm1.base) | dots1 | dots1 | transformers>=4.53.0.dev0 | &#x2718; | - | [rednote-hilab/dots.llm1.base](https://huggingface.co/rednote-hilab/dots.llm1.base) |
551
+ | [rednote-hilab/dots.llm1.inst](https://modelscope.cn/models/rednote-hilab/dots.llm1.inst) | dots1 | dots1 | transformers>=4.53.0.dev0 | &#x2718; | - | [rednote-hilab/dots.llm1.inst](https://huggingface.co/rednote-hilab/dots.llm1.inst) |
550
552
| [answerdotai/ModernBERT-base](https://modelscope.cn/models/answerdotai/ModernBERT-base) | modern_bert | dummy | transformers>=4.48 | &#x2718; | bert | [answerdotai/ModernBERT-base](https://huggingface.co/answerdotai/ModernBERT-base) |
551
553
| [answerdotai/ModernBERT-large](https://modelscope.cn/models/answerdotai/ModernBERT-large) | modern_bert | dummy | transformers>=4.48 | &#x2718; | bert | [answerdotai/ModernBERT-large](https://huggingface.co/answerdotai/ModernBERT-large) |
552
554
| [iic/gte-modernbert-base](https://modelscope.cn/models/iic/gte-modernbert-base) | modern_bert_gte | dummy | transformers>=4.48 | &#x2718; | bert, embedding | [Alibaba-NLP/gte-modernbert-base](https://huggingface.co/Alibaba-NLP/gte-modernbert-base) |
Original file line number Diff line number Diff line change @@ -547,6 +547,8 @@ The table below introduces the models integrated with ms-swift:
547
547
| [XiaomiMiMo/MiMo-7B-RL-Zero](https://modelscope.cn/models/XiaomiMiMo/MiMo-7B-RL-Zero) | mimo | qwen | transformers>=4.37 | &#x2718; | - | [XiaomiMiMo/MiMo-7B-RL-Zero](https://huggingface.co/XiaomiMiMo/MiMo-7B-RL-Zero) |
548
548
| [XiaomiMiMo/MiMo-7B-RL](https://modelscope.cn/models/XiaomiMiMo/MiMo-7B-RL) | mimo | qwen | transformers>=4.37 | &#x2718; | - | [XiaomiMiMo/MiMo-7B-RL](https://huggingface.co/XiaomiMiMo/MiMo-7B-RL) |
549
549
| [XiaomiMiMo/MiMo-7B-RL-0530](https://modelscope.cn/models/XiaomiMiMo/MiMo-7B-RL-0530) | mimo_rl | mimo_rl | transformers>=4.37 | &#x2718; | - | [XiaomiMiMo/MiMo-7B-RL-0530](https://huggingface.co/XiaomiMiMo/MiMo-7B-RL-0530) |
550
+ | [rednote-hilab/dots.llm1.base](https://modelscope.cn/models/rednote-hilab/dots.llm1.base) | dots1 | dots1 | transformers>=4.53.0.dev0 | &#x2718; | - | [rednote-hilab/dots.llm1.base](https://huggingface.co/rednote-hilab/dots.llm1.base) |
551
+ | [rednote-hilab/dots.llm1.inst](https://modelscope.cn/models/rednote-hilab/dots.llm1.inst) | dots1 | dots1 | transformers>=4.53.0.dev0 | &#x2718; | - | [rednote-hilab/dots.llm1.inst](https://huggingface.co/rednote-hilab/dots.llm1.inst) |
550
552
| [answerdotai/ModernBERT-base](https://modelscope.cn/models/answerdotai/ModernBERT-base) | modern_bert | dummy | transformers>=4.48 | &#x2718; | bert | [answerdotai/ModernBERT-base](https://huggingface.co/answerdotai/ModernBERT-base) |
551
553
| [answerdotai/ModernBERT-large](https://modelscope.cn/models/answerdotai/ModernBERT-large) | modern_bert | dummy | transformers>=4.48 | &#x2718; | bert | [answerdotai/ModernBERT-large](https://huggingface.co/answerdotai/ModernBERT-large) |
552
554
| [iic/gte-modernbert-base](https://modelscope.cn/models/iic/gte-modernbert-base) | modern_bert_gte | dummy | transformers>=4.48 | &#x2718; | bert, embedding | [Alibaba-NLP/gte-modernbert-base](https://huggingface.co/Alibaba-NLP/gte-modernbert-base) |
Original file line number Diff line number Diff line change @@ -116,6 +116,7 @@ class LLMModelType:
116
116
moonlight = 'moonlight'
117
117
mimo = 'mimo'
118
118
mimo_rl = 'mimo_rl'
119
+ dots1 = 'dots1'
119
120
120
121
121
122
class BertModelType :
Original file line number Diff line number Diff line change @@ -328,3 +328,18 @@ def forward(self, **kwargs):
328
328
model_arch = ModelArch .llama ,
329
329
architectures = ['MiMoForCausalLM' ],
330
330
requires = ['transformers>=4.37' ]))
331
+
332
# Register the `dots1` model type: the rednote-hilab dots.llm1 base and
# instruct checkpoints, paired with the `dots1` chat template and loaded via
# `get_model_tokenizer_with_flash_attn`.
register_model(
    ModelMeta(
        LLMModelType.dots1,
        [
            ModelGroup([
                # NOTE(review): both arguments are the same repo id —
                # presumably (ModelScope id, Hugging Face id), matching the
                # two hub links in the supported-models table; confirm
                # against `Model`'s signature.
                Model('rednote-hilab/dots.llm1.base', 'rednote-hilab/dots.llm1.base'),
                Model('rednote-hilab/dots.llm1.inst', 'rednote-hilab/dots.llm1.inst'),
            ])
        ],
        TemplateType.dots1,
        get_model_tokenizer_with_flash_attn,
        architectures=['Dots1ForCausalLM'],
        # A development build of transformers is the declared minimum here.
        requires=['transformers>=4.53.0.dev0'],
    ))
Original file line number Diff line number Diff line change @@ -82,6 +82,7 @@ class LLMTemplateType:
82
82
orion = 'orion'
83
83
moonlight = 'moonlight'
84
84
mimo_rl = 'mimo_rl'
85
+ dots1 = 'dots1'
85
86
86
87
aya = 'aya'
87
88
c4ai = 'c4ai'
Original file line number Diff line number Diff line change @@ -279,3 +279,13 @@ class TeleChatTemplateMeta(TemplateMeta):
279
279
LLMTemplateType .mimo_rl ,
280
280
default_system = 'You are MiMo, an AI assistant developed by Xiaomi.' ,
281
281
))
282
+
283
# Register the `dots1` chat template. The system prompt is wrapped in
# <|system|>...<|endofsystem|>, each user query in
# <|userprompt|>...<|endofuserprompt|> followed by the <|response|> opener,
# and <|endofresponse|> serves as both the turn separator and the suffix.
register_template(
    TemplateMeta(
        LLMTemplateType.dots1,
        prefix=['<|system|>{{SYSTEM}}<|endofsystem|>'],
        prompt=['<|userprompt|>{{QUERY}}<|endofuserprompt|><|response|>'],
        chat_sep=['<|endofresponse|>'],
        suffix=['<|endofresponse|>'],
        default_system='You are a helpful assistant.',
    ))
You can’t perform that action at this time.
0 commit comments