File tree Expand file tree Collapse file tree 3 files changed +6
-0
lines changed Expand file tree Collapse file tree 3 files changed +6
-0
lines changed Original file line number Diff line number Diff line change 217
217
| [Qwen/Qwen3-235B-A22B-Instruct-2507](https://modelscope.cn/models/Qwen/Qwen3-235B-A22B-Instruct-2507) | qwen3_moe| qwen3| transformers>=4.51| ✔ | -| [Qwen/Qwen3-235B-A22B-Instruct-2507](https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507) |
218
218
| [Qwen/Qwen3-235B-A22B-Instruct-2507-FP8](https://modelscope.cn/models/Qwen/Qwen3-235B-A22B-Instruct-2507-FP8) | qwen3_moe| qwen3| transformers>=4.51| ✘ | -| [Qwen/Qwen3-235B-A22B-Instruct-2507-FP8](https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507-FP8) |
219
219
| [swift/Qwen3-235B-A22B-Instruct-2507-AWQ](https://modelscope.cn/models/swift/Qwen3-235B-A22B-Instruct-2507-AWQ) | qwen3_moe| qwen3| transformers>=4.51| ✘ | -| -|
220
+ | [Qwen/Qwen3-Coder-30B-A3B-Instruct](https://modelscope.cn/models/Qwen/Qwen3-Coder-30B-A3B-Instruct) | qwen3_moe| qwen3| transformers>=4.51| ✔ | coding| [Qwen/Qwen3-Coder-30B-A3B-Instruct](https://huggingface.co/Qwen/Qwen3-Coder-30B-A3B-Instruct) |
221
+ | [Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8](https://modelscope.cn/models/Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8) | qwen3_moe| qwen3| transformers>=4.51| ✘ | coding| [Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8](https://huggingface.co/Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8) |
220
222
| [Qwen/Qwen3-Coder-480B-A35B-Instruct](https://modelscope.cn/models/Qwen/Qwen3-Coder-480B-A35B-Instruct) | qwen3_moe| qwen3| transformers>=4.51| ✔ | coding| [Qwen/Qwen3-Coder-480B-A35B-Instruct](https://huggingface.co/Qwen/Qwen3-Coder-480B-A35B-Instruct) |
221
223
| [Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8](https://modelscope.cn/models/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8) | qwen3_moe| qwen3| transformers>=4.51| ✘ | coding| [Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8](https://huggingface.co/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8) |
222
224
| [swift/Qwen3-Coder-480B-A35B-Instruct-AWQ](https://modelscope.cn/models/swift/Qwen3-Coder-480B-A35B-Instruct-AWQ) | qwen3_moe| qwen3| transformers>=4.51| ✘ | coding| -|
Original file line number Diff line number Diff line change @@ -217,6 +217,8 @@ The table below introduces the models integrated with ms-swift:
217
217
| [Qwen/Qwen3-235B-A22B-Instruct-2507](https://modelscope.cn/models/Qwen/Qwen3-235B-A22B-Instruct-2507) | qwen3_moe| qwen3| transformers>=4.51| ✔ | -| [Qwen/Qwen3-235B-A22B-Instruct-2507](https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507) |
218
218
| [Qwen/Qwen3-235B-A22B-Instruct-2507-FP8](https://modelscope.cn/models/Qwen/Qwen3-235B-A22B-Instruct-2507-FP8) | qwen3_moe| qwen3| transformers>=4.51| ✘ | -| [Qwen/Qwen3-235B-A22B-Instruct-2507-FP8](https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507-FP8) |
219
219
| [swift/Qwen3-235B-A22B-Instruct-2507-AWQ](https://modelscope.cn/models/swift/Qwen3-235B-A22B-Instruct-2507-AWQ) | qwen3_moe| qwen3| transformers>=4.51| ✘ | -| -|
220
+ | [Qwen/Qwen3-Coder-30B-A3B-Instruct](https://modelscope.cn/models/Qwen/Qwen3-Coder-30B-A3B-Instruct) | qwen3_moe| qwen3| transformers>=4.51| ✔ | coding| [Qwen/Qwen3-Coder-30B-A3B-Instruct](https://huggingface.co/Qwen/Qwen3-Coder-30B-A3B-Instruct) |
221
+ | [Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8](https://modelscope.cn/models/Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8) | qwen3_moe| qwen3| transformers>=4.51| ✘ | coding| [Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8](https://huggingface.co/Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8) |
220
222
| [Qwen/Qwen3-Coder-480B-A35B-Instruct](https://modelscope.cn/models/Qwen/Qwen3-Coder-480B-A35B-Instruct) | qwen3_moe| qwen3| transformers>=4.51| ✔ | coding| [Qwen/Qwen3-Coder-480B-A35B-Instruct](https://huggingface.co/Qwen/Qwen3-Coder-480B-A35B-Instruct) |
221
223
| [Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8](https://modelscope.cn/models/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8) | qwen3_moe| qwen3| transformers>=4.51| ✘ | coding| [Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8](https://huggingface.co/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8) |
222
224
| [swift/Qwen3-Coder-480B-A35B-Instruct-AWQ](https://modelscope.cn/models/swift/Qwen3-Coder-480B-A35B-Instruct-AWQ) | qwen3_moe| qwen3| transformers>=4.51| ✘ | coding| -|
Original file line number Diff line number Diff line change @@ -561,6 +561,8 @@ def _get_cast_dtype(self) -> torch.dtype:
561
561
Model ('swift/Qwen3-235B-A22B-Instruct-2507-AWQ' ),
562
562
]),
563
563
ModelGroup ([
564
+ Model ('Qwen/Qwen3-Coder-30B-A3B-Instruct' , 'Qwen/Qwen3-Coder-30B-A3B-Instruct' ),
565
+ Model ('Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8' , 'Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8' ),
564
566
Model ('Qwen/Qwen3-Coder-480B-A35B-Instruct' , 'Qwen/Qwen3-Coder-480B-A35B-Instruct' ),
565
567
Model ('Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8' , 'Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8' ),
566
568
Model ('swift/Qwen3-Coder-480B-A35B-Instruct-AWQ' ),
You can’t perform that action at this time.
0 commit comments