|
27 | 27 | public final class LmiConfigRecommender { |
28 | 28 |
|
29 | 29 | private static final Logger logger = LoggerFactory.getLogger(LmiConfigRecommender.class); |
30 | | - // TODO: model list is up to date with vLLM 0.4.2 |
| 30 | + // TODO: keep this model list in sync with vLLM; it is up to date as of vLLM 0.5.1 |
31 | 31 | private static final Map<String, String> MODEL_TO_ROLLING_BATCH = |
32 | 32 | Map.ofEntries( |
33 | 33 | Map.entry("falcon", "lmi-dist"), |
@@ -59,7 +59,16 @@ public final class LmiConfigRecommender { |
59 | 59 | Map.entry("qwen2_moe", "lmi-dist"), |
60 | 60 | Map.entry("stablelm", "lmi-dist"), |
61 | 61 | Map.entry("xverse", "lmi-dist"), |
62 | | - Map.entry("starcoder2", "lmi-dist")); |
| 62 | + Map.entry("starcoder2", "lmi-dist"), |
| 63 | + // entries added with the vLLM 0.5.1 update |
| 64 | + Map.entry("arctic", "lmi-dist"), |
| 65 | + Map.entry("gemma2", "lmi-dist"), |
| 66 | + Map.entry("jamba", "lmi-dist"), |
| 67 | + Map.entry("phi3small", "lmi-dist"), |
| 68 | + Map.entry("llava", "lmi-dist"), |
| 69 | + Map.entry("llava_next", "lmi-dist"), |
| 70 | + Map.entry("paligemma", "lmi-dist"), |
| 71 | + Map.entry("phi3_v", "lmi-dist")); |
63 | 72 |
|
64 | 73 | private static final Set<String> OPTIMIZED_TASK_ARCHITECTURES = |
65 | 74 | Set.of("ForCausalLM", "LMHeadModel", "ForConditionalGeneration"); |
|
0 commit comments