Skip to content

Commit 99d6e38

Browse files
author
Qing Lan
committed
add 0.5.1 supported models
1 parent: cb37ca0 · commit: 99d6e38

File tree

1 file changed

+11
-2
lines changed

1 file changed

+11
-2
lines changed

wlm/src/main/java/ai/djl/serving/wlm/LmiConfigRecommender.java

Lines changed: 11 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -27,7 +27,7 @@
2727
public final class LmiConfigRecommender {
2828

2929
private static final Logger logger = LoggerFactory.getLogger(LmiConfigRecommender.class);
30-
// TODO: model list is up to date with vLLM 0.4.2
30+
// TODO: model list is up to date with vLLM 0.5.1
3131
private static final Map<String, String> MODEL_TO_ROLLING_BATCH =
3232
Map.ofEntries(
3333
Map.entry("falcon", "lmi-dist"),
@@ -59,7 +59,16 @@ public final class LmiConfigRecommender {
5959
Map.entry("qwen2_moe", "lmi-dist"),
6060
Map.entry("stablelm", "lmi-dist"),
6161
Map.entry("xverse", "lmi-dist"),
62-
Map.entry("starcoder2", "lmi-dist"));
62+
Map.entry("starcoder2", "lmi-dist"),
63+
// vllm 0.5.1
64+
Map.entry("arctic", "lmi-dist"),
65+
Map.entry("gemma2", "lmi-dist"),
66+
Map.entry("jamba", "lmi-dist"),
67+
Map.entry("phi3small", "lmi-dist"),
68+
Map.entry("llava", "lmi-dist"),
69+
Map.entry("llava_next", "lmi-dist"),
70+
Map.entry("paligemma", "lmi-dist"),
71+
Map.entry("phi3_v", "lmi-dist"));
6372

6473
private static final Set<String> OPTIMIZED_TASK_ARCHITECTURES =
6574
Set.of("ForCausalLM", "LMHeadModel", "ForConditionalGeneration");

0 commit comments

Comments
 (0)