Skip to content

Commit 974f4d1

Browse files
Qing Lan authored
Add vLLM 0.5.1 supported models (#2151)
1 parent cb37ca0 commit 974f4d1

File tree

3 files changed: +14 -3 lines changed

3 files changed: +14 -3 lines changed

tests/integration/llm/download_llm.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -12,9 +12,11 @@ def llm_download(model_id, token, allow_patterns):
1212
"*.json", "*.pt", "*.safetensors", "*.txt", "*.model", "*.tiktoken"
1313
]
1414

15+
ignore_patterns = [".git*"]
1516
snapshot_download(repo_id=model_id,
1617
local_dir=local_model_path,
1718
allow_patterns=allow_patterns,
19+
ignore_patterns=ignore_patterns,
1820
token=token)
1921

2022

tests/integration/llm/prepare.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -766,7 +766,7 @@
766766
"option.model_id": "s3://djl-llm/llama-2-70b-hf/",
767767
},
768768
"codellama-34b-aiccl": {
769-
"option.model_id": "codellama/CodeLlama-34b-hf",
769+
"option.model_id": "s3://djl-llm/CodeLlama-34b-Instruct-hf/",
770770
},
771771
"falcon-40b-aiccl": {
772772
"option.model_id": "s3://djl-llm/falcon-40b/",

wlm/src/main/java/ai/djl/serving/wlm/LmiConfigRecommender.java

Lines changed: 11 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@
2727
public final class LmiConfigRecommender {
2828

2929
private static final Logger logger = LoggerFactory.getLogger(LmiConfigRecommender.class);
30-
// TODO: model list is up to date with vLLM 0.4.2
30+
// TODO: model list is up to date with vLLM 0.5.1
3131
private static final Map<String, String> MODEL_TO_ROLLING_BATCH =
3232
Map.ofEntries(
3333
Map.entry("falcon", "lmi-dist"),
@@ -59,7 +59,16 @@ public final class LmiConfigRecommender {
5959
Map.entry("qwen2_moe", "lmi-dist"),
6060
Map.entry("stablelm", "lmi-dist"),
6161
Map.entry("xverse", "lmi-dist"),
62-
Map.entry("starcoder2", "lmi-dist"));
62+
Map.entry("starcoder2", "lmi-dist"),
63+
// vllm 0.5.1
64+
Map.entry("arctic", "lmi-dist"),
65+
Map.entry("gemma2", "lmi-dist"),
66+
Map.entry("jamba", "lmi-dist"),
67+
Map.entry("phi3small", "lmi-dist"),
68+
Map.entry("llava", "lmi-dist"),
69+
Map.entry("llava_next", "lmi-dist"),
70+
Map.entry("paligemma", "lmi-dist"),
71+
Map.entry("phi3_v", "lmi-dist"));
6372

6473
private static final Set<String> OPTIMIZED_TASK_ARCHITECTURES =
6574
Set.of("ForCausalLM", "LMHeadModel", "ForConditionalGeneration");

0 commit comments

Comments (0)