1 file changed: +4 -2 lines changed.
Diff columns: original file line number | diff line number | diff line change
69
69
70
70
71
71
def model_is_embedding (model_name : str , trust_remote_code : bool ,
72
- quantization : Optional [str ]) -> bool :
72
+ quantization : Optional [str ],
73
+ revision : Optional [str ]) -> bool :
73
74
return ModelConfig (model = model_name ,
75
+ revision = revision ,
74
76
tokenizer = model_name ,
75
77
tokenizer_mode = "auto" ,
76
78
trust_remote_code = trust_remote_code ,
@@ -130,7 +132,7 @@ async def build_async_engine_client_from_engine_args(
130
132
# If manually triggered or embedding model, use AsyncLLMEngine in process.
131
133
# TODO: support embedding model via RPC.
132
134
if (model_is_embedding (engine_args .model , engine_args .trust_remote_code ,
133
- engine_args .quantization )
135
+ engine_args .quantization , engine_args . revision )
134
136
or disable_frontend_multiprocessing ):
135
137
engine_client = AsyncLLMEngine .from_engine_args (
136
138
engine_args , usage_context = UsageContext .OPENAI_API_SERVER )
You can’t perform that action at this time.
0 commit comments