We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7aace7d, commit faca3a3 (Copy full SHA for faca3a3)
fastchat/serve/vllm_worker.py
@@ -192,6 +192,7 @@ async def api_model_details(request: Request):
192
"--controller-address", type=str, default="http://localhost:21001"
193
)
194
parser.add_argument("--model-path", type=str, default="lmsys/vicuna-7b-v1.3")
195
+ parser.add_argument("--quantization", type=str)
196
parser.add_argument(
197
"--model-names",
198
type=lambda s: s.split(","),
0 commit comments