We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1e2b203, commit bbc24c7 (Copy full SHA for bbc24c7)
benchmarks/measure_ppl2_MC.py
@@ -72,6 +72,8 @@ def vllm_init(args):
72
kv_cache_dtype=args.kv_cache_dtype,
73
#scales_path=args.kv_cache_scales_path
74
# if args.kv_cache_scales_path!='' else None,
75
+ quantization-param-path=args.kv_cache_scales_path
76
+ if args.kv_cache_scales_path!='' else None,
77
enforce_eager=args.enforce_eager)
78
79
sampling_params = SamplingParams(n=1,
0 commit comments