Skip to content

Commit a14c71a

Browse files
author
Qing Lan
committed
add new kernels to engine
1 parent 6550580 commit a14c71a

File tree

3 files changed

+6
-0
lines changed

3 files changed

+6
-0
lines changed

engines/python/setup/djl_python/properties_manager/hf_properties.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -24,8 +24,10 @@ class HFQuantizeMethods(str, Enum):
24 | 24 |       awq = 'awq'
25 | 25 |       deepspeedfp = 'deepspeedfp'
26 | 26 |       fp8 = 'fp8'
   | 27 | +     fbgemm_fp8 = 'fbgemm_fp8'
27 | 28 |       gptq_marlin = 'gptq_marlin'
28 | 29 |       gptq_marlin_24 = 'gptq_marlin_24'
   | 30 | +     awq_marlin = 'awq_marlin'
29 | 31 |       marlin = 'marlin'
30 | 32 |       squeezellm = 'squeezellm'
31 | 33 |

engines/python/setup/djl_python/properties_manager/lmi_dist_rb_properties.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -22,9 +22,11 @@ class LmiDistQuantizeMethods(str, Enum):
22 | 22 |       awq = 'awq'
23 | 23 |       deepspeedfp = 'deepspeedfp'
24 | 24 |       fp8 = 'fp8'
   | 25 | +     fbgemm_fp8 = 'fbgemm_fp8'
25 | 26 |       gptq = 'gptq'
26 | 27 |       gptq_marlin = 'gptq_marlin'
27 | 28 |       gptq_marlin_24 = 'gptq_marlin_24'
   | 29 | +     awq_marlin = 'awq_marlin'
28 | 30 |       marlin = 'marlin'
29 | 31 |       squeezellm = 'squeezellm'
30 | 32 |

engines/python/setup/djl_python/properties_manager/vllm_rb_properties.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -22,9 +22,11 @@ class VllmQuantizeMethods(str, Enum):
22 | 22 |       awq = 'awq'
23 | 23 |       deepspeedfp = 'deepspeedfp'
24 | 24 |       fp8 = 'fp8'
   | 25 | +     fbgemm_fp8 = 'fbgemm_fp8'
25 | 26 |       gptq = 'gptq'
26 | 27 |       gptq_marlin = 'gptq_marlin'
27 | 28 |       gptq_marlin_24 = 'gptq_marlin_24'
   | 29 | +     awq_marlin = 'awq_marlin'
28 | 30 |       marlin = 'marlin'
29 | 31 |       squeezellm = 'squeezellm'
30 | 32 |

0 commit comments

Comments
 (0)