We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5d1477a, commit d509a44. Copy full SHA for d509a44
serving/docker/partition/partition.py
@@ -35,6 +35,8 @@
35
36
ALLOW_PATTERNS = ["*.json", "*.pt", "*.bin", "*.txt"]
37
38
+WEIGHT_ONLY_QUANTIZATION_TYPES = ["static_int8"]
39
+
40
41
class PartitionService(object):
42
@@ -326,7 +328,9 @@ def main():
326
328
extract_python_jar(PYTHON_CACHE_DIR)
327
329
330
service = PartitionService(properties_manager)
- if properties_manager.properties.get('option.quantize'):
331
+ if properties_manager.properties.get(
332
+ 'option.quantize') and properties_manager.properties.get(
333
+ 'option.quantize') not in WEIGHT_ONLY_QUANTIZATION_TYPES:
334
service.run_quantization()
335
else:
336
service.run_partition()
0 commit comments