From 4976889d556063b19216e6241d15759bccb686ed Mon Sep 17 00:00:00 2001 From: Florian Zimmermeister Date: Thu, 4 Jan 2024 09:22:02 +0100 Subject: [PATCH] fix cli --- server/lorax_server/cli.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/server/lorax_server/cli.py b/server/lorax_server/cli.py index 987f0096c..e55f7d556 100644 --- a/server/lorax_server/cli.py +++ b/server/lorax_server/cli.py @@ -17,6 +17,9 @@ class Quantization(str, Enum): bitsandbytes_fp4 = "bitsandbytes-fp4" gptq = "gptq" awq = "awq" + hqq_4bit = "hqq-4bit" + hqq_3bit = "hqq-3bit" + hqq_2bit = "hqq-2bit" class Dtype(str, Enum):