Skip to content

Commit 3ff6411

Browse files
authored
Remove references to squeezellm (#1603)
1 parent 2b302b9 commit 3ff6411

File tree

2 files changed

+0
-3
lines changed

2 files changed

+0
-3
lines changed

python/sglang/srt/layers/quantization/__init__.py

-2
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,6 @@
19 19   from vllm.model_executor.layers.quantization.gptq_marlin_24 import GPTQMarlin24Config
20 20   from vllm.model_executor.layers.quantization.marlin import MarlinConfig
21 21   from vllm.model_executor.layers.quantization.qqq import QQQConfig
22    - from vllm.model_executor.layers.quantization.squeezellm import SqueezeLLMConfig
23 22   from vllm.model_executor.layers.quantization.tpu_int8 import Int8TpuConfig
24 23
25 24   from sglang.srt.layers.quantization.base_config import QuantizationConfig
@@ -39,7 +38,6 @@
39 38   "gptq_marlin": GPTQMarlinConfig,
40 39   "awq_marlin": AWQMarlinConfig,
41 40   "gptq": GPTQConfig,
42    - "squeezellm": SqueezeLLMConfig,
43 41   "compressed-tensors": CompressedTensorsConfig,
44 42   "bitsandbytes": BitsAndBytesConfig,
45 43   "qqq": QQQConfig,

python/sglang/srt/server_args.py

-1
Original file line number | Diff line number | Diff line change
@@ -266,7 +266,6 @@ def add_cli_args(parser: argparse.ArgumentParser):
266 266   "marlin",
267 267   "gptq_marlin",
268 268   "awq_marlin",
269     - "squeezellm",
270 269   "bitsandbytes",
271 270   ],
272 271   help="The quantization method.",

0 commit comments

Comments
 (0)