File tree 2 files changed +0
-3
lines changed
2 files changed +0
-3
lines changed Original file line number Diff line number Diff line change 19
19
from vllm .model_executor .layers .quantization .gptq_marlin_24 import GPTQMarlin24Config
20
20
from vllm .model_executor .layers .quantization .marlin import MarlinConfig
21
21
from vllm .model_executor .layers .quantization .qqq import QQQConfig
22
- from vllm .model_executor .layers .quantization .squeezellm import SqueezeLLMConfig
23
22
from vllm .model_executor .layers .quantization .tpu_int8 import Int8TpuConfig
24
23
25
24
from sglang .srt .layers .quantization .base_config import QuantizationConfig
39
38
"gptq_marlin" : GPTQMarlinConfig ,
40
39
"awq_marlin" : AWQMarlinConfig ,
41
40
"gptq" : GPTQConfig ,
42
- "squeezellm" : SqueezeLLMConfig ,
43
41
"compressed-tensors" : CompressedTensorsConfig ,
44
42
"bitsandbytes" : BitsAndBytesConfig ,
45
43
"qqq" : QQQConfig ,
Original file line number Diff line number Diff line change @@ -266,7 +266,6 @@ def add_cli_args(parser: argparse.ArgumentParser):
266
266
"marlin" ,
267
267
"gptq_marlin" ,
268
268
"awq_marlin" ,
269
- "squeezellm" ,
270
269
"bitsandbytes" ,
271
270
],
272
271
help = "The quantization method." ,
You can’t perform that action at this time.
0 commit comments