diff --git a/builder/requirements.txt b/builder/requirements.txt index 4a6b137..0de7524 100644 --- a/builder/requirements.txt +++ b/builder/requirements.txt @@ -9,3 +9,4 @@ pydantic pydantic-settings hf-transfer transformers +bitsandbytes>=0.44.0 diff --git a/worker-config.json b/worker-config.json index c150314..5c5d5b2 100644 --- a/worker-config.json +++ b/worker-config.json @@ -564,7 +564,8 @@ { "value": "None", "label": "None" }, { "value": "awq", "label": "AWQ" }, { "value": "squeezellm", "label": "SqueezeLLM" }, - { "value": "gptq", "label": "GPTQ" } + { "value": "gptq", "label": "GPTQ" }, + { "value": "bitsandbytes", "label": "BitsAndBytes" } ] }, "ROPE_SCALING": {