We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1929ecd, commit 12f8034 (Copy full SHA for 12f8034)
convert_hf_to_gguf.py
@@ -8943,6 +8943,13 @@ def set_vocab(self):
8943
class GptOssModel(TextModel):
8944
model_arch = gguf.MODEL_ARCH.GPT_OSS
8945
8946
+ # TODO: remove once MXFP4 is supported more generally
8947
+ def dequant_model(self):
8948
+ quant_config = self.hparams.get("quantization_config")
8949
+ if quant_config is not None and quant_config.get("quant_method") == "mxfp4":
8950
+ return
8951
+ return super().dequant_model()
8952
+
8953
def transform_nibble_layout(self, tensor):
8954
assert tensor.dtype == torch.uint8
8955
assert tensor.shape[-1] == 16
0 commit comments