File tree 5 files changed +6
-12
lines changed
5 files changed +6
-12
lines changed Original file line number Diff line number Diff line change @@ -227,7 +227,7 @@ def main(
227
227
if "spinquant" in quantization :
228
228
from torchao .prototype .spinquant import apply_spinquant
229
229
apply_spinquant (model )
230
- elif "int8wo" in quantization :
230
+ if "int8wo" in quantization :
231
231
quantize_ (model , int8_weight_only ())
232
232
elif "int8dq" in quantization :
233
233
quantize_ (model , int8_dynamic_activation_int8_weight ())
Original file line number Diff line number Diff line change 33
33
benchmark_model ,
34
34
)
35
35
36
- from .granularity import (
36
+ from torchao . quantization .granularity import (
37
37
PerRow ,
38
38
PerTensor ,
39
39
)
40
- from .subclass import ( # noqa
40
+ from torchao . quantization .subclass import ( # noqa
41
41
Int8DynamicallyQuantizedLinearWeight ,
42
42
Int8WeightOnlyQuantizedLinearWeight ,
43
43
QuantizedLinearWeightBase ,
File renamed without changes.
Original file line number Diff line number Diff line change 15
15
OTHER_AUTOQUANT_CLASS_LIST ,
16
16
autoquant ,
17
17
)
18
- from .autoquant_v2 import (
18
+ from torchao . prototype . quantization .autoquant_v2 import (
19
19
DEFAULT_AUTOQUANT_CLASS_LIST as V2_DEFAULT_AUTOQUANT_CLASS_LIST ,
20
- )
21
- from .autoquant_v2 import (
22
20
DEFAULT_INT4_AUTOQUANT_CLASS_LIST as V2_DEFAULT_INT4_AUTOQUANT_CLASS_LIST ,
23
- )
24
- from .autoquant_v2 import (
25
21
OTHER_AUTOQUANT_CLASS_LIST as V2_OTHER_AUTOQUANT_CLASS_LIST ,
26
- )
27
- from .autoquant_v2 import (
28
22
autoquant_v2 as _autoquant_v2 ,
29
23
)
30
24
from .GPTQ import (
Original file line number Diff line number Diff line change 54
54
)
55
55
56
56
from .autoquant import AutoQuantizableLinearWeight , autoquant
57
- from .autoquant_v2 import AutoQuantizableLinearWeight as AutoQuantizableLinearWeightV2
58
- from .autoquant_v2 import autoquant_v2
57
+ from torchao . prototype . quantization .autoquant_v2 import AutoQuantizableLinearWeight as AutoQuantizableLinearWeightV2
58
+ from torchao . prototype . quantization .autoquant_v2 import autoquant_v2
59
59
from .GPTQ import (
60
60
Int4WeightOnlyGPTQQuantizer ,
61
61
Int4WeightOnlyQuantizer ,
You can’t perform that action at this time.
0 commit comments