Move autoquant_v2 to the prototype folder

jerryzh168 · jerryzh168 · commit 831107fa813b · 2024-11-19T18:49:40.000-08:00
diff --git a/torchao/_models/llama/generate.py b/torchao/_models/llama/generate.py
@@ -227,7 +227,7 @@ def main(
         if "spinquant" in quantization:
             from torchao.prototype.spinquant import apply_spinquant
             apply_spinquant(model)
-        elif "int8wo" in quantization:
+        if "int8wo" in quantization:
             quantize_(model, int8_weight_only())
         elif "int8dq" in quantization:
             quantize_(model, int8_dynamic_activation_int8_weight())
diff --git a/torchao/prototype/quantization/autoquant_v2.py b/torchao/prototype/quantization/autoquant_v2.py
@@ -33,11 +33,11 @@
     benchmark_model,
 )
 
-from .granularity import (
+from torchao.quantization.granularity import (
     PerRow,
     PerTensor,
 )
-from .subclass import (  # noqa
+from torchao.quantization.subclass import (  # noqa
     Int8DynamicallyQuantizedLinearWeight,
     Int8WeightOnlyQuantizedLinearWeight,
     QuantizedLinearWeightBase,
diff --git a/torchao/prototype/quantization/subgraph_utils/extract_subgraphs.py b/torchao/prototype/quantization/subgraph_utils/extract_subgraphs.py
diff --git a/torchao/quantization/__init__.py b/torchao/quantization/__init__.py
@@ -15,16 +15,10 @@
     OTHER_AUTOQUANT_CLASS_LIST,
     autoquant,
 )
-from .autoquant_v2 import (
+from torchao.prototype.quantization.autoquant_v2 import (
     DEFAULT_AUTOQUANT_CLASS_LIST as V2_DEFAULT_AUTOQUANT_CLASS_LIST,
-)
-from .autoquant_v2 import (
     DEFAULT_INT4_AUTOQUANT_CLASS_LIST as V2_DEFAULT_INT4_AUTOQUANT_CLASS_LIST,
-)
-from .autoquant_v2 import (
     OTHER_AUTOQUANT_CLASS_LIST as V2_OTHER_AUTOQUANT_CLASS_LIST,
-)
-from .autoquant_v2 import (
     autoquant_v2 as _autoquant_v2,
 )
 from .GPTQ import (
diff --git a/torchao/quantization/quant_api.py b/torchao/quantization/quant_api.py
@@ -54,8 +54,8 @@
 )
 
 from .autoquant import AutoQuantizableLinearWeight, autoquant
-from .autoquant_v2 import AutoQuantizableLinearWeight as AutoQuantizableLinearWeightV2
-from .autoquant_v2 import autoquant_v2
+from torchao.prototype.quantization.autoquant_v2 import AutoQuantizableLinearWeight as AutoQuantizableLinearWeightV2
+from torchao.prototype.quantization.autoquant_v2 import autoquant_v2
 from .GPTQ import (
     Int4WeightOnlyGPTQQuantizer,
     Int4WeightOnlyQuantizer,

Original file line number	Diff line number	Diff line change
`@@ -33,11 +33,11 @@`
`33`	`33`	`benchmark_model,`
`34`	`34`	`)`
`35`	`35`
`36`		`-from .granularity import (`
	`36`	`+from torchao.quantization.granularity import (`
`37`	`37`	`PerRow,`
`38`	`38`	`PerTensor,`
`39`	`39`	`)`
`40`		`-from .subclass import ( # noqa`
	`40`	`+from torchao.quantization.subclass import ( # noqa`
`41`	`41`	`Int8DynamicallyQuantizedLinearWeight,`
`42`	`42`	`Int8WeightOnlyQuantizedLinearWeight,`
`43`	`43`	`QuantizedLinearWeightBase,`