File tree Expand file tree Collapse file tree 1 file changed +8
-2
lines changed
Expand file tree Collapse file tree 1 file changed +8
-2
lines changed
Original file line number | Diff line number | Diff line change
@@ -130,7 +130,10 @@ def quantize(self, model):
130 130
131 131
132 132   # int4 weight-only
133     - Int4WeightOnlyQATQuantizerModuleSwap = Int4WeightOnlyQATQuantizer
    133 + class Int4WeightOnlyQATQuantizerModuleSwap(Int4WeightOnlyQATQuantizer):
    134 +     pass
    135 +
    136 +
134 137   disable_4w_fake_quant_module_swap = disable_4w_fake_quant
135 138   enable_4w_fake_quant_module_swap = enable_4w_fake_quant
136 139   _quantizer_to_mode[Int4WeightOnlyQATQuantizerModuleSwap] = "4w-qat-module-swap"
@@ -142,7 +145,10 @@ def quantize(self, model):
142 145   ] = enable_4w_fake_quant_module_swap
143 146
144 147   # int8 dynamic activations + int4 weight
145     - Int8DynActInt4WeightQATQuantizerModuleSwap = Int8DynActInt4WeightQATQuantizer
    148 + class Int8DynActInt4WeightQATQuantizerModuleSwap(Int8DynActInt4WeightQATQuantizer):
    149 +     pass
    150 +
    151 +
146 152   disable_8da4w_fake_quant_module_swap = disable_8da4w_fake_quant
147 153   enable_8da4w_fake_quant_module_swap = enable_8da4w_fake_quant
148 154   _quantizer_to_mode[Int8DynActInt4WeightQATQuantizerModuleSwap] = "8da4w-qat-module-swap"
You can’t perform that action at this time.
0 commit comments