|
|
@@ -92,6 +92,15 @@ ema_fakequant_qconfig = QConfig( |
|
|
|
act_fake_quant=partial(FakeQuantize, dtype="qint8", narrow_range=False), |
|
|
|
) |
|
|
|
|
|
|
|
# Low-bit counterpart of the fake-quant configs in this module: every
# component below is built with dtype "qint4" and narrow_range=False.
# Weights are observed with MinMaxObserver, activations with
# ExponentialMovingAverageObserver, and both go through FakeQuantize.
ema_lowbit_fakequant_qconfig = QConfig(
    weight_observer=partial(
        MinMaxObserver,
        dtype="qint4",
        narrow_range=False,
    ),
    act_observer=partial(
        ExponentialMovingAverageObserver,
        dtype="qint4",
        narrow_range=False,
    ),
    weight_fake_quant=partial(
        FakeQuantize,
        dtype="qint4",
        narrow_range=False,
    ),
    act_fake_quant=partial(
        FakeQuantize,
        dtype="qint4",
        narrow_range=False,
    ),
)
|
|
|
|
|
|
|
calibration_qconfig = QConfig( |
|
|
|
weight_observer=partial(MinMaxObserver, dtype="qint8", narrow_range=True), |
|
|
|
act_observer=partial(HistogramObserver, dtype="qint8", narrow_range=False), |
|
|
|