diff --git a/src/diffusers/quantizers/auto.py b/src/diffusers/quantizers/auto.py index ce214ae7bc..93691b3b53 100644 --- a/src/diffusers/quantizers/auto.py +++ b/src/diffusers/quantizers/auto.py @@ -21,9 +21,11 @@ from typing import Dict, Optional, Union from .bitsandbytes import BnB4BitDiffusersQuantizer, BnB8BitDiffusersQuantizer from .gguf import GGUFQuantizer +from .nunchaku import NunChakuQuantizer from .quantization_config import ( BitsAndBytesConfig, GGUFQuantizationConfig, + NunchakuConfig, QuantizationConfigMixin, QuantizationMethod, QuantoConfig, @@ -39,6 +41,7 @@ AUTO_QUANTIZER_MAPPING = { "gguf": GGUFQuantizer, "quanto": QuantoQuantizer, "torchao": TorchAoHfQuantizer, + "nunchaku": NunChakuQuantizer, } AUTO_QUANTIZATION_CONFIG_MAPPING = { @@ -47,6 +50,7 @@ AUTO_QUANTIZATION_CONFIG_MAPPING = { "gguf": GGUFQuantizationConfig, "quanto": QuantoConfig, "torchao": TorchAoConfig, + "nunchaku": NunchakuConfig, } diff --git a/src/diffusers/quantizers/nunchaku/__init__.py b/src/diffusers/quantizers/nunchaku/__init__.py new file mode 100644 index 0000000000..04b57f831a --- /dev/null +++ b/src/diffusers/quantizers/nunchaku/__init__.py @@ -0,0 +1 @@ +from .nunchaku_quantizer import NunChakuQuantizer