2323
2424from .. import __version__
2525from ..quantizers import DiffusersAutoQuantizer
26+ from ..quantizers .quantization_config import NunchakuConfig
2627from ..utils import deprecate , is_accelerate_available , is_torch_version , logging
2728from ..utils .torch_utils import empty_device_cache
2829from .single_file_utils import (
@@ -442,6 +443,7 @@ def from_single_file(cls, pretrained_model_link_or_path_or_dict: Optional[str] =
442443 )
443444
444445 # This step is better off here than above because `diffusers_format_checkpoint` holds the keys we expect.
446+ # The block below could also be moved into a separate helper function.
445447 if quantization_config is not None :
446448 original_modules_to_not_convert = quantization_config .modules_to_not_convert or []
447449 determined_modules_to_not_convert = _maybe_determine_modules_to_not_convert (
@@ -450,12 +452,15 @@ def from_single_file(cls, pretrained_model_link_or_path_or_dict: Optional[str] =
450452 if determined_modules_to_not_convert :
451453 determined_modules_to_not_convert .extend (original_modules_to_not_convert )
452454 determined_modules_to_not_convert = list (set (determined_modules_to_not_convert ))
453- logger .info (
455+ logger .debug (
454456 f"`modules_to_not_convert` in the quantization_config was updated from { quantization_config .modules_to_not_convert } to { determined_modules_to_not_convert } ."
455457 )
456- quantization_config .modules_to_not_convert = original_modules_to_not_convert
457- # Update the `quant_config`.
458- hf_quantizer .quantization_config = quantization_config
458+ modified_quant_config = quantization_config .to_dict ()
459+ modified_quant_config ["modules_to_not_convert" ] = determined_modules_to_not_convert
460+ # TODO: figure out a better way; this hard-codes `NunchakuConfig` regardless of the class of `quantization_config`.
461+ modified_quant_config = NunchakuConfig .from_dict (modified_quant_config )
462+ setattr (hf_quantizer , "quantization_config" , modified_quant_config )
463+ logger .debug ("TODO" )
459464
460465 # Check if `_keep_in_fp32_modules` is not None
461466 use_keep_in_fp32_modules = (cls ._keep_in_fp32_modules is not None ) and (
0 commit comments