Reduce memory usage: return an empty tensor instead of `out` from the early-return branch of `quantize_4bit_impl`

bitsandbytes-foundation · Titus-von-Koeller · May 24, 2024 · May 8, 2024 · May 10, 2024 · May 11, 2024
commit dd15734709f131b4c1e3244ba28e632dbf5a3ed6
diff --git a/bitsandbytes/backends/cpu_xpu_common.py b/bitsandbytes/backends/cpu_xpu_common.py
@@ -377,6 +377,7 @@ def quantize_4bit_impl(
             int(lowp_mode),
             -1,  # act_quant_mode. -1 means don't quant activation
         )
+        return torch.Tensor(), state
 
     return out, state