From fbcdf62dcb5d4325982fac32404e7b1bc234c470 Mon Sep 17 00:00:00 2001 From: jiqing-feng Date: Wed, 31 Jul 2024 12:13:59 -0400 Subject: [PATCH] fix dequant 4bit weight --- bitsandbytes/backends/cpu_xpu_common.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bitsandbytes/backends/cpu_xpu_common.py b/bitsandbytes/backends/cpu_xpu_common.py index 04755ed2d..c9ff7cb6f 100644 --- a/bitsandbytes/backends/cpu_xpu_common.py +++ b/bitsandbytes/backends/cpu_xpu_common.py @@ -484,7 +484,7 @@ def dequantize_4bit_impl( out_reshaped[n - rem :] = out_dq[n - rem :] * absmax[-1] # take transpose here because weight is transposed (again) for computation - return out.t() + return out # Do not need torch.compile here as we are calling torch/ipex kernel