Fix dequantized 4-bit weight: return `out` without the extra transpose

bitsandbytes-foundation · Jul 31, 2024 · fbcdf62
1 parent d385aea
commit fbcdf62
Showing 1 changed file with 1 addition and 1 deletion.
diff --git a/bitsandbytes/backends/cpu_xpu_common.py b/bitsandbytes/backends/cpu_xpu_common.py
@@ -484,7 +484,7 @@ def dequantize_4bit_impl(
         out_reshaped[n - rem :] = out_dq[n - rem :] * absmax[-1]
 
     # take transpose here because weight is transposed (again) for computation
-    return out.t()
+    return out
 
 
 # Do not need torch.compile here as we are calling torch/ipex kernel