This commit is contained in:
John Smith 2023-03-29 01:25:37 +08:00
parent 234004ceb5
commit d28ee06202
1 changed file with 2 additions and 2 deletions

View File

@@ -108,9 +108,9 @@ def matmul4bit(x, qweight, scales, zeros, groupsize=-1):
if np.prod(x.shape[:-1]) > auto_switch_thd:
output = _matmul4bit_v1_recons(x, qweight, scales, zeros)
else:
output = _matmul4bit_v1(x, qweight, scales.float(), zeros)
output = _matmul4bit_v1(x, qweight, scales.float(), zeros.float())
else:
output = _matmul4bit_v1(x, qweight, scales.float(), zeros)
output = _matmul4bit_v1(x, qweight, scales.float(), zeros.float())
else:
# use v2
if use_new: