Update autograd_4bit.py

2023-03-18 22:13:11 +08:00 · 2023-03-18 22:13:11 +08:00 · 2b84b32fbe
parent 6f4bbb40a9
commit 2b84b32fbe
1 changed files with 0 additions and 2 deletions
--- a/GPTQ-for-LLaMa/autograd_4bit.py
+++ b/GPTQ-for-LLaMa/autograd_4bit.py
@ -17,7 +17,6 @@ def matmul4bit(x, qweight, scales, zeros):
    assert qweight.shape[0] * 8 == x.shape[-1]
    outshape = tuple(list(x.shape[:-1]) + [qweight.shape[1]])
    x = x.reshape(-1, x.shape[-1])
-    assert x.shape[0] % 256 == 0
    y = torch.zeros((x.shape[0], qweight.shape[-1]), dtype=torch.float32, device=x.device)
    dtype = x.dtype
    x = x.float()
@ -39,7 +38,6 @@ def matmul4bit_transpose(x, qweight, scales, zeros):
    assert qweight.shape[1] == x.shape[-1]
    outshape = tuple(list(x.shape[:-1]) + [qweight.shape[0] * 8])
    x = x.reshape(-1, x.shape[-1])
-    assert x.shape[0] % 256 == 0
    y = torch.zeros((qweight.shape[0] * 8, x.shape[0]), dtype=torch.float32, device=x.device)
    dtype = x.dtype
    x = x.float()