From 76d7963dfff218c91f243c55016656fc8a47fab7 Mon Sep 17 00:00:00 2001 From: John Smith Date: Thu, 13 Apr 2023 10:36:57 +0800 Subject: [PATCH] inference: check m.is_v1_model instead of m.groupsize == -1 in half conversion --- inference.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/inference.py b/inference.py index 134ae14..9e290cd 100644 --- a/inference.py +++ b/inference.py @@ -14,7 +14,7 @@ print('Fitting 4bit scales and zeros to half') model.half() for n, m in model.named_modules(): if isinstance(m, Autograd4bitQuantLinear): - if m.groupsize == -1: + if m.is_v1_model: m.zeros = m.zeros.half() m.scales = m.scales.half() m.bias = m.bias.half()