Merge pull request #34 from winglian/v2-fixes

fixes for most recent update
2023-03-28 23:49:56 +08:00 · 2023-03-28 23:49:56 +08:00 · b5e3dae573
parent 234004ceb5 b47da33084
commit b5e3dae573
2 changed files with 2 additions and 1 deletions
--- a/matmul_utils_4bit.py
+++ b/matmul_utils_4bit.py
@@ -1,6 +1,6 @@
 import torch
 import numpy as np
-import quant_cuda
+from gptq_llama import quant_cuda


 # Global Buffer
--- a/requirements.txt
+++ b/requirements.txt
@@ -3,6 +3,7 @@ accelerate
 bitsandbytes
 datasets
 sentencepiece
+safetensors
 git+https://github.com/huggingface/transformers.git
 git+https://github.com/sterlind/GPTQ-for-LLaMa.git@lora_4bit
 git+https://github.com/sterlind/peft.git