Use flash attention monkeypatch
This commit is contained in:
parent
8020b3ec3b
commit
3ea18575c7
|
|
@@ -16,6 +16,9 @@
|
|||
}
|
||||
]
|
||||
"""
|
||||
from monkeypatch.llama_flash_attn_monkey_patch import replace_llama_attn_with_flash_attn
|
||||
|
||||
replace_llama_attn_with_flash_attn()
|
||||
|
||||
import sys
|
||||
|
||||
|
|
|
|||
Loading…
Reference in New Issue