Use flash attention monkeypatch
This commit is contained in:
parent
8020b3ec3b
commit
3ea18575c7
|
|
@ -16,6 +16,9 @@
|
||||||
}
|
}
|
||||||
]
|
]
|
||||||
"""
|
"""
|
||||||
|
from monkeypatch.llama_flash_attn_monkey_patch import replace_llama_attn_with_flash_attn
|
||||||
|
|
||||||
|
replace_llama_attn_with_flash_attn()
|
||||||
|
|
||||||
import sys
|
import sys
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue