Use flash attention monkeypatch

This commit is contained in:
yamashi
2023-04-06 13:49:12 +02:00
committed by GitHub
parent 8020b3ec3b
commit 3ea18575c7
+3
View File
@@ -16,6 +16,9 @@
}
]
"""
# Apply the flash-attention monkeypatch as an import-time side effect.
# NOTE(review): this call is placed ahead of the remaining imports --
# presumably so the patched attention is in place before any model code is
# loaded; confirm before reordering or moving it into a function.
from monkeypatch.llama_flash_attn_monkey_patch import replace_llama_attn_with_flash_attn
replace_llama_attn_with_flash_attn()
import sys