mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
Put back flash-v2 build step.
This commit is contained in:
parent
76fef7b1d2
commit
7c4927482b
@@ -1,6 +1,10 @@
|
||||
# Pinned flash-attn version for the CUDA targets; the recipes below pass it
# to pip as `flash-attn==<value>`.
flash_att_v2_commit_cuda := v2.5.9.post1
|
||||
# Pinned revision hash for the ROCm variant.
# NOTE(review): nothing in the visible part of this file references this
# variable - presumably ROCm targets elsewhere in the file consume it; confirm.
flash_att_v2_commit_rocm := 2554f490101742ccdc56620a938f847f61754be6
|
||||
|
||||
# Install the pinned flash-attn release (see flash_att_v2_commit_cuda) with pip.
#
# `packaging` and `wheel` are upgraded first; presumably flash-attn's
# installation needs them to be present - TODO confirm.
#
# The target names a command rather than a file it produces, so it is declared
# phony: a stray file called `build-flash-attention-v2-cuda` must not make the
# target look up to date and silently skip the install.
.PHONY: build-flash-attention-v2-cuda
build-flash-attention-v2-cuda:
	pip install -U packaging wheel
	pip install flash-attn==$(flash_att_v2_commit_cuda)
|
||||
|
||||
# Install flash-attn v2 for CUDA.
#
# The install steps are exactly those of build-flash-attention-v2-cuda, so this
# target simply depends on it instead of repeating the pip commands; the pinned
# install command then lives in one place only.
#
# Declared phony because it names a command, not a file produced by the build.
.PHONY: install-flash-attention-v2-cuda
install-flash-attention-v2-cuda: build-flash-attention-v2-cuda
|
||||
|
Loading…
Reference in New Issue
Block a user