server/Makefile-flash-att-v2: the install-flash-attention-v2-cuda recipe now
upgrades `wheel` together with `packaging` before installing the pinned
flash-attn release ($(flash_att_v2_commit_cuda)).
NOTE(review): presumably flash-attn's build needs `wheel` to be importable in
the target environment -- confirm against the flash-attn setup script.

diff --git a/server/Makefile-flash-att-v2 b/server/Makefile-flash-att-v2
index 5005e007..14c7829f 100644
--- a/server/Makefile-flash-att-v2
+++ b/server/Makefile-flash-att-v2
@@ -2,7 +2,7 @@ flash_att_v2_commit_cuda := v2.5.9.post1
 flash_att_v2_commit_rocm := 2554f490101742ccdc56620a938f847f61754be6
 
 install-flash-attention-v2-cuda:
-	pip install -U packaging
+	pip install -U packaging wheel
 	pip install flash-attn==$(flash_att_v2_commit_cuda)
 
 install-flash-attention-v2-rocm: build-flash-attention-v2-rocm