Update server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py

Co-authored-by: OlivierDehaene <olivier@huggingface.co>
2025-09-10 20:04:52 +00:00 · 2023-11-08 19:07:45 +09:00 · 2023-11-08 19:07:45 +09:00 · 891fe74099
commit 891fe74099
parent f746b8e0ae
1 changed files with 1 additions and 1 deletions
--- a/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py
+++ b/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py
@@ -27,7 +27,7 @@ from transformers.configuration_utils import PretrainedConfig
 from typing import Optional, List, Tuple

 from text_generation_server.utils import paged_attention, flash_attn
-from text_generation_server.utils.flash_attn import attention, HAS_FLASH_ATTN_V2_ROCM, HAS_FLASH_ATTN_V2_ROCM
+from text_generation_server.utils.flash_attn import attention, HAS_FLASH_ATTN_V2_ROCM, HAS_FLASH_ATTN_V2_CUDA
 from text_generation_server.utils.layers import (
    TensorParallelRowLinear,
    TensorParallelColumnLinear,