dead code

This commit is contained in:
fxmarty 2024-06-07 12:38:56 +00:00
parent b884d2b9b8
commit fb5487d00c

View File

@@ -50,8 +50,6 @@ __all__ = [
# Error template with one positional placeholder, naming whatever requires a
# Flash Attention enabled model.
FLASH_ATT_ERROR_MESSAGE = "{} requires Flash Attention enabled models."

# Error template with five positional placeholders, in order: the backend,
# the max_input_tokens value, the sliding_window value, the backend again,
# and the bound the launcher argument must stay below.
# NOTE(review): the text reports `max_input_tokens` but recommends the
# `--max-batch-prefill-tokens` argument — confirm that is the intended flag.
SLIDING_WINDOW_MESSAGE = (
    "The backend {} does not support sliding window attention. "
    "TGI webserver was started max_input_tokens={} larger than sliding_window={}. "
    "To use this model with the {} backend, please launch TGI with the argument "
    "`--max-batch-prefill-tokens` smaller than {}."
)

# Starts out True.
# NOTE(review): presumably the `try` block that follows adjusts this flag
# when Flash Attention cannot be loaded — confirm against the full file.
FLASH_ATTENTION = True
try: