Mirror of https://github.com/huggingface/text-generation-inference.git (last synced 2025-04-24 16:32:12 +00:00).
Forgot last default place.
This commit is contained in:
Parent: 3d46783f1a
Commit: cdbf73eef8
@@ -47,7 +47,7 @@ impl BackendV3 {
 } else if prefix_caching {
     Attention::FlashInfer
 } else {
-    Attention::Paged
+    Attention::FlashDecoding
 };
 let block_size = if attention == Attention::FlashDecoding {
     256
Loading…
Reference in New Issue
Block a user