mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
Update router/src/infer.rs
This commit is contained in:
parent
13caf958eb
commit
be87c840b8
@@ -76,7 +76,7 @@ impl Infer {
         } else {
             false
         };
-        let block_size = if flashdecoding { 256 } else { 32 };
+        let block_size = if flashdecoding { 256 } else { 16 };
         let block_size = std::env::var("BLOCK_SIZE")
             .map(|b| b.parse().unwrap_or(block_size))
             .unwrap_or(block_size);
Loading…
Reference in New Issue
Block a user