mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
Update router/src/infer.rs
This commit is contained in:
parent
13caf958eb
commit
be87c840b8
@ -76,7 +76,7 @@ impl Infer {
|
|||||||
} else {
|
} else {
|
||||||
false
|
false
|
||||||
};
|
};
|
||||||
let block_size = if flashdecoding { 256 } else { 32 };
|
let block_size = if flashdecoding { 256 } else { 16 };
|
||||||
let block_size = std::env::var("BLOCK_SIZE")
|
let block_size = std::env::var("BLOCK_SIZE")
|
||||||
.map(|b| b.parse().unwrap_or(block_size))
|
.map(|b| b.parse().unwrap_or(block_size))
|
||||||
.unwrap_or(block_size);
|
.unwrap_or(block_size);
|
||||||
|
Loading…
Reference in New Issue
Block a user