mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-06-19 15:52:08 +00:00
Fix args
Signed-off-by: Adrien Gallouët <angt@huggingface.co>
This commit is contained in:
parent
7a3ed4171e
commit
3f199134f0
@ -37,7 +37,7 @@ struct Args {
|
|||||||
n_gpu_layers: usize,
|
n_gpu_layers: usize,
|
||||||
|
|
||||||
/// Split the model across multiple GPUs.
|
/// Split the model across multiple GPUs.
|
||||||
#[clap(default_value = "Layer", long, env)]
|
#[clap(default_value = "layer", long, env)]
|
||||||
split_mode: LlamacppSplitMode,
|
split_mode: LlamacppSplitMode,
|
||||||
|
|
||||||
/// Defragment the KV cache if holes/size > threshold.
|
/// Defragment the KV cache if holes/size > threshold.
|
||||||
@ -45,7 +45,7 @@ struct Args {
|
|||||||
defrag_threshold: f32,
|
defrag_threshold: f32,
|
||||||
|
|
||||||
/// Setup NUMA optimizations.
|
/// Setup NUMA optimizations.
|
||||||
#[clap(default_value = "Disabled", value_enum, long, env)]
|
#[clap(default_value = "disabled", value_enum, long, env)]
|
||||||
numa: LlamacppNuma,
|
numa: LlamacppNuma,
|
||||||
|
|
||||||
/// Whether to use memory mapping.
|
/// Whether to use memory mapping.
|
||||||
|
Loading…
Reference in New Issue
Block a user