Adding warnings for deprecated bitsandbytes + upgrade info to warn.

This commit is contained in:
Nicolas Patry 2024-08-15 11:04:30 +02:00
parent e46df82e4f
commit 18ad84c8fa
No known key found for this signature in database
GPG Key ID: 64AF4752B2967863

View File

@ -1557,6 +1557,9 @@ fn main() -> Result<(), LauncherError> {
))); )));
} }
if matches!(args.quantize, Some(Quantization::Bitsandbytes)) {
tracing::warn!("Bitsandbytes is deprecated, use `eetq` instead, which provides better latencies overall and is drop-in in most cases.");
}
let quantize = args.quantize.or(quantize); let quantize = args.quantize.or(quantize);
let cuda_graphs = match (&args.cuda_graphs, &quantize) { let cuda_graphs = match (&args.cuda_graphs, &quantize) {
(Some(cuda_graphs), _) => cuda_graphs.iter().cloned().filter(|&c| c > 0).collect(), (Some(cuda_graphs), _) => cuda_graphs.iter().cloned().filter(|&c| c > 0).collect(),
@ -1569,11 +1572,11 @@ fn main() -> Result<(), LauncherError> {
| Quantization::BitsandbytesFp4, | Quantization::BitsandbytesFp4,
), ),
) => { ) => {
tracing::info!("Bitsandbytes doesn't work with cuda graphs, deactivating them"); tracing::warn!("Bitsandbytes doesn't work with cuda graphs, deactivating them");
vec![] vec![]
} }
(None, Some(Quantization::Exl2)) => { (None, Some(Quantization::Exl2)) => {
tracing::info!("Exl2 doesn't work with cuda graphs, deactivating them"); tracing::warn!("Exl2 doesn't work with cuda graphs, deactivating them");
vec![] vec![]
} }
_ => { _ => {