diff --git a/launcher/src/main.rs b/launcher/src/main.rs index bb1d881f..430b9620 100644 --- a/launcher/src/main.rs +++ b/launcher/src/main.rs @@ -1558,7 +1558,6 @@ fn main() -> Result<(), LauncherError> { } let quantize = args.quantize.or(quantize); - tracing::info!("Quantize found {quantize:?}"); let cuda_graphs = match (&args.cuda_graphs, &quantize) { (Some(cuda_graphs), _) => cuda_graphs.iter().cloned().filter(|&c| c > 0).collect(), #[allow(deprecated)] diff --git a/server/Makefile-exllamav2 b/server/Makefile-exllamav2 index 38abeffe..0d4cc385 100644 --- a/server/Makefile-exllamav2 +++ b/server/Makefile-exllamav2 @@ -1,7 +1,7 @@ -exllamav2_commit := 872386c89eaebe0bde5b245a890f1da9522768b3 +exllamav2_commit := v0.1.8 build-exllamav2: - git clone https://github.com/Narsil/exllamav2.git exllamav2 && \ + git clone https://github.com/turboderp/exllamav2.git exllamav2 && \ cd exllamav2 && git fetch && git checkout $(exllamav2_commit) && \ git submodule update --init --recursive && \ pip install -r requirements.txt && \