From 903fbec604d4871b737a89a309d6e3182b3e1ae7 Mon Sep 17 00:00:00 2001
From: Nicolas Patry
Date: Fri, 9 Feb 2024 11:29:34 +0000
Subject: [PATCH] Fixing AWQ.

---
 server/Makefile-awq | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/server/Makefile-awq b/server/Makefile-awq
index 80e78c08..11517386 100644
--- a/server/Makefile-awq
+++ b/server/Makefile-awq
@@ -1,8 +1,10 @@
-awq_commit := f084f40bd996f3cf3a0633c1ad7d9d476c318aaa
+# Fork that adds only the correct stream to this kernel in order
+# to make cuda graphs work.
+awq_commit := d2d7cfbfa0de87fbbc17a2984c69cd6681149885
 
 awq:
 	rm -rf llm-awq
-	git clone https://github.com/mit-han-lab/llm-awq
+	git clone https://github.com/huggingface/llm-awq
 
 build-awq: awq
 	cd llm-awq/ && git fetch && git checkout $(awq_commit)