# Patch summary: bump the pinned megablocks commit
# (github.com/OlivierDehaene/megablocks) from
# 3de516d9b774ea5dd1b79c68e2c475880f3983e7 to
# 181709df192de9a941fdf3a641cdc65a0462996e.
#
# The pin is changed in two places, both to the same new commit:
#   * Dockerfile      - the `pip install` in the `megablocks-builder` stage
#   * server/Makefile - the `pip install` in the `install-megablocks` target
#
# The patch itself does not say why the pin moves; consult the megablocks
# commit history for what the new revision changes.
#
# NOTE(review): the line breaks, the blank context lines, and the leading
# tabs on the Makefile recipe lines below were reconstructed from the hunk
# headers (7 lines on each side of both hunks) - verify against the original
# commit before applying.
diff --git a/Dockerfile b/Dockerfile
index 865e2980..b6c5b2ed 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -157,7 +157,7 @@ RUN make build-vllm-cuda
 # Build megablocks
 FROM kernel-builder as megablocks-builder
 
-RUN pip install git+https://github.com/OlivierDehaene/megablocks@3de516d9b774ea5dd1b79c68e2c475880f3983e7
+RUN pip install git+https://github.com/OlivierDehaene/megablocks@181709df192de9a941fdf3a641cdc65a0462996e
 
 # Text Generation Inference base image
 FROM nvidia/cuda:12.1.0-base-ubuntu20.04 as base
diff --git a/server/Makefile b/server/Makefile
index d271e894..b1926828 100644
--- a/server/Makefile
+++ b/server/Makefile
@@ -17,7 +17,7 @@ gen-server:
 	touch text_generation_server/pb/__init__.py
 
 install-megablocks:
-	pip install git+https://github.com/OlivierDehaene/megablocks@3de516d9b774ea5dd1b79c68e2c475880f3983e7
+	pip install git+https://github.com/OlivierDehaene/megablocks@181709df192de9a941fdf3a641cdc65a0462996e
 
 install: gen-server
 	pip install pip --upgrade