From 6c2ac3b5fb7755a83ef05358c50e3924544a202f Mon Sep 17 00:00:00 2001 From: OlivierDehaene <23298448+OlivierDehaene@users.noreply.github.com> Date: Mon, 11 Dec 2023 13:40:50 +0100 Subject: [PATCH] support h100 --- Dockerfile | 2 +- server/Makefile | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Dockerfile b/Dockerfile index 865e2980..b6c5b2ed 100644 --- a/Dockerfile +++ b/Dockerfile @@ -157,7 +157,7 @@ RUN make build-vllm-cuda # Build megablocks FROM kernel-builder as megablocks-builder -RUN pip install git+https://github.com/OlivierDehaene/megablocks@3de516d9b774ea5dd1b79c68e2c475880f3983e7 +RUN pip install git+https://github.com/OlivierDehaene/megablocks@181709df192de9a941fdf3a641cdc65a0462996e # Text Generation Inference base image FROM nvidia/cuda:12.1.0-base-ubuntu20.04 as base diff --git a/server/Makefile b/server/Makefile index d271e894..b1926828 100644 --- a/server/Makefile +++ b/server/Makefile @@ -17,7 +17,7 @@ gen-server: touch text_generation_server/pb/__init__.py install-megablocks: - pip install git+https://github.com/OlivierDehaene/megablocks@3de516d9b774ea5dd1b79c68e2c475880f3983e7 + pip install git+https://github.com/OlivierDehaene/megablocks@181709df192de9a941fdf3a641cdc65a0462996e install: gen-server pip install pip --upgrade