mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
fix: adjust typos and docker build
This commit is contained in:
parent
5b30a425f6
commit
deed8e8154
10
Dockerfile
10
Dockerfile
@ -154,17 +154,17 @@ COPY server/Makefile-vllm Makefile
|
|||||||
# Build specific version of vllm
|
# Build specific version of vllm
|
||||||
RUN make build-vllm-cuda
|
RUN make build-vllm-cuda
|
||||||
|
|
||||||
# Build megablocks
|
|
||||||
FROM kernel-builder as megablocks-builder
|
|
||||||
|
|
||||||
RUN pip install git+https://github.com/OlivierDehaene/megablocks@181709df192de9a941fdf3a641cdc65a0462996e
|
|
||||||
|
|
||||||
# Build mamba kernels
|
# Build mamba kernels
|
||||||
FROM kernel-builder as mamba-builder
|
FROM kernel-builder as mamba-builder
|
||||||
WORKDIR /usr/src
|
WORKDIR /usr/src
|
||||||
COPY server/Makefile-selective-scan Makefile
|
COPY server/Makefile-selective-scan Makefile
|
||||||
RUN make build-all
|
RUN make build-all
|
||||||
|
|
||||||
|
# Build megablocks
|
||||||
|
FROM kernel-builder as megablocks-builder
|
||||||
|
|
||||||
|
RUN pip install git+https://github.com/OlivierDehaene/megablocks@181709df192de9a941fdf3a641cdc65a0462996e
|
||||||
|
|
||||||
# Text Generation Inference base image
|
# Text Generation Inference base image
|
||||||
FROM nvidia/cuda:12.1.0-base-ubuntu20.04 as base
|
FROM nvidia/cuda:12.1.0-base-ubuntu20.04 as base
|
||||||
|
|
||||||
|
@ -137,7 +137,7 @@ class MambaBlock(nn.Module):
|
|||||||
z = _z[i:i+1, -1, :]
|
z = _z[i:i+1, -1, :]
|
||||||
x_db = self.x_proj(x)
|
x_db = self.x_proj(x)
|
||||||
dt, B, C = torch.split(x_db, [self.dt_rank, self.d_state, self.d_state], dim=-1)
|
dt, B, C = torch.split(x_db, [self.dt_rank, self.d_state, self.d_state], dim=-1)
|
||||||
df = self.dt_proj_no_bias(x)
|
dt = F.linear(dt, self.dt_proj.weight)
|
||||||
y = selective_state_update(
|
y = selective_state_update(
|
||||||
ssm_state[i:i+1,:,:], x, dt, self.negA, B, C, self.D, z=z, dt_bias=self.dt_proj.bias, dt_softplus=True
|
ssm_state[i:i+1,:,:], x, dt, self.negA, B, C, self.D, z=z, dt_bias=self.dt_proj.bias, dt_softplus=True
|
||||||
)
|
)
|
||||||
|
Loading…
Reference in New Issue
Block a user