mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-26 20:42:06 +00:00
update launcher
This commit is contained in:
parent
3cc2f4e9fa
commit
e81c4cf863
@ -213,5 +213,5 @@ FROM base-copy
|
|||||||
COPY ./tgi-entrypoint.sh /tgi-entrypoint.sh
|
COPY ./tgi-entrypoint.sh /tgi-entrypoint.sh
|
||||||
RUN chmod +x /tgi-entrypoint.sh
|
RUN chmod +x /tgi-entrypoint.sh
|
||||||
|
|
||||||
# ENTRYPOINT ["/tgi-entrypoint.sh"]
|
ENTRYPOINT ["/tgi-entrypoint.sh"]
|
||||||
# CMD ["--json-output"]
|
CMD ["--json-output"]
|
||||||
|
3
Makefile
3
Makefile
@ -53,6 +53,3 @@ run-falcon-7b-instruct-quantize:
|
|||||||
|
|
||||||
clean:
|
clean:
|
||||||
rm -rf target aml
|
rm -rf target aml
|
||||||
|
|
||||||
interact:
|
|
||||||
docker run --rm -it --cap-add=SYS_PTRACE --security-opt seccomp=unconfined --device=/dev/kfd --device=/dev/dri --group-add video --ipc=host --shm-size 64g --net host -v /home/mohit/.cache/huggingface/hub/:/data -v $(PWD):/tgi tgi-mht
|
|
||||||
|
@ -158,10 +158,10 @@ impl std::fmt::Display for KvDtype {
|
|||||||
match self {
|
match self {
|
||||||
KvDtype::Fp8 => {
|
KvDtype::Fp8 => {
|
||||||
write!(f, "fp8")
|
write!(f, "fp8")
|
||||||
},
|
}
|
||||||
KvDtype::Fp8e5m2 => {
|
KvDtype::Fp8e5m2 => {
|
||||||
write!(f, "fp8_e5m2")
|
write!(f, "fp8_e5m2")
|
||||||
},
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user