mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-26 12:32:10 +00:00
update launcher
This commit is contained in:
parent
3cc2f4e9fa
commit
e81c4cf863
@ -213,5 +213,5 @@ FROM base-copy
|
||||
COPY ./tgi-entrypoint.sh /tgi-entrypoint.sh
|
||||
RUN chmod +x /tgi-entrypoint.sh
|
||||
|
||||
# ENTRYPOINT ["/tgi-entrypoint.sh"]
|
||||
# CMD ["--json-output"]
|
||||
ENTRYPOINT ["/tgi-entrypoint.sh"]
|
||||
CMD ["--json-output"]
|
||||
|
3
Makefile
3
Makefile
@ -53,6 +53,3 @@ run-falcon-7b-instruct-quantize:
|
||||
|
||||
clean:
|
||||
rm -rf target aml
|
||||
|
||||
interact:
|
||||
docker run --rm -it --cap-add=SYS_PTRACE --security-opt seccomp=unconfined --device=/dev/kfd --device=/dev/dri --group-add video --ipc=host --shm-size 64g --net host -v /home/mohit/.cache/huggingface/hub/:/data -v $(PWD):/tgi tgi-mht
|
||||
|
@ -158,10 +158,10 @@ impl std::fmt::Display for KvDtype {
|
||||
match self {
|
||||
KvDtype::Fp8 => {
|
||||
write!(f, "fp8")
|
||||
},
|
||||
}
|
||||
KvDtype::Fp8e5m2 => {
|
||||
write!(f, "fp8_e5m2")
|
||||
},
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user