mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 20:04:52 +00:00
added docker-compose example
This commit is contained in:
parent
16fadcec57
commit
a160ce5623
19
docker-compose.yml
Normal file
19
docker-compose.yml
Normal file
@ -0,0 +1,19 @@
|
|||||||
|
---
# Docker Compose example: runs one text-generation-inference container
# with a single reserved NVIDIA GPU.
services:
  text-generation-inference:
    image: ghcr.io/huggingface/text-generation-inference:1.0.0
    ports:
      # host port 8080 -> container port 80
      - "8080:80"
    volumes:
      # The host user's ~/.cache is mounted at /root/.cache; the hub cache
      # path passed in `command` below lives under this mount.
      - ${HOME}/.cache:/root/.cache
    working_dir: /app
    container_name: text-generation-inference
    # Use the host IPC namespace.
    # NOTE(review): presumably for shared-memory access by the server
    # processes -- confirm against the image's documentation.
    ipc: host
    deploy:
      resources:
        reservations:
          devices:
            # Reserve the GPU with device id "0" through the nvidia driver.
            - driver: "nvidia"
              device_ids: ["0"]
              capabilities: [gpu]
    restart: unless-stopped
    # Arguments passed to the image's entrypoint. The folded scalar joins
    # the lines below with single spaces into one command string.
    command: >-
      --model-id tiiuae/falcon-7b-instruct
      --huggingface-hub-cache /root/.cache/huggingface/hub
|
Loading…
Reference in New Issue
Block a user