From abde90c493bc8ae837ced36e1ee289d3df2f2ae7 Mon Sep 17 00:00:00 2001
From: Merve Noyan
Date: Tue, 22 Aug 2023 23:44:13 +0300
Subject: [PATCH] Update docs/source/basic_tutorials/non_core_models.md

Co-authored-by: Omar Sanseviero
---
 docs/source/basic_tutorials/non_core_models.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/source/basic_tutorials/non_core_models.md b/docs/source/basic_tutorials/non_core_models.md
index f6a8dc8e..9ae5e443 100644
--- a/docs/source/basic_tutorials/non_core_models.md
+++ b/docs/source/basic_tutorials/non_core_models.md
@@ -12,7 +12,7 @@ AutoModelForCausalLM.from_pretrained(<model>, device_map="auto")``
 AutoModelForSeq2SeqLM.from_pretrained(<model>, device_map="auto")
 ```
 
-This means, you will be unable to use some of the features introduced by TGI, such as tensor-parallel sharding or flash attention. However, you can still get many benefits of TGI, such as continuous batching, or streaming outputs.
+This means you will be unable to use some of the features introduced by TGI, such as tensor-parallel sharding or flash attention. However, you can still get many benefits of TGI, such as continuous batching or streaming outputs.
 
 You can serve these models using docker like below 👇
 