fix: improve messages api docs content and formatting

This commit is contained in:
drbh 2024-01-29 14:18:19 +00:00
parent a9ea60684b
commit 970f7142b5

View File

@ -1,8 +1,8 @@
# Messages API
Text Generation Inference (TGI) now supports the Messages API, which is fully compatible with the OpenAI Chat Completion API. This feature is available starting from version 1.4.0. You can use OpenAI's client libraries or third-party libraries expecting OpenAI schema to interact with TGI's Messages API. Below are some examples of how to utilize this compatibility.

> **Note:** The Messages API is supported from TGI version 1.4.0 and above. Ensure you are using a compatible version to access this feature.
## Making a Request
@ -98,30 +98,30 @@ import boto3
from sagemaker.huggingface import HuggingFaceModel, get_huggingface_llm_image_uri

try:
    role = sagemaker.get_execution_role()
except ValueError:
    iam = boto3.client('iam')
    role = iam.get_role(RoleName='sagemaker_execution_role')['Role']['Arn']

# Hub Model configuration. https://huggingface.co/models
hub = {
    'HF_MODEL_ID':'HuggingFaceH4/zephyr-7b-beta',
    'SM_NUM_GPUS': json.dumps(1),
    'MESSAGES_API_ENABLED': True
}

# create Hugging Face Model Class
huggingface_model = HuggingFaceModel(
    image_uri=get_huggingface_llm_image_uri("huggingface",version="1.4.0"),
    env=hub,
    role=role,
)

# deploy model to SageMaker Inference
predictor = huggingface_model.deploy(
    initial_instance_count=1,
    instance_type="ml.g5.2xlarge",
    container_startup_health_check_timeout=300,
)

# send request