Fix AWS Sagemaker indentation, typo and header level

2024-10-05 13:26:25 +02:00 · 2024-10-05 13:26:25 +02:00 · 47c01cb048
parent 2358c2bb54
commit 47c01cb048
1 changed files with 16 additions and 16 deletions
--- a/docs/source/reference/api_reference.md
+++ b/docs/source/reference/api_reference.md
@@ -139,11 +139,11 @@ for message in chat_completion:

 TGI can be deployed on various cloud providers for scalable and robust text generation. One such provider is Amazon SageMaker, which has recently added support for TGI. Here's how you can deploy TGI on Amazon SageMaker:

-## Amazon SageMaker
+### Amazon SageMaker

 To enable the Messages API in Amazon SageMaker you need to set the environment variable `MESSAGES_API_ENABLED=true`.

-This will modify the `/invocations` route to accept Messages dictonaries consisting out of role and content. See the example below on how to deploy Llama with the new Messages API.
+This will modify the `/invocations` route to accept Messages dictionaries consisting of `role` and `content`. See the example below on how to deploy Zephyr 7B with the new Messages API.

 ```python
 import json
@@ -152,35 +152,35 @@ import boto3
 from sagemaker.huggingface import HuggingFaceModel, get_huggingface_llm_image_uri

 try:
- role = sagemaker.get_execution_role()
+    role = sagemaker.get_execution_role()
 except ValueError:
- iam = boto3.client('iam')
- role = iam.get_role(RoleName='sagemaker_execution_role')['Role']['Arn']
+    iam = boto3.client('iam')
+    role = iam.get_role(RoleName='sagemaker_execution_role')['Role']['Arn']

 # Hub Model configuration. https://huggingface.co/models
 hub = {
- 'HF_MODEL_ID':'HuggingFaceH4/zephyr-7b-beta',
- 'SM_NUM_GPUS': json.dumps(1),
- 'MESSAGES_API_ENABLED': True
+    'HF_MODEL_ID':'HuggingFaceH4/zephyr-7b-beta',
+    'SM_NUM_GPUS': json.dumps(1),
+    'MESSAGES_API_ENABLED': True
 }

 # create Hugging Face Model Class
 huggingface_model = HuggingFaceModel(
- image_uri=get_huggingface_llm_image_uri("huggingface",version="1.4.0"),
- env=hub,
- role=role,
+    image_uri=get_huggingface_llm_image_uri("huggingface",version="1.4.0"),
+    env=hub,
+    role=role,
 )

 # deploy model to SageMaker Inference
 predictor = huggingface_model.deploy(
- initial_instance_count=1,
- instance_type="ml.g5.2xlarge",
- container_startup_health_check_timeout=300,
-  )
+    initial_instance_count=1,
+    instance_type="ml.g5.2xlarge",
+    container_startup_health_check_timeout=300,
+)

 # send request
 predictor.predict({
-"messages": [
+    "messages": [
        {"role": "system", "content": "You are a helpful assistant." },
        {"role": "user", "content": "What is deep learning?"}
    ]