Solicitação e resposta Código de exemplo

Texto de incorporações do Amazon Titan

O Titan Embeddings G1 - Text não suporta o uso de parâmetros de inferência. As seções a seguir detalham os formatos de solicitação e resposta e fornecem um exemplo de código.

Tópicos

Solicitação e resposta
Código de exemplo

Solicitação e resposta

O corpo da solicitação é passado no campo body de uma solicitação InvokeModel.

V2 Request

O parâmetro inputText é obrigatório. Os parâmetros normalize e dimensions são opcionais.

inputText — O texto a ser convertido em incorporações.
normalize — Sinalizador que indica se as incorporações de saída devem ou não ser normalizadas. O valor padrão é true.
dimensions — O número de dimensões que as incorporações de saída devem ter. Os seguintes valores são aceitos: 1024 (padrão), 512, 256.


{
                        "inputText": string,
                        "dimensions": int,
                        "normalize": boolean
}

V2 Response

Os campos são descritos abaixo.

embedding — Uma matriz que representa o vetor de incorporação da entrada que você forneceu.
inputTextTokenCount — O número de tokens na entrada.


{
    "embedding": [float, float, ...],
    "inputTextTokenCount": int
}

G1 Request

O único campo disponível é inputText, no qual você pode incluir texto para converter em incorporações.


{
    "inputText": string
}

G1 Response

O body da resposta contém os seguintes campos.


{
    "embedding": [float, float, ...],
    "inputTextTokenCount": int
}

Os campos são descritos abaixo.

embedding — Uma matriz que representa o vetor de incorporação da entrada que você forneceu.
inputTextTokenCount — O número de tokens na entrada.

Código de exemplo

Os exemplos a seguir mostram como chamar o modelo Amazon Titan Embeddings para gerar incorporações. Selecione a guia que corresponde ao modelo que você está usando:

Amazon Titan Embeddings G1 - Text


# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
# SPDX-License-Identifier: Apache-2.0
"""
Shows how to generate embeddings with the Amazon Titan Embeddings G1 - Text model (on demand).
"""

import json
import logging
import boto3


from botocore.exceptions import ClientError


# Module-level logger named after this module; root logging is set to INFO on import.
logger = logging.getLogger(__name__)
logging.basicConfig(level=logging.INFO)


def generate_embeddings(model_id, body):
    """
    Invoke Amazon Titan Embeddings G1 - Text on demand and return the parsed reply.

    Args:
        model_id (str): The model ID to use.
        body (str): The request body to send to the model.
    Returns:
        The JSON-decoded response body (the embedding created by the model
        and the number of input tokens).
    """
    logger.info("Generating embeddings with Amazon Titan Embeddings G1 - Text model %s", model_id)

    client = boto3.client(service_name='bedrock-runtime')

    # Both the request payload and the expected reply are JSON.
    json_mime = "application/json"
    result = client.invoke_model(
        body=body,
        modelId=model_id,
        accept=json_mime,
        contentType=json_mime,
    )

    # The 'body' entry is read in full and then decoded as JSON.
    raw_payload = result.get('body').read()
    return json.loads(raw_payload)


def main():
    """
    Entrypoint for Amazon Titan Embeddings G1 - Text example.

    Builds a JSON request body for a sample sentence, calls
    generate_embeddings, and prints the returned embedding and input token
    count. A botocore ClientError is logged and reported on stdout instead
    of being propagated.
    """

    # NOTE: logging.basicConfig does nothing when the root logger already has
    # handlers, so this format only applies if logging was not configured earlier.
    logging.basicConfig(level=logging.INFO,
                        format="%(levelname)s: %(message)s")

    model_id = "amazon.titan-embed-text-v1"
    input_text = "What are the different services that you offer?"

    # Create request body. G1 accepts only the inputText field.
    body = json.dumps({
        "inputText": input_text,
    })

    try:
        response = generate_embeddings(model_id, body)

        print(f"Generated embeddings: {response['embedding']}")
        print(f"Input Token count:  {response['inputTextTokenCount']}")

    except ClientError as err:
        # Surface the service-provided error message in the log and on stdout.
        message = err.response["Error"]["Message"]
        logger.error("A client error occurred: %s", message)
        print(f"A client error occurred: {message}")

    else:
        print(f"Finished generating embeddings with Amazon Titan Embeddings G1 - Text model {model_id}.")


# Run the example only when this file is executed as a script.
if __name__ == "__main__":
    main()

Amazon Titan Text Embeddings V2


# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
# SPDX-License-Identifier: Apache-2.0
"""
Shows how to generate embeddings with the Amazon Titan Text Embeddings V2 Model
"""

import json
import logging
import boto3


from botocore.exceptions import ClientError


# Module-level logger named after this module; root logging is set to INFO on import.
logger = logging.getLogger(__name__)
logging.basicConfig(level=logging.INFO)


def generate_embeddings(model_id, body):
    """
    Generate a vector of embeddings for a text input using Amazon Titan Text Embeddings V2 on demand.
    Args:
        model_id (str): The model ID to use.
        body (str) : The request body to use.
    Returns:
        response (JSON): The embedding created by the model and the number of input tokens.
    """

    logger.info("Generating embeddings with Amazon Titan Text Embeddings V2 model %s", model_id)

    bedrock = boto3.client(service_name='bedrock-runtime')

    # Both the request payload and the expected reply are JSON.
    accept = "application/json"
    content_type = "application/json"

    response = bedrock.invoke_model(
        body=body, modelId=model_id, accept=accept, contentType=content_type
    )

    # The 'body' entry is read in full and then decoded as JSON.
    response_body = json.loads(response.get('body').read())

    return response_body


def main():
    """
    Entrypoint for Amazon Titan Embeddings V2 - Text example.

    Builds a JSON request body for a sample sentence (512 dimensions,
    normalized output), calls generate_embeddings, and prints the returned
    embedding and input token count. A botocore ClientError is logged and
    reported on stdout instead of being propagated.
    """

    # NOTE: logging.basicConfig does nothing when the root logger already has
    # handlers, so this format only applies if logging was not configured earlier.
    logging.basicConfig(level=logging.INFO,
                        format="%(levelname)s: %(message)s")

    model_id = "amazon.titan-embed-text-v2:0"
    input_text = "What are the different services that you offer?"

    # Create request body.
    body = json.dumps({
        "inputText": input_text,
        "dimensions": 512,
        "normalize": True
    })

    try:
        response = generate_embeddings(model_id, body)

        print(f"Generated embeddings: {response['embedding']}")
        print(f"Input Token count:  {response['inputTextTokenCount']}")

    except ClientError as err:
        # Surface the service-provided error message in the log and on stdout.
        message = err.response["Error"]["Message"]
        logger.error("A client error occurred: %s", message)
        print(f"A client error occurred: {message}")

    else:
        print(f"Finished generating embeddings with Amazon Titan Text Embeddings V2 model {model_id}.")


# Run the example only when this file is executed as a script.
if __name__ == "__main__":
    main()

Configure your accuracy-cost tradeoff as you go

While normalization is available via the API, customers can also reduce the embedding dimension after generating the embeddings, allowing them to trade off between accuracy and cost as their needs evolve. This empowers customers to generate 1024-dimension index embeddings, store them in low-cost storage options such as S3, and load the 1024, 512, or 256 dimension version into their favorite vector DB as they go.

To reduce a given embedding from 1024 to 256 dimensions, you can use the following example logic:

import numpy as np
from numpy import linalg

def normalize_embedding(embedding: np.ndarray) -> np.ndarray:
   '''
   Scale an embedding, or each embedding in a batch, to unit L2 norm.

   Args:
       embedding: Unnormalized 1D/2D numpy array
              - 1D: (emb_dim)
              - 2D: (batch_size, emb_dim)
   Return:
       np.ndarray: Normalized array with the same shape as the input
   '''
   # Norm over the last axis; keepdims=True keeps that axis so the division
   # broadcasts per embedding for both 1D and 2D input.
   return embedding / linalg.norm(embedding, axis=-1, keepdims=True)
   
def reduce_emb_dim(embedding: np.ndarray, target_dim: int, normalize: bool = True) -> np.ndarray:
   '''
   Truncate an embedding to its first target_dim components.

   Args:
       embedding: Unnormalized 1D/2D numpy array. Expected shape:
          - 1D: (emb_dim)
          - 2D: (batch_size, emb_dim)
       target_dim: target dimension to reduce the embedding to
       normalize: when True, pass the truncated embedding through
          normalize_embedding before returning it
   Return:
       np.ndarray: Truncated array of the same rank as the input, with the
       last axis cut to target_dim; normalized only when normalize is True
   '''
   # The ellipsis keeps any leading (batch) axes and slices only the last one.
   smaller_embedding = embedding[..., :target_dim]
   if normalize:
      smaller_embedding = normalize_embedding(smaller_embedding)
   return smaller_embedding
   
   
if __name__ == '__main__':
   # Placeholders: replace each `...` with the embedding list returned by the
   # corresponding Bedrock client call before running this script.
   embedding = ...  # bedrock client call
   reduced_embedding = ...  # bedrock client call with dim=256
   # Truncate the full-size embedding locally (normalized by default).
   post_reduction_embeddings = reduce_emb_dim(np.array(embedding), target_dim=256)
   # Norm of the difference between the service-reduced and locally reduced embeddings.
   print(linalg.norm(np.array(reduced_embedding) - post_reduction_embeddings))

Atenção O Javascript está desativado ou não está disponível no seu navegador.

Para usar a documentação da AWS, o Javascript deve estar ativado. Consulte as páginas de Ajuda do navegador para obter instruções.

Convenções do documento

Amazon Titan Image Generator G1

Amazon Titan Multimodal Embeddings G1