Inference

Table of contents

Inference#

class sagemaker.hyperpod.inference.hp_endpoint_base.HPEndpointBase[source]#

Base class for HyperPod inference endpoints.

This class provides common functionality for managing inference endpoints on SageMaker HyperPod clusters orchestrated by Amazon EKS. It handles Kubernetes API interactions for creating, listing, getting, and deleting inference endpoints.

classmethod call_create_api(metadata: Metadata, kind: str, spec: _HPJumpStartEndpoint | _HPEndpoint, debug: bool = False)[source]#

Create an inference endpoint using Kubernetes API.

Parameters:

Parameter

Type

Description

metadata

Metadata

Kubernetes metadata object containing name, namespace, labels, and annotations

kind

str

Kubernetes resource kind (e.g., ‘HPJumpStartEndpoint’)

spec

Union[_HPJumpStartEndpoint, _HPEndpoint]

Endpoint specification

Raises:

Exception: If endpoint creation fails

Usage Examples
>>> from sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config import _HPJumpStartEndpoint
>>> from sagemaker.hyperpod.common.config.metadata import Metadata
>>> spec = _HPJumpStartEndpoint(...)
>>> metadata = Metadata(name="my-endpoint", namespace="default")
>>> HPEndpointBase.call_create_api(metadata, "HPJumpStartEndpoint", spec)
classmethod call_list_api(kind: str, namespace: str)[source]#

List inference endpoints using Kubernetes API.

Parameters:

Parameter

Type

Description

kind

str

Kubernetes resource kind to list

namespace

str

Kubernetes namespace to list endpoints from

Returns:

dict: List of endpoints in the specified namespace

Raises:

Exception: If listing endpoints fails

Usage Examples
>>> endpoints = HPEndpointBase.call_list_api("HPJumpStartEndpoint", "default")
>>> print(f"Found {len(endpoints['items'])} endpoints")
classmethod call_get_api(name: str, kind: str, namespace: str)[source]#

Get a specific inference endpoint using Kubernetes API.

Parameters:

Parameter

Type

Description

name

str

Name of the endpoint to retrieve

kind

str

Kubernetes resource kind

namespace

str

Kubernetes namespace containing the endpoint

Returns:

dict: Endpoint details

Raises:

Exception: If retrieving endpoint fails

Usage Examples
>>> endpoint = HPEndpointBase.call_get_api("my-endpoint", "HPJumpStartEndpoint", "default")
>>> print(endpoint['metadata']['name'])
call_delete_api(name: str, kind: str, namespace: str)[source]#

Delete an inference endpoint using Kubernetes API.

Parameters:

Parameter

Type

Description

name

str

Name of the endpoint to delete

kind

str

Kubernetes resource kind

namespace

str

Kubernetes namespace containing the endpoint

Raises:

Exception: If deleting endpoint fails

Usage Examples
>>> base = HPEndpointBase()
>>> base.call_delete_api("my-endpoint", "HPJumpStartEndpoint", "default")
classmethod get_operator_logs(since_hours: float)[source]#

Get logs from the inference operator.

Retrieves logs from the HyperPod inference operator pods for debugging and monitoring purposes.

Parameters:

Parameter

Type

Description

since_hours

float

Number of hours back to retrieve logs from

Returns:

str: Operator logs with timestamps

Raises:

Exception: If no operator pods found or log retrieval fails

Usage Examples
>>> logs = HPEndpointBase.get_operator_logs(1.0)
>>> print(logs)
>>>
>>> # Get logs from last 30 minutes
>>> logs = HPEndpointBase.get_operator_logs(0.5)
classmethod get_logs(pod: str, container: str = None, namespace=None)[source]#

Get logs from a specific pod.

Retrieves logs from a pod associated with an inference endpoint.

Parameters:

Parameter

Type

Description

pod

str

Name of the pod to get logs from

container

str, optional

Container name. If not specified, uses the first container in the pod

namespace

str, optional

Kubernetes namespace. If not specified, uses the default namespace

Returns:

str: Pod logs with timestamps

Raises:

Exception: If log retrieval fails

Usage Examples
>>> logs = HPEndpointBase.get_logs("my-pod-name")
>>> print(logs)
>>>
>>> # Get logs from specific container
>>> logs = HPEndpointBase.get_logs("my-pod", container="inference")
>>>
>>> # Get logs from specific namespace
>>> logs = HPEndpointBase.get_logs("my-pod", namespace="my-namespace")
classmethod list_pods(namespace=None)[source]#

List all pods in a namespace.

Parameters:

Parameter

Type

Description

namespace

str, optional

Kubernetes namespace to list pods from. If not specified, uses the default namespace

Returns:

List[str]: List of pod names in the namespace

Usage Examples
>>> pods = HPEndpointBase.list_pods()
>>> print(f"Found {len(pods)} pods: {pods}")
>>>
>>> # List pods in specific namespace
>>> pods = HPEndpointBase.list_pods(namespace="my-namespace")
classmethod list_namespaces()[source]#

List all available Kubernetes namespaces.

Returns:

List[str]: List of namespace names

Usage Examples
>>> namespaces = HPEndpointBase.list_namespaces()
>>> print(f"Available namespaces: {namespaces}")
class sagemaker.hyperpod.inference.hp_endpoint.HPEndpoint[source]#

Bases: _HPEndpoint, HPEndpointBase

classmethod list_pods(namespace=None, endpoint_name=None)[source]#

List all pods in a namespace.

Parameters:

Parameter

Type

Description

namespace

str, optional

Kubernetes namespace to list pods from. If not specified, uses the default namespace

Returns:

List[str]: List of pod names in the namespace

Usage Examples
>>> pods = HPEndpointBase.list_pods()
>>> print(f"Found {len(pods)} pods: {pods}")
>>>
>>> # List pods in specific namespace
>>> pods = HPEndpointBase.list_pods(namespace="my-namespace")
model_config: ClassVar[ConfigDict] = {'extra': 'ignore'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.hp_jumpstart_endpoint.HPJumpStartEndpoint[source]#

Bases: _HPJumpStartEndpoint, HPEndpointBase

validate_mig_profile(mig_profile: str, instance_type: str)[source]#

Validate if the MIG profile is supported for the given instance type.

Parameters:
  • instance_type – SageMaker instance type (e.g., “ml.p4d.24xlarge”)

  • mig_profile – MIG profile (e.g., “1g.10gb”)

Raises:

ValueError – If the instance type doesn’t support MIG profiles or if the MIG profile is not supported for the instance type

classmethod list_pods(namespace=None, endpoint_name=None)[source]#

List all pods in a namespace.

Parameters:

Parameter

Type

Description

namespace

str, optional

Kubernetes namespace to list pods from. If not specified, uses the default namespace

Returns:

List[str]: List of pod names in the namespace

Usage Examples
>>> pods = HPEndpointBase.list_pods()
>>> print(f"Found {len(pods)} pods: {pods}")
>>>
>>> # List pods in specific namespace
>>> pods = HPEndpointBase.list_pods(namespace="my-namespace")
model_config: ClassVar[ConfigDict] = {'extra': 'ignore'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Dimensions[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.CloudWatchTrigger[source]#

Bases: BaseModel

CloudWatch metric trigger to use for autoscaling

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.CloudWatchTriggerList[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.PrometheusTrigger[source]#

Bases: BaseModel

Prometheus metric trigger to use for autoscaling

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.PrometheusTriggerList[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.AutoScalingSpec[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.IntelligentRoutingSpec[source]#

Bases: BaseModel

Configuration for intelligent routing This feature is currently not supported for existing deployments. Adding this configuration to an existing deployment will be rejected.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.L2CacheSpec[source]#

Bases: BaseModel

Configuration for providing L2 Cache offloading

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.KvCacheSpec[source]#

Bases: BaseModel

Configuration for KV Cache specification By default L1CacheOffloading will be enabled

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.LoadBalancer[source]#

Bases: BaseModel

Configuration for Application Load Balancer

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.ModelMetrics[source]#

Bases: BaseModel

Configuration for model container metrics scraping

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Metrics[source]#

Bases: BaseModel

Configuration for metrics collection and exposure

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.FsxStorage[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.S3Storage[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.ModelSourceConfig[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Tags[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.TlsConfig[source]#

Bases: BaseModel

Configurations for TLS

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.ConfigMapKeyRef[source]#

Bases: BaseModel

Selects a key of a ConfigMap.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.FieldRef[source]#

Bases: BaseModel

Selects a field of the pod: supports metadata.name, metadata.namespace, metadata.labels['<KEY>'], metadata.annotations['<KEY>'], spec.nodeName, spec.serviceAccountName, status.hostIP, status.podIP, status.podIPs.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.ResourceFieldRef[source]#

Bases: BaseModel

Selects a resource of the container: only resources limits and requests (limits.cpu, limits.memory, limits.ephemeral-storage, requests.cpu, requests.memory and requests.ephemeral-storage) are currently supported.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.SecretKeyRef[source]#

Bases: BaseModel

Selects a key of a secret in the pod’s namespace

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.ValueFrom[source]#

Bases: BaseModel

Source for the environment variable’s value. Cannot be used if value is not empty.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.EnvironmentVariables[source]#

Bases: BaseModel

EnvVar represents an environment variable present in a Container.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.ModelInvocationPort[source]#

Bases: BaseModel

Defines the port at which the model server will listen to the invocation requests.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.ModelVolumeMount[source]#

Bases: BaseModel

Defines the volume where model will be loaded

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Claims[source]#

Bases: BaseModel

ResourceClaim references one entry in PodSpec.ResourceClaims.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Resources[source]#

Bases: BaseModel

Defines the Resources in terms of CPU, GPU, Memory needed for the model to be deployed

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Worker[source]#

Bases: BaseModel

Details of the worker

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Conditions[source]#

Bases: BaseModel

DeploymentCondition describes the state of a deployment at a certain point.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Status[source]#

Bases: BaseModel

Status of the Deployment Object

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.DeploymentStatus[source]#

Bases: BaseModel

Details of the native kubernetes deployment that hosts the model

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Sagemaker[source]#

Bases: BaseModel

Status of the SageMaker endpoint

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.Endpoints[source]#

Bases: BaseModel

EndpointStatus contains the status of SageMaker endpoints

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.ModelMetricsStatus[source]#

Bases: BaseModel

Status of model container metrics collection

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.MetricsStatus[source]#

Bases: BaseModel

Status of metrics collection

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.TlsCertificate[source]#

Bases: BaseModel

CertificateStatus represents the status of TLS certificates

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_endpoint_config.InferenceEndpointConfigStatus[source]#

Bases: BaseModel

ModelDeploymentStatus defines the observed state of ModelDeployment

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.Dimensions[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.CloudWatchTrigger[source]#

Bases: BaseModel

CloudWatch metric trigger to use for autoscaling

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.PrometheusTrigger[source]#

Bases: BaseModel

Prometheus metric trigger to use for autoscaling

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.AutoScalingSpec[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.EnvironmentVariables[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.Metrics[source]#

Bases: BaseModel

Configuration for metrics collection and exposure

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.AdditionalConfigs[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.Model[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.SageMakerEndpoint[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.Validations[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.Server[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.TlsConfig[source]#

Bases: BaseModel

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.Conditions[source]#

Bases: BaseModel

DeploymentCondition describes the state of a deployment at a certain point.

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.Status[source]#

Bases: BaseModel

Status of the Deployment Object

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.DeploymentStatus[source]#

Bases: BaseModel

Details of the native kubernetes deployment that hosts the model

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.Sagemaker[source]#

Bases: BaseModel

Status of the SageMaker endpoint

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.Endpoints[source]#

Bases: BaseModel

EndpointStatus contains the status of SageMaker endpoints

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.ModelMetrics[source]#

Bases: BaseModel

Status of model container metrics collection

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.MetricsStatus[source]#

Bases: BaseModel

Status of metrics collection

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.TlsCertificate[source]#

Bases: BaseModel

CertificateStatus represents the status of TLS certificates

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].

class sagemaker.hyperpod.inference.config.hp_jumpstart_endpoint_config.JumpStartModelStatus[source]#

Bases: BaseModel

ModelDeploymentStatus defines the observed state of ModelDeployment

model_config: ClassVar[ConfigDict] = {'extra': 'forbid'}#

Configuration for the model, should be a dictionary conforming to [ConfigDict][pydantic.config.ConfigDict].