InferenceSpecification
import type { InferenceSpecification } from "https://aws-api.deno.dev/v0.3/services/sagemaker.ts?docs=full";
Defines how to perform inference generation after a training job is run.
interface InferenceSpecification {
Containers: ModelPackageContainerDefinition[];
SupportedContentTypes: string[];
SupportedRealtimeInferenceInstanceTypes?: ProductionVariantInstanceType[] | null;
SupportedResponseMIMETypes: string[];
SupportedTransformInstanceTypes?: TransformInstanceType[] | null;
}
§Properties
§
Containers: ModelPackageContainerDefinition[]
[src] The Amazon ECR registry path of the Docker image that contains the inference code.
§
SupportedRealtimeInferenceInstanceTypes?: ProductionVariantInstanceType[] | null
[src] A list of the instance types that are used to generate inferences in real time.
This parameter is required for unversioned models, and optional for versioned models.
§
SupportedTransformInstanceTypes?: TransformInstanceType[] | null
[src] A list of the instance types on which a transformation job can be run or on which an endpoint can be deployed.
This parameter is required for unversioned models, and optional for versioned models.