-
Notifications
You must be signed in to change notification settings - Fork 17
/
awsstepfunctionstasks_ProductionVariant.go
54 lines (51 loc) · 2.05 KB
/
awsstepfunctionstasks_ProductionVariant.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
package awsstepfunctionstasks
import (
"github.com/aws/aws-cdk-go/awscdk/awsec2"
)
// ProductionVariant identifies a model that you want to host and the resources to deploy for hosting it.
//
// InstanceType, ModelName and VariantName are tagged as required;
// AcceleratorType, InitialInstanceCount and InitialVariantWeight are tagged as optional.
//
// Example:
//     // The code below shows an example of how to instantiate this type.
//     // The values are placeholders you should change.
//     import "github.com/aws/aws-cdk-go/awscdk/awsec2"
//
//     // AcceleratorType is referenced unqualified by this struct, so it is
//     // declared elsewhere in this package rather than in this file.
//     var acceleratorType AcceleratorType
//     var instanceType awsec2.InstanceType
//
//     productionVariant := &ProductionVariant{
//         InstanceType: instanceType,
//         ModelName:    jsii.String("modelName"),
//         VariantName:  jsii.String("variantName"),
//
//         // the properties below are optional
//         AcceleratorType:      acceleratorType,
//         InitialInstanceCount: jsii.Number(123),
//         InitialVariantWeight: jsii.Number(123),
//     }
//
// See: https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_ProductionVariant.html
//
// Experimental.
type ProductionVariant struct {
// The ML compute instance type.
//
// Required (per the field tag).
// Experimental.
InstanceType awsec2.InstanceType `field:"required" json:"instanceType" yaml:"instanceType"`
// The name of the model that you want to host.
//
// This is the name that you specified when creating the model.
// Required (per the field tag).
// Experimental.
ModelName *string `field:"required" json:"modelName" yaml:"modelName"`
// The name of the production variant.
//
// Required (per the field tag).
// Experimental.
VariantName *string `field:"required" json:"variantName" yaml:"variantName"`
// The size of the Elastic Inference (EI) instance to use for the production variant.
//
// Optional (per the field tag).
// Experimental.
AcceleratorType AcceleratorType `field:"optional" json:"acceleratorType" yaml:"acceleratorType"`
// Number of instances to launch initially.
//
// Optional (per the field tag).
// NOTE(review): presumably a nil pointer means "not set"; the value applied in that case is not visible here — confirm.
// Experimental.
InitialInstanceCount *float64 `field:"optional" json:"initialInstanceCount" yaml:"initialInstanceCount"`
// Determines initial traffic distribution among all of the models that you specify in the endpoint configuration.
//
// Optional (per the field tag).
// NOTE(review): presumably a nil pointer means "not set"; the value applied in that case is not visible here — confirm.
// Experimental.
InitialVariantWeight *float64 `field:"optional" json:"initialVariantWeight" yaml:"initialVariantWeight"`
}