Skip to content

Commit

Permalink
Update Sagemaker Controller Version (#671)
Browse files Browse the repository at this point in the history
- update sagemaker controller chart to latest version
  • Loading branch information
jsitu777 authored Apr 12, 2023
1 parent 9022bf0 commit 82a55c5
Show file tree
Hide file tree
Showing 23 changed files with 777 additions and 76 deletions.
Original file line number Diff line number Diff line change
@@ -1,8 +1,6 @@
apiVersion: v1
kind: Namespace
metadata:
labels:
control-plane: controller
name: ack-system
---
apiVersion: apps/v1
Expand All @@ -11,16 +9,17 @@ metadata:
name: ack-sagemaker-controller
namespace: ack-system
labels:
control-plane: controller
app.kubernetes.io/name: ack-sagemaker-controller
app.kubernetes.io/part-of: ack-system
spec:
selector:
matchLabels:
control-plane: controller
app.kubernetes.io/name: ack-sagemaker-controller
replicas: 1
template:
metadata:
labels:
control-plane: controller
app.kubernetes.io/name: ack-sagemaker-controller
spec:
containers:
- command:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -6,4 +6,4 @@ kind: Kustomization
images:
- name: controller
newName: public.ecr.aws/aws-controllers-k8s/sagemaker-controller
newTag: v0.4.5
newTag: v1.2.1
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ metadata:
namespace: ack-system
spec:
selector:
control-plane: controller
app.kubernetes.io/name: ack-sagemaker-controller
ports:
- name: metricsport
port: 8080
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -43,8 +43,7 @@ spec:
description: The name of the app.
type: string
appType:
description: The type of app. Supported apps are JupyterServer and
KernelGateway. TensorBoard is not supported.
description: The type of app.
type: string
domainID:
description: The domain ID.
Expand Down Expand Up @@ -91,13 +90,13 @@ spec:
type: object
type: array
userProfileName:
description: The user profile name.
description: The user profile name. If this value is not set, then
SpaceName must be set.
type: string
required:
- appName
- appType
- domainID
- userProfileName
type: object
status:
description: AppStatus defines the observed state of App
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -133,13 +133,14 @@ spec:
see SSD Instance Store Volumes (https://docs.aws.amazon.com/AWSEC2/latest/UserGuide/ssd-instance-store.html)."
type: string
productionVariants:
description: An list of ProductionVariant objects, one for each model
description: An array of ProductionVariant objects, one for each model
that you want to host at this endpoint.
items:
description: Identifies a model that you want to host and the resources
chosen to deploy for hosting it. If you are deploying multiple
models, tell SageMaker how to distribute traffic among the models
by specifying variant weights.
by specifying variant weights. For more information on production
variants, check Production variants (https://docs.aws.amazon.com/sagemaker/latest/dg/model-ab-testing.html).
properties:
acceleratorType:
type: string
Expand All @@ -155,6 +156,8 @@ spec:
kmsKeyID:
type: string
type: object
enableSSMAccess:
type: boolean
initialInstanceCount:
format: int64
type: integer
Expand All @@ -167,6 +170,17 @@ spec:
type: integer
modelName:
type: string
serverlessConfig:
description: Specifies the serverless configuration for an endpoint
variant.
properties:
maxConcurrency:
format: int64
type: integer
memorySizeInMB:
format: int64
type: integer
type: object
variantName:
type: string
volumeSizeInGB:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,73 @@ spec:
description: "EndpointSpec defines the desired state of Endpoint. \n A
hosted endpoint for real-time inference."
properties:
deploymentConfig:
description: The deployment configuration for an endpoint, which contains
the desired deployment strategy and rollback configurations.
properties:
autoRollbackConfiguration:
description: Automatic rollback configuration for handling endpoint
deployment failures and recovery.
properties:
alarms:
items:
description: An Amazon CloudWatch alarm configured to monitor
metrics on an endpoint.
properties:
alarmName:
type: string
type: object
type: array
type: object
blueGreenUpdatePolicy:
description: Update policy for a blue/green deployment. If this
update policy is specified, SageMaker creates a new fleet during
the deployment while maintaining the old fleet. SageMaker flips
traffic to the new fleet according to the specified traffic
routing configuration. Only one update policy should be used
in the deployment configuration. If no update policy is specified,
SageMaker uses a blue/green deployment strategy with all at
once traffic shifting by default.
properties:
maximumExecutionTimeoutInSeconds:
format: int64
type: integer
terminationWaitInSeconds:
format: int64
type: integer
trafficRoutingConfiguration:
description: Defines the traffic routing strategy during an
endpoint deployment to shift traffic from the old fleet
to the new fleet.
properties:
canarySize:
description: Specifies the endpoint capacity to activate
for production.
properties:
type_:
type: string
value:
format: int64
type: integer
type: object
linearStepSize:
description: Specifies the endpoint capacity to activate
for production.
properties:
type_:
type: string
value:
format: int64
type: integer
type: object
type_:
type: string
waitIntervalInSeconds:
format: int64
type: integer
type: object
type: object
type: object
endpointConfigName:
description: The name of an endpoint configuration. For more information,
see CreateEndpointConfig.
Expand Down Expand Up @@ -181,6 +248,100 @@ spec:
description: A timestamp that shows when the endpoint was last modified.
format: date-time
type: string
pendingDeploymentSummary:
description: Returns the summary of an in-progress deployment. This
field is only returned when the endpoint is creating or updating
with a new endpoint configuration.
properties:
endpointConfigName:
type: string
productionVariants:
items:
description: The production variant summary for a deployment
when an endpoint is creating or updating with the CreateEndpoint
or UpdateEndpoint operations. Describes the VariantStatus,
weight and capacity for a production variant associated
with an endpoint.
properties:
acceleratorType:
type: string
currentInstanceCount:
format: int64
type: integer
currentServerlessConfig:
description: Specifies the serverless configuration for
an endpoint variant.
properties:
maxConcurrency:
format: int64
type: integer
memorySizeInMB:
format: int64
type: integer
type: object
currentWeight:
type: number
deployedImages:
items:
description: "Gets the Amazon EC2 Container Registry path
of the docker image of the model that is hosted in this
ProductionVariant. \n If you used the registry/repository[:tag]
form to specify the image path of the primary container
when you created the model hosted in this ProductionVariant,
the path resolves to a path of the form registry/repository[@digest].
A digest is a hash value that identifies a specific
version of an image. For information about Amazon ECR
paths, see Pulling an Image (https://docs.aws.amazon.com/AmazonECR/latest/userguide/docker-pull-ecr-image.html)
in the Amazon ECR User Guide."
properties:
resolutionTime:
format: date-time
type: string
resolvedImage:
type: string
specifiedImage:
type: string
type: object
type: array
desiredInstanceCount:
format: int64
type: integer
desiredServerlessConfig:
description: Specifies the serverless configuration for
an endpoint variant.
properties:
maxConcurrency:
format: int64
type: integer
memorySizeInMB:
format: int64
type: integer
type: object
desiredWeight:
type: number
instanceType:
type: string
variantName:
type: string
variantStatus:
items:
description: Describes the status of the production variant.
properties:
startTime:
format: date-time
type: string
status:
type: string
statusMessage:
type: string
type: object
type: array
type: object
type: array
startTime:
format: date-time
type: string
type: object
productionVariants:
description: An array of ProductionVariantSummary objects, one for
each model hosted behind this endpoint.
Expand All @@ -193,6 +354,17 @@ spec:
currentInstanceCount:
format: int64
type: integer
currentServerlessConfig:
description: Specifies the serverless configuration for an endpoint
variant.
properties:
maxConcurrency:
format: int64
type: integer
memorySizeInMB:
format: int64
type: integer
type: object
currentWeight:
type: number
deployedImages:
Expand Down Expand Up @@ -220,6 +392,17 @@ spec:
desiredInstanceCount:
format: int64
type: integer
desiredServerlessConfig:
description: Specifies the serverless configuration for an endpoint
variant.
properties:
maxConcurrency:
format: int64
type: integer
memorySizeInMB:
format: int64
type: integer
type: object
desiredWeight:
type: number
variantName:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -99,7 +99,9 @@ spec:
we encrypt all data at rest using Amazon Web Services KMS key. By
defining your bucket-level key (https://docs.aws.amazon.com/AmazonS3/latest/userguide/bucket-key.html)
for SSE, you can reduce Amazon Web Services KMS requests costs by
up to 99 percent. \n To learn more about this parameter, see OfflineStoreConfig."
up to 99 percent. \n * Format for the offline store table. Supported
formats are Glue (Default) and Apache Iceberg (https://iceberg.apache.org/).
\n To learn more about this parameter, see OfflineStoreConfig."
properties:
dataCatalogConfig:
description: The meta data of the Glue table which serves as data
Expand Down
Loading

0 comments on commit 82a55c5

Please sign in to comment.