Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@ type: application
# This is the chart version. This version number should be incremented each time you make changes
# to the chart and its templates, including the app version.
# Versions are expected to follow Semantic Versioning (https://semver.org/)
version: 2.1.0
version: 2.1.1

# This is the version number of the application being deployed. Keep this aligned
# with operator image MAJOR.MINOR version.
Expand Down

Large diffs are not rendered by default.

Original file line number Diff line number Diff line change
Expand Up @@ -262,7 +262,7 @@ spec:
type: string
serverAddress:
description: Server address for AMP workspace
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+\/[a-zA-Z0-9-]+$|^$
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+$|^$
type: string
targetValue:
description: Target metric value for scaling
Expand Down Expand Up @@ -307,7 +307,7 @@ spec:
type: string
serverAddress:
description: Server address for AMP workspace
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+\/[a-zA-Z0-9-]+$|^$
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+$|^$
type: string
targetValue:
description: Target metric value for scaling
Expand Down Expand Up @@ -335,6 +335,211 @@ spec:
minimum: 0
type: integer
type: object
# Spec-side data capture settings. Three tier-specific sub-objects
# (loadBalancer, modelPod, sagemakerEndpoint) plus one shared s3Uri.
# Each tier object requires its own `enabled` flag.
dataCapture:
  description: Configuration for data capture across multiple tiers
    (SageMaker, LoadBalancer, Model Pod)
  properties:
    # Tier 2: only an on/off switch is exposed.
    loadBalancer:
      description: Configuration for LoadBalancer level data capture
        (Tier 2)
      properties:
        enabled:
          description: Enable or disable load balancer access logs
          type: boolean
      required:
      - enabled
      type: object
    # Tier 3: adds buffering and payload-size controls on top of the
    # options shared with the SageMaker endpoint tier.
    modelPod:
      description: Configuration for Model Pod level data capture (Tier
        3)
      properties:
        bufferConfig:
          description: Configuration for buffering and flushing captured
            data
          properties:
            batchSize:
              default: 10
              description: Number of records to batch before writing
                to S3
              format: int32
              maximum: 1000
              minimum: 1
              type: integer
            flushIntervalSeconds:
              default: 60
              description: Flush interval in seconds
              format: int32
              maximum: 300
              minimum: 10
              type: integer
          type: object
        captureContentTypeHeader:
          description: Configuration for how to treat different content
            type headers during capture
          properties:
            csvContentTypes:
              description: |-
                List of content type headers to treat as CSV
                Each item must be 1-256 characters and match pattern: [a-zA-Z0-9](-*[a-zA-Z0-9])*/[a-zA-Z0-9](-*[a-zA-Z0-9.])*
                Example: text/csv, application/csv
              # NOTE(review): the description states a 1-256 character
              # length and a pattern, but this items schema declares only
              # `type: string`. Confirm the limits are enforced elsewhere
              # or add minLength/maxLength/pattern at the source.
              items:
                type: string
              maxItems: 10
              minItems: 1
              type: array
              x-kubernetes-list-type: set
            jsonContentTypes:
              description: |-
                List of content type headers to treat as JSON
                Each item must be 1-256 characters and match pattern: [a-zA-Z0-9](-*[a-zA-Z0-9])*/[a-zA-Z0-9](-*[a-zA-Z0-9.])*
                Example: application/json, application/jsonlines
              # NOTE(review): same gap as csvContentTypes -- per-item
              # length/pattern limits are documented but not declared.
              items:
                type: string
              maxItems: 10
              minItems: 1
              type: array
              x-kubernetes-list-type: set
          type: object
        captureOptions:
          description: Capture options (Input, Output, or both). Defaults
            to [Input, Output] when enabled.
          items:
            description: CaptureOption defines what data to capture
              (input, output, or both).
            properties:
              captureMode:
                description: 'Capture mode: Input or Output'
                enum:
                - Input
                - Output
                type: string
            required:
            - captureMode
            type: object
          maxItems: 32
          minItems: 1
          type: array
        enabled:
          description: Enable or disable model pod data capture
          type: boolean
        initialSamplingPercentage:
          description: Percentage of requests to capture (0-100). Defaults
            to 100 when enabled.
          format: int32
          maximum: 100
          minimum: 0
          type: integer
        kmsKeyId:
          description: Optional KMS key ID, ARN, alias name, or alias
            ARN for encrypting captured data
          maxLength: 2048
          pattern: ^[a-zA-Z0-9:/_-]*$
          type: string
        payloadConfig:
          description: Configuration for payload size limits
          properties:
            maxPayloadSizeKB:
              default: 0
              description: Maximum payload size in KB to capture. 0
                means no limit (capture full payload).
              format: int32
              maximum: 10240
              minimum: 0
              type: integer
          type: object
      required:
      - enabled
      type: object
    # Shared destination for every tier; the pattern requires the
    # s3:// scheme and a non-empty bucket segment.
    s3Uri:
      description: |-
        Common S3 URI for all data capture tiers. Each tier will write to a specific prefix within this bucket.
        Must use s3:// protocol (required by ALB access logs).
        If not provided, the TLS certificate bucket will be used for data capture storage.
      maxLength: 512
      pattern: ^s3://([^/]+)(/[^,=]*)?$
      type: string
    # Tier 1: same capture options as modelPod, without bufferConfig
    # or payloadConfig.
    sagemakerEndpoint:
      description: Configuration for SageMaker Endpoint level data capture
        (Tier 1)
      properties:
        captureContentTypeHeader:
          description: Configuration for how to treat different content
            type headers during capture
          properties:
            csvContentTypes:
              description: |-
                List of content type headers to treat as CSV
                Each item must be 1-256 characters and match pattern: [a-zA-Z0-9](-*[a-zA-Z0-9])*/[a-zA-Z0-9](-*[a-zA-Z0-9.])*
                Example: text/csv, application/csv
              # NOTE(review): per-item length/pattern limits are
              # documented above but not declared on this items schema.
              items:
                type: string
              maxItems: 10
              minItems: 1
              type: array
              x-kubernetes-list-type: set
            jsonContentTypes:
              description: |-
                List of content type headers to treat as JSON
                Each item must be 1-256 characters and match pattern: [a-zA-Z0-9](-*[a-zA-Z0-9])*/[a-zA-Z0-9](-*[a-zA-Z0-9.])*
                Example: application/json, application/jsonlines
              # NOTE(review): per-item length/pattern limits are
              # documented above but not declared on this items schema.
              items:
                type: string
              maxItems: 10
              minItems: 1
              type: array
              x-kubernetes-list-type: set
          type: object
        captureOptions:
          description: Capture options (Input, Output, or both). Defaults
            to [Input, Output] when enabled.
          items:
            description: CaptureOption defines what data to capture
              (input, output, or both).
            properties:
              captureMode:
                description: 'Capture mode: Input or Output'
                enum:
                - Input
                - Output
                type: string
            required:
            - captureMode
            type: object
          maxItems: 32
          minItems: 1
          type: array
        enabled:
          description: Enable or disable SageMaker endpoint data capture
          type: boolean
        initialSamplingPercentage:
          description: Percentage of requests to capture (0-100). Defaults
            to 100 when enabled.
          format: int32
          maximum: 100
          minimum: 0
          type: integer
        kmsKeyId:
          description: Optional KMS key ID, ARN, alias name, or alias
            ARN for encrypting captured data
          maxLength: 2048
          pattern: ^[a-zA-Z0-9:/_-]*$
          type: string
      required:
      - enabled
      type: object
  type: object
# Spec-side Route53 DNS settings. hostedZoneId is the only field and is
# required; its pattern accepts "Z" followed by uppercase letters/digits.
dnsConfig:
  description: DNS automation configuration for Route53. Requires tlsConfig.customCertificateConfig
    to be set.
  properties:
    hostedZoneId:
      description: Route53 Hosted Zone ID where the DNS record will
        be created.
      pattern: ^Z[A-Z0-9]+$
      type: string
  required:
  - hostedZoneId
  type: object
environmentVariables:
description: Additional environment variables to be passed to the
inference server. Limited to 100 key-value pairs.
Expand Down Expand Up @@ -576,7 +781,7 @@ spec:
type: string
serverAddress:
description: Server address for AMP workspace
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+\/[a-zA-Z0-9-]+$|^$
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+$|^$
type: string
targetValue:
description: Target metric value for scaling
Expand Down Expand Up @@ -623,7 +828,7 @@ spec:
type: string
serverAddress:
description: Server address for AMP workspace
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+\/[a-zA-Z0-9-]+$|^$
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+$|^$
type: string
targetValue:
description: Target metric value for scaling
Expand Down Expand Up @@ -937,6 +1142,34 @@ spec:
- type
type: object
type: array
# Status-side health report for data capture. Only the modelPod tier is
# described here; within it, `status` is the single required field.
dataCaptureStatus:
  description: Health status of the data capture pipeline
  properties:
    modelPod:
      description: Health status of the model pod data capture tier
      properties:
        lastTransitionTime:
          description: Time of the last health state transition
          format: date-time
          type: string
        message:
          description: Human-readable message describing the health
            state
          type: string
        reason:
          description: Reason for unhealthy status (e.g., OOMKilled,
            S3UploadFailure, MultipleContainerRestarts)
          type: string
        status:
          description: Current health status
          enum:
          - Healthy
          - Unhealthy
          type: string
      required:
      - status
      type: object
  type: object
deploymentStatus:
description: Details of the native kubernetes deployment that hosts
the model
Expand Down Expand Up @@ -1031,7 +1264,7 @@ spec:
Total number of terminating pods targeted by this deployment. Terminating pods have a non-null
.metadata.deletionTimestamp and have not yet reached the Failed or Succeeded .status.phase.

This is an alpha field. Enable DeploymentReplicaSetTerminatingReplicas to be able to use this field.
This is a beta field and requires enabling DeploymentReplicaSetTerminatingReplicas feature (enabled by default).
format: int32
type: integer
unavailableReplicas:
Expand All @@ -1051,6 +1284,44 @@ spec:
- lastUpdated
- name
type: object
# Status-side view of the Route53 record. managedByOperator is the only
# required field; the previous* fields hold the old zone/record while a
# change is being cleaned up (per their descriptions).
dnsStatus:
  description: Status of the operator-managed Route53 DNS record
  properties:
    dnsHealth:
      description: 'DNS resolution status: Active, Pending, or Error.'
      enum:
      - Active
      - Pending
      - Error
      type: string
    hostedZoneId:
      description: Route53 hosted zone ID.
      type: string
    lastTransitionTime:
      description: When the status last transitioned, used for propagation
        timeout.
      format: date-time
      type: string
    managedByOperator:
      description: Whether the operator manages this DNS record.
      type: boolean
    message:
      description: Human-readable status or error message.
      type: string
    previousHostedZoneId:
      description: Previous hosted zone ID, retained during domain/zone
        changes until cleanup completes.
      type: string
    previousRecordName:
      description: Previous record name, retained during domain/zone
        changes until cleanup completes.
      type: string
    recordName:
      description: Route53 record name.
      type: string
  required:
  - managedByOperator
  type: object
endpoints:
description: EndpointStatus contains the status of SageMaker endpoints
properties:
Expand Down Expand Up @@ -1352,7 +1623,7 @@ spec:
type: string
serverAddress:
description: Server address for AMP workspace
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+\/[a-zA-Z0-9-]+$|^$
pattern: ^https:\/\/aps-workspaces\.[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.amazonaws\.com\/workspaces\/ws-[a-zA-Z0-9-]+$|^$
type: string
targetValue:
description: Target metric value for scaling
Expand Down Expand Up @@ -1701,7 +1972,7 @@ spec:
Total number of terminating pods targeted by this deployment. Terminating pods have a non-null
.metadata.deletionTimestamp and have not yet reached the Failed or Succeeded .status.phase.

This is an alpha field. Enable DeploymentReplicaSetTerminatingReplicas to be able to use this field.
This is a beta field and requires enabling DeploymentReplicaSetTerminatingReplicas feature (enabled by default).
format: int32
type: integer
unavailableReplicas:
Expand Down
Loading
Loading