|
11199 | 11199 | "shape":"Boolean", |
11200 | 11200 | "documentation":"<p>Sets whether all model containers deployed to the endpoint are isolated. If they are, no inbound or outbound network calls can be made to or from the model containers.</p>", |
11201 | 11201 | "box":true |
| 11202 | + }, |
| 11203 | + "MetricsConfig":{ |
| 11204 | + "shape":"MetricsConfig", |
| 11205 | + "documentation":"<p>The configuration parameters for utilization metrics.</p>" |
11202 | 11206 | } |
11203 | 11207 | } |
11204 | 11208 | }, |
|
16621 | 16625 | "shape":"Boolean", |
16622 | 16626 | "documentation":"<p>Indicates whether all model containers deployed to the endpoint are isolated. If they are, no inbound or outbound network calls can be made to or from the model containers.</p>", |
16623 | 16627 | "box":true |
| 16628 | + }, |
| 16629 | + "MetricsConfig":{ |
| 16630 | + "shape":"MetricsConfig", |
| 16631 | + "documentation":"<p>The configuration parameters for utilization metrics.</p>" |
16624 | 16632 | } |
16625 | 16633 | } |
16626 | 16634 | }, |
|
16696 | 16704 | "ShadowProductionVariants":{ |
16697 | 16705 | "shape":"ProductionVariantSummaryList", |
16698 | 16706 | "documentation":"<p>An array of <a href=\"https://docs.aws.amazon.com/sagemaker/latest/APIReference/API_ProductionVariantSummary.html\">ProductionVariantSummary</a> objects, one for each model that you want to host at this endpoint in shadow mode with production traffic replicated from the model specified on <code>ProductionVariants</code>.</p>" |
| 16707 | + }, |
| 16708 | + "MetricsConfig":{ |
| 16709 | + "shape":"MetricsConfig", |
| 16710 | + "documentation":"<p>The configuration parameters for utilization metrics.</p>" |
16699 | 16711 | } |
16700 | 16712 | } |
16701 | 16713 | }, |
|
21268 | 21280 | }, |
21269 | 21281 | "EnableCaching":{"type":"boolean"}, |
21270 | 21282 | "EnableCapture":{"type":"boolean"}, |
| 21283 | + "EnableEnhancedMetrics":{ |
| 21284 | + "type":"boolean", |
| 21285 | + "box":true |
| 21286 | + }, |
21271 | 21287 | "EnableInfraCheck":{ |
21272 | 21288 | "type":"boolean", |
21273 | 21289 | "box":true |
|
31201 | 31217 | "min":1, |
31202 | 31218 | "pattern":".+" |
31203 | 31219 | }, |
| 31220 | + "MetricPublishFrequencyInSeconds":{ |
| 31221 | + "type":"integer", |
| 31222 | + "box":true |
| 31223 | + }, |
31204 | 31224 | "MetricRegex":{ |
31205 | 31225 | "type":"string", |
31206 | 31226 | "max":500, |
|
31231 | 31251 | "union":true |
31232 | 31252 | }, |
31233 | 31253 | "MetricValue":{"type":"float"}, |
| 31254 | + "MetricsConfig":{ |
| 31255 | + "type":"structure", |
| 31256 | + "members":{ |
| 31257 | + "EnableEnhancedMetrics":{ |
| 31258 | + "shape":"EnableEnhancedMetrics", |
| 31259 | + "documentation":"<p>Specifies whether to enable enhanced metrics for the endpoint. Enhanced metrics provide utilization data at instance and container granularity. Container granularity is supported for Inference Components. The default is <code>False</code>.</p>" |
| 31260 | + }, |
| 31261 | + "MetricPublishFrequencyInSeconds":{ |
| 31262 | + "shape":"MetricPublishFrequencyInSeconds", |
| 31263 | + "documentation":"<p>The frequency, in seconds, at which utilization metrics are published to Amazon CloudWatch. The default is <code>60</code> seconds.</p>" |
| 31264 | + } |
| 31265 | + }, |
| 31266 | + "documentation":"<p>The configuration for utilization metrics.</p>" |
| 31267 | + }, |
31234 | 31268 | "MetricsSource":{ |
31235 | 31269 | "type":"structure", |
31236 | 31270 | "required":[ |
|
38553 | 38587 | }, |
38554 | 38588 | "ResourceConfig":{ |
38555 | 38589 | "type":"structure", |
38556 | | - "required":["VolumeSizeInGB"], |
38557 | 38590 | "members":{ |
38558 | 38591 | "InstanceType":{ |
38559 | 38592 | "shape":"TrainingInstanceType", |
|
38565 | 38598 | "box":true |
38566 | 38599 | }, |
38567 | 38600 | "VolumeSizeInGB":{ |
38568 | | - "shape":"VolumeSizeInGB", |
| 38601 | + "shape":"OptionalVolumeSizeInGB", |
38569 | 38602 | "documentation":"<p>The size of the ML storage volume that you want to provision. </p> <p>ML storage volumes store model artifacts and incremental states. Training algorithms might also use the ML storage volume for scratch space. If you want to store the training data in the ML storage volume, choose <code>File</code> as the <code>TrainingInputMode</code> in the algorithm specification. </p> <p>When using an ML instance with <a href=\"https://docs.aws.amazon.com/AWSEC2/latest/UserGuide/ssd-instance-store.html#nvme-ssd-volumes\">NVMe SSD volumes</a>, SageMaker doesn't provision Amazon EBS General Purpose SSD (gp2) storage. Available storage is fixed to the NVMe-type instance's storage capacity. SageMaker configures storage paths for training datasets, checkpoints, model artifacts, and outputs to use the entire capacity of the instance storage. For example, ML instance families with the NVMe-type instance storage include <code>ml.p4d</code>, <code>ml.g4dn</code>, and <code>ml.g5</code>. </p> <p>When using an ML instance with the EBS-only storage option and without instance storage, you must define the size of the EBS volume through <code>VolumeSizeInGB</code> in the <code>ResourceConfig</code> API. For example, ML instance families that use EBS volumes include <code>ml.c5</code> and <code>ml.p2</code>. </p> <p>To look up instance types and their instance storage types and volumes, see <a href=\"http://aws.amazon.com/ec2/instance-types/\">Amazon EC2 Instance Types</a>.</p> <p>To find the default local paths defined by the SageMaker training platform, see <a href=\"https://docs.aws.amazon.com/sagemaker/latest/dg/model-train-storage.html\">Amazon SageMaker Training Storage Folders for Training Datasets, Checkpoints, Model Artifacts, and Outputs</a>.</p>", |
38570 | 38603 | "box":true |
38571 | 38604 | }, |
@@ -38837,10 +38870,10 @@ |
38837 | 38870 | }, |
38838 | 38871 | "GroupPatterns":{ |
38839 | 38872 | "shape":"GroupPatternsList", |
38840 | | - "documentation":"<p>A list of AWS IAM Identity Center group patterns that should be assigned to the specified role. Group patterns support wildcard matching using <code>*</code>.</p>" |
| 38873 | + "documentation":"<p>A list of Amazon Web Services IAM Identity Center group patterns that should be assigned to the specified role. Group patterns support wildcard matching using <code>*</code>.</p>" |
38841 | 38874 | } |
38842 | 38875 | }, |
38843 | | - "documentation":"<p>Defines the mapping between an in-app role and the AWS IAM Identity Center group patterns that should be assigned to that role within the SageMaker Partner AI App.</p>" |
| 38876 | + "documentation":"<p>Defines the mapping between an in-app role and the Amazon Web Services IAM Identity Center group patterns that should be assigned to that role within the SageMaker Partner AI App.</p>" |
38844 | 38877 | }, |
38845 | 38878 | "RoleGroupAssignmentsList":{ |
38846 | 38879 | "type":"list", |
|
0 commit comments