Skip to content

Instantly share code, notes, and snippets.

@smitjainsj
Created January 21, 2023 12:12
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save smitjainsj/78f7f5e14cf4d98b1ec3451de076b957 to your computer and use it in GitHub Desktop.
Save smitjainsj/78f7f5e14cf4d98b1ec3451de076b957 to your computer and use it in GitHub Desktop.
AWS CloudWatch dashboard for SageMaker inference endpoints
{
"widgets": [
{
"height": 6,
"width": 24,
"y": 0,
"x": 0,
"type": "metric",
"properties": {
"view": "timeSeries",
"stacked": false,
"metrics": [
[ "/aws/sagemaker/Endpoints", "CPUUtilization", "EndpointName", "<endpoint_name>", "VariantName", "<variant_name>" ],
[ "/aws/sagemaker/Endpoints", "MemoryUtilization", "EndpointName", "<endpoint_name>", "VariantName", "<variant_name>" ],
[ "/aws/sagemaker/Endpoints", "DiskUtilization", "EndpointName", "<endpoint_name>", "VariantName", "<variant_name>" ]
],
"region": "ap-southeast-1",
"title": "CPU, Memory, Disk Utilization (%)",
"period": 60,
"stat": "Average",
"yAxis": {
"right": {
"label": ""
},
"left": {
"label": "Utilization (%)",
"showUnits": false
}
}
}
},
{
"height": 6,
"width": 24,
"y": 6,
"x": 0,
"type": "metric",
"properties": {
"view": "timeSeries",
"stacked": false,
"metrics": [
[ { "expression": "m1 / PERIOD(m1)", "label": "Invocations per Second", "id": "e1" } ],
[ "AWS/SageMaker", "Invocations", "EndpointName", "<endpoint_name>", "VariantName", "<variant_name>", { "region": "ap-southeast-1", "id": "m1", "visible": false } ]
],
"region": "ap-southeast-1",
"title": "Invocations per Second",
"period": 60,
"stat": "Sum",
"yAxis": {
"right": {
"label": ""
},
"left": {
"label": "Invocations per Second",
"showUnits": false
}
}
}
},
{
"height": 6,
"width": 24,
"y": 12,
"x": 0,
"type": "metric",
"properties": {
"view": "timeSeries",
"stacked": false,
"metrics": [
[ "AWS/SageMaker", "ModelLatency", "EndpointName", "<endpoint_name>", "VariantName", "<variant_name>" ],
[ "AWS/SageMaker", "OverheadLatency", "EndpointName", "<endpoint_name>", "VariantName", "<variant_name>" ]
],
"region": "ap-southeast-1",
"title": "Model, Overhead Latency (p95)",
"period": 60,
"stat": "p95",
"yAxis": {
"right": {
"label": ""
},
"left": {
"label": "Latency (microseconds)",
"showUnits": false
}
}
}
},
{
"height": 6,
"width": 24,
"y": 18,
"x": 0,
"type": "metric",
"properties": {
"view": "timeSeries",
"stacked": false,
"metrics": [
[ "AWS/SageMaker", "Invocation5XXErrors", "EndpointName", "<endpoint_name>", "VariantName", "<variant_name>" ]
],
"region": "ap-southeast-1",
"title": "Invocation 5XX Errors",
"period": 60,
"stat": "Sum",
"yAxis": {
"right": {
"label": ""
},
"left": {
"label": "Invocation 5XX Errors",
"showUnits": false
}
}
}
}
]
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment