@instana-integration/wxd-presto
Version:
The Instana integration package is designed to showcase observability features in Instana, specifically for monitoring the Watsonx.data Presto Engine.
976 lines • 42.5 kB
JSON
{
"id": "bNWcFOSgTq61oODYMXuBDw",
"title": "presto-error-health",
"accessRules": [
{
"accessType": "READ_WRITE",
"relationType": "USER",
"relatedId": "5ee5195fbea6150001758c40"
},
{
"accessType": "READ_WRITE",
"relationType": "GLOBAL",
"relatedId": ""
}
],
"widgets": [
{
"id": "_cTYe6gwllPF70Lj",
"title": "Service/Component Affected - Task Executor",
"width": 6,
"height": 13,
"x": 6,
"y": 26,
"type": "chart",
"config": {
"shareMaxAxisDomain": false,
"y1": {
"formatter": "number.compact",
"renderer": "line",
"metrics": [
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor split wall time all time max error",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_wall_time_all_time_max_error",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_wall_time_all_time_max_error",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor blocked quanta wall time all time max error",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_blocked_quanta_wall_time_all_time_max_error",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_blocked_quanta_wall_time_all_time_max_error",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor leaf split cpu time max error",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_leaf_split_cpu_time_max_error",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_leaf_split_cpu_time_max_error",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor intermediate split wall time max error",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_intermediate_split_wall_time_max_error",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_intermediate_split_wall_time_max_error",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor unblocked quanta wall time one minute max error",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_unblocked_quanta_wall_time_one_minute_max_error",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_unblocked_quanta_wall_time_one_minute_max_error",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor split queued time one minute max error",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_queued_time_one_minute_max_error",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_queued_time_one_minute_max_error",
"crossSeriesAggregation": "MEAN"
}
],
"formatterSelected": true
},
"y2": {
"formatter": "number.detailed",
"renderer": "line",
"metrics": []
},
"type": "TIME_SERIES"
}
},
{
"id": "CtggjV79LbZoxAPr",
"title": "Severity Level - Moderate (Warning)",
"width": 6,
"height": 13,
"x": 0,
"y": 13,
"type": "chart",
"config": {
"shareMaxAxisDomain": false,
"y1": {
"formatter": "number.compact",
"renderer": "line",
"metrics": [
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "query manager user error failures five minute count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_user_error_failures_five_minute_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_user_error_failures_five_minute_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "hive s3 file system aws retry count fifteen minute rate",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_aws_retry_count_fifteen_minute_rate",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_aws_retry_count_fifteen_minute_rate",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "hive s3 file system get object errors fifteen minute rate",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_object_errors_fifteen_minute_rate",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_object_errors_fifteen_minute_rate",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "hive s3 file system read retries fifteen minute rate",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_read_retries_fifteen_minute_rate",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_read_retries_fifteen_minute_rate",
"crossSeriesAggregation": "MEAN"
}
],
"formatterSelected": true
},
"y2": {
"formatter": "number.detailed",
"renderer": "line",
"metrics": []
},
"type": "TIME_SERIES"
}
},
{
"id": "Mkc9FadVgIV1RviR",
"title": "Severity Level - Low (Info)",
"width": 6,
"height": 13,
"x": 6,
"y": 13,
"type": "chart",
"config": {
"shareMaxAxisDomain": false,
"y1": {
"formatter": "number.detailed",
"renderer": "line",
"metrics": [
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "hive s3 file system get metadata retries five minute count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_metadata_retries_five_minute_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_metadata_retries_five_minute_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor split skipped due to memory pressure total count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_skipped_due_to_memory_pressure_total_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_skipped_due_to_memory_pressure_total_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor processor executor shutdown",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_processor_executor_shutdown",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_processor_executor_shutdown",
"crossSeriesAggregation": "MEAN"
}
],
"formatterSelected": false
},
"y2": {
"formatter": "number.detailed",
"renderer": "line",
"metrics": []
},
"type": "TIME_SERIES"
}
},
{
"id": "xZETNuNJ-H9ojBY5",
"title": "Query Failure Rate",
"width": 6,
"height": 13,
"x": 0,
"y": 39,
"type": "chart",
"config": {
"shareMaxAxisDomain": false,
"y1": {
"formatter": "number.compact",
"renderer": "line",
"metrics": [
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "query manager failed queries five minute count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_failed_queries_five_minute_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_failed_queries_five_minute_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "query manager internal failures five minute count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_internal_failures_five_minute_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_internal_failures_five_minute_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "query manager user error failures five minute count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_user_error_failures_five_minute_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_user_error_failures_five_minute_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor split skipped due to memory pressure five minute count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_skipped_due_to_memory_pressure_five_minute_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_skipped_due_to_memory_pressure_five_minute_count",
"crossSeriesAggregation": "MEAN"
}
],
"formatterSelected": true
},
"y2": {
"formatter": "number.detailed",
"renderer": "line",
"metrics": []
},
"type": "TIME_SERIES"
}
},
{
"id": "lcUUc6YEgGSfx2jH",
"title": "Service/Component Affected - Hive S3 / FileSystem",
"width": 6,
"height": 13,
"x": 0,
"y": 26,
"type": "chart",
"config": {
"shareMaxAxisDomain": false,
"y1": {
"formatter": "number.compact",
"renderer": "line",
"metrics": [
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "hive s3 file system failed uploads total count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_failed_uploads_total_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_failed_uploads_total_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "hive s3 file system aws retry count fifteen minute count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_aws_retry_count_fifteen_minute_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_aws_retry_count_fifteen_minute_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "hive s3 file system get metadata errors total count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_metadata_errors_total_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_metadata_errors_total_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "hive s3 file system socket timeout exceptions total count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_socket_timeout_exceptions_total_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_socket_timeout_exceptions_total_count",
"crossSeriesAggregation": "MEAN"
}
],
"formatterSelected": true
},
"y2": {
"formatter": "number.detailed",
"renderer": "line",
"metrics": []
},
"type": "TIME_SERIES"
}
},
{
"id": "pvmDEhEUzRZXXPjd",
"title": "Severity Level - Severe (Critical)",
"width": 12,
"height": 13,
"x": 0,
"y": 0,
"type": "chart",
"config": {
"shareMaxAxisDomain": false,
"y1": {
"formatter": "number.compact",
"renderer": "line",
"metrics": [
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "query manager internal failures five minute count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_internal_failures_five_minute_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_internal_failures_five_minute_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor split wall time all time max error",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_wall_time_all_time_max_error",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_wall_time_all_time_max_error",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "task executor blocked quanta wall time all time max error",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_blocked_quanta_wall_time_all_time_max_error",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_blocked_quanta_wall_time_all_time_max_error",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "hive s3 file system failed uploads total count",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_failed_uploads_total_count",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_failed_uploads_total_count",
"crossSeriesAggregation": "MEAN"
},
{
"lastValue": false,
"color": "",
"compareToTimeShifted": false,
"threshold": {
"critical": "",
"warning": "",
"thresholdEnabled": false,
"operator": ">="
},
"aggregation": "MEAN",
"label": "cache stats quota exceeded",
"source": "INFRASTRUCTURE_METRICS",
"metricPath": [
"Others",
"Regex"
],
"formatter": "number.detailed",
"unit": "number",
"regex": true,
"metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_cache_stats_quota_exceeded",
"timeShift": 0,
"tagFilterExpression": {
"logicalOperator": "AND",
"elements": [],
"type": "EXPRESSION"
},
"allowedCrossSeriesAggregations": [],
"metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_cache_stats_quota_exceeded",
"crossSeriesAggregation": "MEAN"
}
],
"formatterSelected": true
},
"y2": {
"formatter": "number.detailed",
"renderer": "line",
"metrics": []
},
"type": "TIME_SERIES"
}
}
],
"ownerId": "5ee5195fbea6150001758c40",
"writable": true
}