UNPKG

@instana-integration/wxd-presto

Version:

The Instana integration package is designed to showcase observability features in Instana, specifically for monitoring the Watsonx.data Presto Engine.

976 lines 42.5 kB
{ "id": "bNWcFOSgTq61oODYMXuBDw", "title": "presto-error-health", "accessRules": [ { "accessType": "READ_WRITE", "relationType": "USER", "relatedId": "5ee5195fbea6150001758c40" }, { "accessType": "READ_WRITE", "relationType": "GLOBAL", "relatedId": "" } ], "widgets": [ { "id": "_cTYe6gwllPF70Lj", "title": "Service/Component Affected - Task Executor", "width": 6, "height": 13, "x": 6, "y": 26, "type": "chart", "config": { "shareMaxAxisDomain": false, "y1": { "formatter": "number.compact", "renderer": "line", "metrics": [ { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor split wall time all time max error", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_wall_time_all_time_max_error", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_wall_time_all_time_max_error", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor blocked quanta wall time all time max error", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_blocked_quanta_wall_time_all_time_max_error", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_blocked_quanta_wall_time_all_time_max_error", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor leaf split cpu time max error", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_leaf_split_cpu_time_max_error", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_leaf_split_cpu_time_max_error", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor intermediate split wall time max error", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_intermediate_split_wall_time_max_error", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_intermediate_split_wall_time_max_error", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor unblocked quanta wall time one minute max error", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_unblocked_quanta_wall_time_one_minute_max_error", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_unblocked_quanta_wall_time_one_minute_max_error", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor split queued time one minute max error", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_queued_time_one_minute_max_error", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_queued_time_one_minute_max_error", "crossSeriesAggregation": "MEAN" } ], "formatterSelected": true }, "y2": { "formatter": "number.detailed", "renderer": "line", "metrics": [] }, "type": "TIME_SERIES" } }, { "id": "CtggjV79LbZoxAPr", "title": "Severity Level - Moderate (Warning)", "width": 6, "height": 13, "x": 0, "y": 13, "type": "chart", "config": { "shareMaxAxisDomain": false, "y1": { "formatter": "number.compact", "renderer": "line", "metrics": [ { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "query manager user error failures five minute count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_user_error_failures_five_minute_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_user_error_failures_five_minute_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "hive s3 file system aws retry count fifteen minute rate", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_aws_retry_count_fifteen_minute_rate", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_aws_retry_count_fifteen_minute_rate", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "hive s3 file system get object errors fifteen minute rate", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_object_errors_fifteen_minute_rate", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_object_errors_fifteen_minute_rate", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "hive s3 file system read retries fifteen minute rate", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_read_retries_fifteen_minute_rate", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_read_retries_fifteen_minute_rate", "crossSeriesAggregation": "MEAN" } ], "formatterSelected": true }, "y2": { "formatter": "number.detailed", "renderer": "line", "metrics": [] }, "type": "TIME_SERIES" } }, { "id": "Mkc9FadVgIV1RviR", "title": "Severity Level - Low (Info)", "width": 6, "height": 13, "x": 6, "y": 13, "type": "chart", "config": { "shareMaxAxisDomain": false, "y1": { "formatter": "number.detailed", "renderer": "line", "metrics": [ { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "hive s3 file system get metadata retries five minute count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_metadata_retries_five_minute_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_metadata_retries_five_minute_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor split skipped due to memory pressure total count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_skipped_due_to_memory_pressure_total_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_skipped_due_to_memory_pressure_total_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor processor executor shutdown", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_processor_executor_shutdown", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_processor_executor_shutdown", "crossSeriesAggregation": "MEAN" } ], "formatterSelected": false }, "y2": { "formatter": "number.detailed", "renderer": "line", "metrics": [] }, "type": "TIME_SERIES" } }, { "id": "xZETNuNJ-H9ojBY5", "title": "Query Failure Rate", "width": 6, "height": 13, "x": 0, "y": 39, "type": "chart", "config": { "shareMaxAxisDomain": false, "y1": { "formatter": "number.compact", "renderer": "line", "metrics": [ { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "query manager failed queries five minute count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_failed_queries_five_minute_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_failed_queries_five_minute_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "query manager internal failures five minute count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_internal_failures_five_minute_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_internal_failures_five_minute_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "query manager user error failures five minute count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_user_error_failures_five_minute_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_user_error_failures_five_minute_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor split skipped due to memory pressure five minute count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_skipped_due_to_memory_pressure_five_minute_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_skipped_due_to_memory_pressure_five_minute_count", "crossSeriesAggregation": "MEAN" } ], "formatterSelected": true }, "y2": { "formatter": "number.detailed", "renderer": "line", "metrics": [] }, "type": "TIME_SERIES" } }, { "id": "lcUUc6YEgGSfx2jH", "title": "Service/Component Affected - Hive S3 / FileSystem", "width": 6, "height": 13, "x": 0, "y": 26, "type": "chart", "config": { "shareMaxAxisDomain": false, "y1": { "formatter": "number.compact", "renderer": "line", "metrics": [ { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "hive s3 file system failed uploads total count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_failed_uploads_total_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_failed_uploads_total_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "hive s3 file system aws retry count fifteen minute count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_aws_retry_count_fifteen_minute_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_aws_retry_count_fifteen_minute_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "hive s3 file system get metadata errors total count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_metadata_errors_total_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_get_metadata_errors_total_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "hive s3 file system socket timeout exceptions total count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_socket_timeout_exceptions_total_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_socket_timeout_exceptions_total_count", "crossSeriesAggregation": "MEAN" } ], "formatterSelected": true }, "y2": { "formatter": "number.detailed", "renderer": "line", "metrics": [] }, "type": "TIME_SERIES" } }, { "id": "pvmDEhEUzRZXXPjd", "title": "Severity Level - Severe (Critical)", "width": 12, "height": 13, "x": 0, "y": 0, "type": "chart", "config": { "shareMaxAxisDomain": false, "y1": { "formatter": "number.compact", "renderer": "line", "metrics": [ { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "query manager internal failures five minute count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_internal_failures_five_minute_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_query_manager_internal_failures_five_minute_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor split wall time all time max error", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_wall_time_all_time_max_error", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_split_wall_time_all_time_max_error", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "task executor blocked quanta wall time all time max error", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_blocked_quanta_wall_time_all_time_max_error", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_task_executor_blocked_quanta_wall_time_all_time_max_error", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "hive s3 file system failed uploads total count", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_failed_uploads_total_count", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_hive_s3_presto_s3_file_system_failed_uploads_total_count", "crossSeriesAggregation": "MEAN" }, { "lastValue": false, "color": "", "compareToTimeShifted": false, "threshold": { "critical": "", "warning": "", "thresholdEnabled": false, "operator": ">=" }, "aggregation": "MEAN", "label": "cache stats quota exceeded", "source": "INFRASTRUCTURE_METRICS", "metricPath": [ "Others", "Regex" ], "formatter": "number.detailed", "unit": "number", "regex": true, "metric": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_cache_stats_quota_exceeded", "timeShift": 0, "tagFilterExpression": { "logicalOperator": "AND", "elements": [], "type": "EXPRESSION" }, "allowedCrossSeriesAggregations": [], "metricLabel": "metrics\\.gauges\\.github\\.com/open-telemetry/opentelemetry-collector-contrib/receiver/prometheusreceiver/watsonx_data_presto_cache_stats_quota_exceeded", "crossSeriesAggregation": "MEAN" } ], "formatterSelected": true }, "y2": { "formatter": "number.detailed", "renderer": "line", "metrics": [] }, "type": "TIME_SERIES" } } ], "ownerId": "5ee5195fbea6150001758c40", "writable": true }