This is an automated email from the ASF dual-hosted git repository. innerpeacez pushed a commit to branch master in repository https://gitbox.apache.org/repos/asf/skywalking.git
The following commit(s) were added to refs/heads/master by this push: new f8567f7907 Filter out unknown_cluster metric data in `elasticsearch-monitoring` (#10801) f8567f7907 is described below commit f8567f7907f91aec72630b1cd73f0088c9c9a917 Author: innerpeacez <innerpeace.z...@gmail.com> AuthorDate: Mon May 15 11:32:05 2023 +0800 Filter out unknown_cluster metric data in `elasticsearch-monitoring` (#10801) * filter unknown_cluster * add changes --- docs/en/changes/changes.md | 1 + .../elasticsearch/elasticsearch-cluster.yaml | 28 +++---- .../elasticsearch/elasticsearch-index.yaml | 86 +++++++++---------- .../elasticsearch/elasticsearch-node.yaml | 98 +++++++++++----------- 4 files changed, 107 insertions(+), 106 deletions(-) diff --git a/docs/en/changes/changes.md b/docs/en/changes/changes.md index 054997624f..f533cac61b 100644 --- a/docs/en/changes/changes.md +++ b/docs/en/changes/changes.md @@ -43,6 +43,7 @@ * Support `exportErrorStatusTraceOnly` for export the error status trace segments through the Kafka channel * Add component ID for Grizzly. * Fix potential NPE in Zipkin receiver when the `Span` is missing some fields. +* Filter out unknown_cluster metric data. #### UI * Revert: cpm5d function. This feature is cancelled from backend. 
diff --git a/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-cluster.yaml b/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-cluster.yaml index 2f324d7b46..50b1e8b092 100644 --- a/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-cluster.yaml +++ b/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-cluster.yaml @@ -34,39 +34,39 @@ metricPrefix: meter_elasticsearch_cluster metricsRules: # cluster health - name: health_status - exp: elasticsearch_cluster_health_status.valueEqual(1).sum(['cluster' , 'color']) + exp: elasticsearch_cluster_health_status.tagNotEqual('cluster','unknown_cluster').valueEqual(1).sum(['cluster' , 'color']) # elasticsearch_breakers_tripped - name: breakers_tripped - exp: elasticsearch_breakers_tripped.sum(['cluster']).increase('PT1M') + exp: elasticsearch_breakers_tripped.tagNotEqual('cluster','unknown_cluster').sum(['cluster']).increase('PT1M') # cluster nodes - name: nodes - exp: elasticsearch_cluster_health_number_of_nodes.sum(['cluster']) + exp: elasticsearch_cluster_health_number_of_nodes.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) # cluster data nodes - name: data_nodes - exp: elasticsearch_cluster_health_number_of_data_nodes.sum(['cluster']) + exp: elasticsearch_cluster_health_number_of_data_nodes.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) # pending tasks total - name: pending_tasks_total - exp: elasticsearch_cluster_health_number_of_pending_tasks.sum(['cluster']) + exp: elasticsearch_cluster_health_number_of_pending_tasks.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) # cpu usage avg - name: cpu_usage_avg - exp: elasticsearch_process_cpu_percent.avg(['cluster']) + exp: elasticsearch_process_cpu_percent.tagNotEqual('cluster','unknown_cluster').avg(['cluster']) # jvm used memory avg - name: jvm_memory_used_avg - exp: 
elasticsearch_jvm_memory_used_bytes.sum(['cluster']) / elasticsearch_jvm_memory_max_bytes.sum(['cluster']) * 100 + exp: elasticsearch_jvm_memory_used_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) / elasticsearch_jvm_memory_max_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) * 100 # open file count - name: open_file_count - exp: elasticsearch_process_open_files_count.sum(['cluster']) + exp: elasticsearch_process_open_files_count.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) # shards - name: primary_shards_total - exp: elasticsearch_cluster_health_active_primary_shards.sum(['cluster']) + exp: elasticsearch_cluster_health_active_primary_shards.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) - name: shards_total - exp: elasticsearch_cluster_health_active_shards.sum(['cluster']) + exp: elasticsearch_cluster_health_active_shards.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) - name: initializing_shards_total - exp: elasticsearch_cluster_health_initializing_shards.sum(['cluster']) + exp: elasticsearch_cluster_health_initializing_shards.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) - name: delayed_unassigned_shards_total - exp: elasticsearch_cluster_health_delayed_unassigned_shards.sum(['cluster']) + exp: elasticsearch_cluster_health_delayed_unassigned_shards.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) - name: relocating_shards_total - exp: elasticsearch_cluster_health_relocating_shards.sum(['cluster']) + exp: elasticsearch_cluster_health_relocating_shards.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) - name: unassigned_shards_total - exp: elasticsearch_cluster_health_unassigned_shards.sum(['cluster']) \ No newline at end of file + exp: elasticsearch_cluster_health_unassigned_shards.tagNotEqual('cluster','unknown_cluster').sum(['cluster']) \ No newline at end of file diff --git 
a/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-index.yaml b/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-index.yaml index a31f058829..dc0af66953 100644 --- a/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-index.yaml +++ b/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-index.yaml @@ -33,95 +33,95 @@ expSuffix: tag({tags -> tags.cluster = 'elasticsearch::' + tags.cluster}).endpoi metricPrefix: meter_elasticsearch_index metricsRules: - name: stats_indexing_index_total_req_rate - exp: elasticsearch_index_stats_indexing_index_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_indexing_index_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_indexing_index_total_proc_rate - exp: 1 / (elasticsearch_index_stats_indexing_index_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_indexing_index_total.sum(['cluster' , 'index']).rate('PT1M')) + exp: 1 / (elasticsearch_index_stats_indexing_index_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_indexing_index_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M')) - name: stats_search_query_total_req_rate - exp: elasticsearch_index_stats_search_query_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_query_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_search_query_total_proc_rate - exp: 1 / ((elasticsearch_index_stats_search_query_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + elasticsearch_index_stats_search_fetch_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + elasticsearch_index_stats_search_scroll_time_seconds_total.sum(['cluster' , 
'index']).rate('PT1M') + elasticsearch_index_stats_search_suggest_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M')) / elasticsearch_index_stats_search_query_total.sum(['cluster' , 'index']).rate('PT1M')) + exp: 1 / ((elasticsearch_index_stats_search_query_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') + elasticsearch_index_stats_search_fetch_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') + elasticsearch_index_stats_search_scroll_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') + elasticsearch_index_stats_search_suggest_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M')) / elasticsearch_index_stats_search_query_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M')) - name: stats_merge_total_req_rate - exp: elasticsearch_index_stats_merge_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_merge_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_flush_total_req_rate - exp: elasticsearch_index_stats_flush_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_flush_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_refresh_total_req_rate - exp: elasticsearch_index_stats_refresh_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_refresh_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_warmer_total_req_rate - exp: elasticsearch_index_stats_warmer_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_warmer_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_indexing_delete_total_req_rate - exp: elasticsearch_index_stats_indexing_delete_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_indexing_delete_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: 
stats_search_fetch_total_req_rate - exp: elasticsearch_index_stats_search_fetch_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_fetch_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_search_scroll_total_req_rate - exp: elasticsearch_index_stats_search_scroll_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_scroll_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_search_suggest_total_req_rate - exp: elasticsearch_index_stats_search_suggest_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_suggest_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_get_total_req_rate - exp: elasticsearch_index_stats_get_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_get_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_merge_time_seconds_total - exp: elasticsearch_index_stats_merge_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_merge_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_flush_time_seconds_total - exp: elasticsearch_index_stats_flush_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_flush_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_refresh_time_seconds_total - exp: elasticsearch_index_stats_refresh_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_refresh_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_warmer_time_seconds_total - exp: elasticsearch_index_stats_warmer_time_seconds_total.sum(['cluster' , 
'index']).rate('PT1M') + exp: elasticsearch_index_stats_warmer_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_indexing_delete_time_seconds_total - exp: elasticsearch_index_stats_indexing_delete_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_indexing_delete_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_search_fetch_time_seconds_total - exp: elasticsearch_index_stats_search_fetch_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_fetch_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_search_query_time_seconds_total - exp: elasticsearch_index_stats_search_query_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_query_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_search_scroll_time_seconds_total - exp: elasticsearch_index_stats_search_scroll_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_scroll_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_search_suggest_time_seconds_total - exp: elasticsearch_index_stats_search_suggest_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_suggest_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_indexing_index_time_seconds_total - exp: elasticsearch_index_stats_indexing_index_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_indexing_index_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: 
stats_get_time_seconds_total - exp: elasticsearch_index_stats_get_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_get_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_merge_stopped_time_seconds_total - exp: elasticsearch_index_stats_merge_stopped_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_merge_stopped_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_merge_throttle_time_seconds_total - exp: elasticsearch_index_stats_merge_throttle_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_merge_throttle_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: stats_indexing_throttle_time_seconds_total - exp: elasticsearch_index_stats_indexing_throttle_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_indexing_throttle_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: search_fetch_avg_time - exp: elasticsearch_index_stats_search_fetch_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_search_fetch_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_fetch_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_search_fetch_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: search_query_avg_time - exp: elasticsearch_index_stats_search_query_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_search_query_total.sum(['cluster' , 'index']).rate('PT1M') + exp: 
elasticsearch_index_stats_search_query_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_search_query_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: search_scroll_avg_time - exp: elasticsearch_index_stats_search_scroll_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_search_scroll_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_scroll_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_search_scroll_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: search_suggest_avg_time - exp: elasticsearch_index_stats_search_suggest_time_seconds_total.sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_search_suggest_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_index_stats_search_suggest_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') / elasticsearch_index_stats_search_suggest_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: indices_docs_primary - exp: elasticsearch_indices_docs_primary.sum(['cluster' , 'index']) + exp: elasticsearch_indices_docs_primary.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']) - name: indices_docs_primary_rate - exp: elasticsearch_indices_docs_primary.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_indices_docs_primary.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: indices_store_size_bytes_primary - exp: elasticsearch_indices_store_size_bytes_primary.sum(['cluster' , 'index']) + exp: elasticsearch_indices_store_size_bytes_primary.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']) - name: indices_docs_total - exp: 
elasticsearch_indices_docs_total.sum(['cluster' , 'index']) + exp: elasticsearch_indices_docs_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']) - name: indices_docs_total_rate - exp: elasticsearch_indices_docs_total.sum(['cluster' , 'index']).rate('PT1M') + exp: elasticsearch_indices_docs_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']).rate('PT1M') - name: indices_store_size_bytes_total - exp: elasticsearch_indices_store_size_bytes_total.sum(['cluster' , 'index']) + exp: elasticsearch_indices_store_size_bytes_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']) - name: indices_deleted_docs_primary - exp: elasticsearch_indices_deleted_docs_primary.sum(['cluster' , 'index']) + exp: elasticsearch_indices_deleted_docs_primary.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']) - name: indices_segment_count_total - exp: elasticsearch_indices_segment_count_total.sum(['cluster' , 'index']) + exp: elasticsearch_indices_segment_count_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']) - name: indices_segment_memory_bytes_total - exp: elasticsearch_indices_segment_memory_bytes_total.sum(['cluster' , 'index']) + exp: elasticsearch_indices_segment_memory_bytes_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']) - name: indices_segment_count_primary - exp: elasticsearch_indices_segment_count_primary.sum(['cluster' , 'index']) + exp: elasticsearch_indices_segment_count_primary.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']) - name: indices_segment_memory_bytes_primary - exp: elasticsearch_indices_segment_memory_bytes_primary.sum(['cluster' , 'index']) + exp: elasticsearch_indices_segment_memory_bytes_primary.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index']) - name: indices_shards_docs - exp: elasticsearch_indices_shards_docs.sum(['cluster' , 'index' , 'primary' , 'shard']).tag({tags -> if (tags['primary'] == 
'true') {tags.primary = 'primary'} else {tags.primary = 'replica'} }) \ No newline at end of file + exp: elasticsearch_indices_shards_docs.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'index' , 'primary' , 'shard']).tag({tags -> if (tags['primary'] == 'true') {tags.primary = 'primary'} else {tags.primary = 'replica'} }) \ No newline at end of file diff --git a/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-node.yaml b/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-node.yaml index 90f428a3e8..1650b94403 100644 --- a/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-node.yaml +++ b/oap-server/server-starter/src/main/resources/otel-rules/elasticsearch/elasticsearch-node.yaml @@ -34,116 +34,116 @@ metricPrefix: meter_elasticsearch_node metricsRules: # node rules - name: rules - exp: elasticsearch_process_cpu_percent.sum(['cluster' , 'name' , 'es_client_node' , 'es_data_node' , 'es_ingest_node' , 'es_master_node']) + exp: elasticsearch_process_cpu_percent.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'es_client_node' , 'es_data_node' , 'es_ingest_node' , 'es_master_node']) - name: open_file_count - exp: elasticsearch_process_open_files_count.sum(['cluster' , 'name']) + exp: elasticsearch_process_open_files_count.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) - name: all_disk_free_space - exp: elasticsearch_filesystem_data_available_bytes.sum(['cluster' , 'name']) + exp: elasticsearch_filesystem_data_available_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) - name: jvm_memory_used - exp: elasticsearch_jvm_memory_used_bytes.sum(['cluster' , 'name']) + exp: elasticsearch_jvm_memory_used_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) # jvm - name: jvm_memory_nonheap_used - exp: elasticsearch_jvm_memory_used_bytes.tagEqual('area' , 'non-heap').sum(['cluster' , 
'name']) + exp: elasticsearch_jvm_memory_used_bytes.tagNotEqual('cluster','unknown_cluster').tagEqual('area' , 'non-heap').sum(['cluster' , 'name']) - name: jvm_memory_heap_used - exp: elasticsearch_jvm_memory_used_bytes.tagEqual('area' , 'heap').sum(['cluster' , 'name']) + exp: elasticsearch_jvm_memory_used_bytes.tagNotEqual('cluster','unknown_cluster').tagEqual('area' , 'heap').sum(['cluster' , 'name']) - name: jvm_memory_heap_max - exp: elasticsearch_jvm_memory_max_bytes.tagEqual('area' , 'heap').sum(['cluster' , 'name']) + exp: elasticsearch_jvm_memory_max_bytes.tagNotEqual('cluster','unknown_cluster').tagEqual('area' , 'heap').sum(['cluster' , 'name']) - name: jvm_memory_nonheap_committed - exp: elasticsearch_jvm_memory_committed_bytes.tagEqual('area' , 'non-heap').sum(['cluster' , 'name']) + exp: elasticsearch_jvm_memory_committed_bytes.tagNotEqual('cluster','unknown_cluster').tagEqual('area' , 'non-heap').sum(['cluster' , 'name']) - name: jvm_memory_heap_committed - exp: elasticsearch_jvm_memory_committed_bytes.tagEqual('area' , 'heap').sum(['cluster' , 'name']) + exp: elasticsearch_jvm_memory_committed_bytes.tagNotEqual('cluster','unknown_cluster').tagEqual('area' , 'heap').sum(['cluster' , 'name']) - name: jvm_memory_pool_peak_used - exp: elasticsearch_jvm_memory_pool_peak_used_bytes.sum(['cluster' , 'name' , 'pool']) + exp: elasticsearch_jvm_memory_pool_peak_used_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'pool']) - name: jvm_gc_count - exp: elasticsearch_jvm_gc_collection_seconds_count.sum(['cluster' , 'name' , 'gc']).increase('PT1M') + exp: elasticsearch_jvm_gc_collection_seconds_count.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'gc']).increase('PT1M') - name: jvm_gc_time - exp: (elasticsearch_jvm_gc_collection_seconds_sum * 1000).sum(['cluster' , 'name' , 'gc']).increase('PT1M') + exp: (elasticsearch_jvm_gc_collection_seconds_sum * 1000).tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 
'name' , 'gc']).increase('PT1M') # cpu - name: process_cpu_percent - exp: elasticsearch_process_cpu_percent.sum(['cluster' , 'name']) + exp: elasticsearch_process_cpu_percent.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) - name: os_cpu_percent - exp: elasticsearch_os_cpu_percent.sum(['cluster' , 'name']) + exp: elasticsearch_os_cpu_percent.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) - name: os_load1 - exp: elasticsearch_os_load1.sum(['cluster' , 'name']) * 100 + exp: elasticsearch_os_load1.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) * 100 - name: os_load5 - exp: elasticsearch_os_load5.sum(['cluster' , 'name']) * 100 + exp: elasticsearch_os_load5.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) * 100 - name: os_load15 - exp: elasticsearch_os_load15.sum(['cluster' , 'name']) * 100 + exp: elasticsearch_os_load15.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) * 100 # translog - name: indices_translog_operations - exp: elasticsearch_indices_translog_operations.sum(['cluster' , 'name']).irate() + exp: elasticsearch_indices_translog_operations.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).irate() - name: indices_translog_size - exp: elasticsearch_indices_translog_size_in_bytes.sum(['cluster' , 'name']).irate() + exp: elasticsearch_indices_translog_size_in_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).irate() # breakers tripped - name: breakers_tripped - exp: elasticsearch_breakers_tripped.sum(['cluster' , 'name' , 'breaker']).increase('PT1M') + exp: elasticsearch_breakers_tripped.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'breaker']).increase('PT1M') - name: breakers_estimated_size - exp: elasticsearch_breakers_estimated_size_bytes.sum(['cluster' , 'name' , 'breaker']) + exp: elasticsearch_breakers_estimated_size_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'breaker']) # 
disk - name: disk_usage_percent - exp: 100 - (elasticsearch_filesystem_data_available_bytes * 100).sum(['cluster' , 'name' , 'mount']) / elasticsearch_filesystem_data_size_bytes.sum(['cluster' , 'name' , 'mount']) + exp: 100 - (elasticsearch_filesystem_data_available_bytes * 100).tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'mount']) / elasticsearch_filesystem_data_size_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'mount']) - name: disk_usage - exp: elasticsearch_filesystem_data_size_bytes.sum(['cluster' , 'name' , 'mount']) - elasticsearch_filesystem_data_available_bytes.sum(['cluster' , 'name' , 'mount']) + exp: elasticsearch_filesystem_data_size_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'mount']) - elasticsearch_filesystem_data_available_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'mount']) - name: disk_io_read_bytes - exp: elasticsearch_filesystem_io_stats_device_read_size_kilobytes_sum.sum(['cluster' , 'name' , 'mount']).irate() + exp: elasticsearch_filesystem_io_stats_device_read_size_kilobytes_sum.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'mount']).irate() - name: disk_io_write_bytes - exp: elasticsearch_filesystem_io_stats_device_write_size_kilobytes_sum.sum(['cluster' , 'name' , 'mount']).irate() + exp: elasticsearch_filesystem_io_stats_device_write_size_kilobytes_sum.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name' , 'mount']).irate() # network - name: network_send_bytes - exp: elasticsearch_transport_tx_size_bytes_total.sum(['cluster' , 'name']).irate() + exp: elasticsearch_transport_tx_size_bytes_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).irate() - name: network_receive_bytes - exp: elasticsearch_transport_rx_size_bytes_total.sum(['cluster' , 'name']).irate() + exp: elasticsearch_transport_rx_size_bytes_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 
'name']).irate() # operations - name: indices_search_query_total_req_rate - exp: elasticsearch_indices_search_query_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_search_query_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_search_query_time_seconds_proc_rate - exp: 1 / ((elasticsearch_indices_search_query_time_seconds.sum(['cluster' , 'name']).rate('PT1M') + elasticsearch_indices_search_fetch_time_seconds.sum(['cluster' , 'name']).rate('PT1M') + elasticsearch_indices_search_scroll_time_seconds.sum(['cluster' , 'name']).rate('PT1M') + elasticsearch_indices_search_suggest_time_seconds.sum(['cluster' , 'name']).rate('PT1M')) / elasticsearch_indices_search_query_total.sum(['cluster' , 'name']).rate('PT1M')) + exp: 1 / ((elasticsearch_indices_search_query_time_seconds.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') + elasticsearch_indices_search_fetch_time_seconds.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') + elasticsearch_indices_search_scroll_time_seconds.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') + elasticsearch_indices_search_suggest_time_seconds.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M')) / elasticsearch_indices_search_query_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M')) 
- name: indices_search_fetch_total_req_rate - exp: elasticsearch_indices_search_fetch_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_search_fetch_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_search_fetch_time_seconds - exp: elasticsearch_indices_search_fetch_time_seconds.sum(['cluster' , 'name']).increase('PT1M') + exp: elasticsearch_indices_search_fetch_time_seconds.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).increase('PT1M') - name: indices_indexing_index_total_req_rate - exp: elasticsearch_indices_indexing_index_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_indexing_index_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_indexing_index_total_proc_rate - exp: 1 / (elasticsearch_indices_indexing_index_time_seconds_total.sum(['cluster' , 'name']).rate('PT1M') / elasticsearch_indices_indexing_index_total.sum(['cluster' , 'name']).rate('PT1M')) + exp: 1 / (elasticsearch_indices_indexing_index_time_seconds_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') / elasticsearch_indices_indexing_index_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M')) - name: indices_merges_total_req_rate - exp: elasticsearch_indices_merges_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_merges_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_refresh_total_req_rate - exp: elasticsearch_indices_refresh_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_refresh_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_flush_total_req_rate - exp: elasticsearch_indices_flush_total.sum(['cluster' , 'name']).rate('PT1M') + exp: 
elasticsearch_indices_flush_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_get_exists_total_req_rate - exp: elasticsearch_indices_get_exists_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_get_exists_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_get_missing_total_req_rate - exp: elasticsearch_indices_get_missing_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_get_missing_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_get_total_req_rate - exp: elasticsearch_indices_get_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_get_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_indexing_delete_total_req_rate - exp: elasticsearch_indices_indexing_delete_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_indexing_delete_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_search_scroll_total_req_rate - exp: elasticsearch_indices_search_scroll_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_search_scroll_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_search_suggest_total_req_rate - exp: elasticsearch_indices_search_suggest_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_search_suggest_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_docs - exp: elasticsearch_indices_docs.sum(['cluster' , 'name']) + exp: elasticsearch_indices_docs.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) - name: indices_docs_deleted_total - exp: elasticsearch_indices_docs_deleted.sum(['cluster' , 'name']) + exp: 
elasticsearch_indices_docs_deleted.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) - name: indices_docs_deleted - exp: elasticsearch_indices_docs_deleted.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_docs_deleted.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_merges_docs_total - exp: elasticsearch_indices_merges_docs_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_merges_docs_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: indices_merges_total_size_bytes_total - exp: elasticsearch_indices_merges_total_size_bytes_total.sum(['cluster' , 'name']).rate('PT1M') + exp: elasticsearch_indices_merges_total_size_bytes_total.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']).rate('PT1M') - name: segment_count - exp: elasticsearch_indices_segments_count.sum(['cluster' , 'name']) + exp: elasticsearch_indices_segments_count.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) - name: segment_memory - exp: elasticsearch_indices_segments_memory_bytes.sum(['cluster' , 'name']) \ No newline at end of file + exp: elasticsearch_indices_segments_memory_bytes.tagNotEqual('cluster','unknown_cluster').sum(['cluster' , 'name']) \ No newline at end of file