# Prometheus recording rules for Cortex.
#
# Most groups below repeat the same six-rule pattern for a histogram metric
# <m> and a set of grouping labels <labels>:
#   <prefix>:<m>:99quantile        histogram_quantile(0.99, ...) over 1m bucket rates
#   <prefix>:<m>:50quantile        histogram_quantile(0.50, ...) over 1m bucket rates
#   <prefix>:<m>:avg               rate(<m>_sum[1m]) / rate(<m>_count[1m])
#   <prefix>:<m>_bucket:sum_rate   summed 1m rate of <m>_bucket (keeps `le`)
#   <prefix>:<m>_sum:sum_rate      summed 1m rate of <m>_sum
#   <prefix>:<m>_count:sum_rate    summed 1m rate of <m>_count
# where <prefix> is the grouping labels joined by "_".
groups:
  # ---------------------------------------------------------------------------
  # cortex_request_duration_seconds at three aggregation levels.
  # ---------------------------------------------------------------------------
  - name: cortex_api
    rules:
      # by (cluster, job)
      - record: cluster_job:cortex_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_request_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_request_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_request_duration_seconds_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_request_duration_seconds_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_request_duration_seconds_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_request_duration_seconds_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_request_duration_seconds_count[1m])) by (cluster, job)

      # by (cluster, job, route)
      - record: cluster_job_route:cortex_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_request_duration_seconds_bucket[1m])) by (le, cluster, job, route))
      - record: cluster_job_route:cortex_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_request_duration_seconds_bucket[1m])) by (le, cluster, job, route))
      - record: cluster_job_route:cortex_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_request_duration_seconds_sum[1m])) by (cluster, job, route)
          /
          sum(rate(cortex_request_duration_seconds_count[1m])) by (cluster, job, route)
      - record: cluster_job_route:cortex_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_request_duration_seconds_bucket[1m])) by (le, cluster, job, route)
      - record: cluster_job_route:cortex_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_request_duration_seconds_sum[1m])) by (cluster, job, route)
      - record: cluster_job_route:cortex_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_request_duration_seconds_count[1m])) by (cluster, job, route)

      # by (cluster, namespace, job, route)
      - record: cluster_namespace_job_route:cortex_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_request_duration_seconds_bucket[1m])) by (le, cluster, namespace, job, route))
      - record: cluster_namespace_job_route:cortex_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_request_duration_seconds_bucket[1m])) by (le, cluster, namespace, job, route))
      - record: cluster_namespace_job_route:cortex_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_request_duration_seconds_sum[1m])) by (cluster, namespace, job, route)
          /
          sum(rate(cortex_request_duration_seconds_count[1m])) by (cluster, namespace, job, route)
      - record: cluster_namespace_job_route:cortex_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_request_duration_seconds_bucket[1m])) by (le, cluster, namespace, job, route)
      - record: cluster_namespace_job_route:cortex_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_request_duration_seconds_sum[1m])) by (cluster, namespace, job, route)
      - record: cluster_namespace_job_route:cortex_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_request_duration_seconds_count[1m])) by (cluster, namespace, job, route)

  # ---------------------------------------------------------------------------
  # cortex_querier_request_duration_seconds at the same three levels.
  # ---------------------------------------------------------------------------
  - name: cortex_querier_api
    rules:
      # by (cluster, job)
      - record: cluster_job:cortex_querier_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_querier_request_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_querier_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_querier_request_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_querier_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_querier_request_duration_seconds_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_querier_request_duration_seconds_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_querier_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_querier_request_duration_seconds_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_querier_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_querier_request_duration_seconds_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_querier_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_querier_request_duration_seconds_count[1m])) by (cluster, job)

      # by (cluster, job, route)
      - record: cluster_job_route:cortex_querier_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_querier_request_duration_seconds_bucket[1m])) by (le, cluster, job, route))
      - record: cluster_job_route:cortex_querier_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_querier_request_duration_seconds_bucket[1m])) by (le, cluster, job, route))
      - record: cluster_job_route:cortex_querier_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_querier_request_duration_seconds_sum[1m])) by (cluster, job, route)
          /
          sum(rate(cortex_querier_request_duration_seconds_count[1m])) by (cluster, job, route)
      - record: cluster_job_route:cortex_querier_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_querier_request_duration_seconds_bucket[1m])) by (le, cluster, job, route)
      - record: cluster_job_route:cortex_querier_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_querier_request_duration_seconds_sum[1m])) by (cluster, job, route)
      - record: cluster_job_route:cortex_querier_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_querier_request_duration_seconds_count[1m])) by (cluster, job, route)

      # by (cluster, namespace, job, route)
      - record: cluster_namespace_job_route:cortex_querier_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_querier_request_duration_seconds_bucket[1m])) by (le, cluster, namespace, job, route))
      - record: cluster_namespace_job_route:cortex_querier_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_querier_request_duration_seconds_bucket[1m])) by (le, cluster, namespace, job, route))
      - record: cluster_namespace_job_route:cortex_querier_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_querier_request_duration_seconds_sum[1m])) by (cluster, namespace, job, route)
          /
          sum(rate(cortex_querier_request_duration_seconds_count[1m])) by (cluster, namespace, job, route)
      - record: cluster_namespace_job_route:cortex_querier_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_querier_request_duration_seconds_bucket[1m])) by (le, cluster, namespace, job, route)
      - record: cluster_namespace_job_route:cortex_querier_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_querier_request_duration_seconds_sum[1m])) by (cluster, namespace, job, route)
      - record: cluster_namespace_job_route:cortex_querier_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_querier_request_duration_seconds_count[1m])) by (cluster, namespace, job, route)

  # ---------------------------------------------------------------------------
  # Cache request durations (memcache client and generic cache).
  # ---------------------------------------------------------------------------
  - name: cortex_cache
    rules:
      # cortex_memcache_request_duration_seconds by (cluster, job, method)
      - record: cluster_job_method:cortex_memcache_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_memcache_request_duration_seconds_bucket[1m])) by (le, cluster, job, method))
      - record: cluster_job_method:cortex_memcache_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_memcache_request_duration_seconds_bucket[1m])) by (le, cluster, job, method))
      - record: cluster_job_method:cortex_memcache_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_memcache_request_duration_seconds_sum[1m])) by (cluster, job, method)
          /
          sum(rate(cortex_memcache_request_duration_seconds_count[1m])) by (cluster, job, method)
      - record: cluster_job_method:cortex_memcache_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_memcache_request_duration_seconds_bucket[1m])) by (le, cluster, job, method)
      - record: cluster_job_method:cortex_memcache_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_memcache_request_duration_seconds_sum[1m])) by (cluster, job, method)
      - record: cluster_job_method:cortex_memcache_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_memcache_request_duration_seconds_count[1m])) by (cluster, job, method)

      # cortex_cache_request_duration_seconds by (cluster, job)
      - record: cluster_job:cortex_cache_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_cache_request_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_cache_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_cache_request_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_cache_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_cache_request_duration_seconds_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_cache_request_duration_seconds_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_cache_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_cache_request_duration_seconds_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_cache_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_cache_request_duration_seconds_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_cache_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_cache_request_duration_seconds_count[1m])) by (cluster, job)

      # cortex_cache_request_duration_seconds by (cluster, job, method)
      - record: cluster_job_method:cortex_cache_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_cache_request_duration_seconds_bucket[1m])) by (le, cluster, job, method))
      - record: cluster_job_method:cortex_cache_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_cache_request_duration_seconds_bucket[1m])) by (le, cluster, job, method))
      - record: cluster_job_method:cortex_cache_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_cache_request_duration_seconds_sum[1m])) by (cluster, job, method)
          /
          sum(rate(cortex_cache_request_duration_seconds_count[1m])) by (cluster, job, method)
      - record: cluster_job_method:cortex_cache_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_cache_request_duration_seconds_bucket[1m])) by (le, cluster, job, method)
      - record: cluster_job_method:cortex_cache_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_cache_request_duration_seconds_sum[1m])) by (cluster, job, method)
      - record: cluster_job_method:cortex_cache_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_cache_request_duration_seconds_count[1m])) by (cluster, job, method)

  # ---------------------------------------------------------------------------
  # Storage backends, chunk-store per-query histograms, database, GCS and KV.
  # ---------------------------------------------------------------------------
  - name: cortex_storage
    rules:
      # cortex_bigtable_request_duration_seconds by (cluster, job, operation)
      - record: cluster_job_operation:cortex_bigtable_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_bigtable_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation))
      - record: cluster_job_operation:cortex_bigtable_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_bigtable_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation))
      - record: cluster_job_operation:cortex_bigtable_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_bigtable_request_duration_seconds_sum[1m])) by (cluster, job, operation)
          /
          sum(rate(cortex_bigtable_request_duration_seconds_count[1m])) by (cluster, job, operation)
      - record: cluster_job_operation:cortex_bigtable_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_bigtable_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation)
      - record: cluster_job_operation:cortex_bigtable_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_bigtable_request_duration_seconds_sum[1m])) by (cluster, job, operation)
      - record: cluster_job_operation:cortex_bigtable_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_bigtable_request_duration_seconds_count[1m])) by (cluster, job, operation)

      # cortex_cassandra_request_duration_seconds by (cluster, job, operation)
      - record: cluster_job_operation:cortex_cassandra_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_cassandra_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation))
      - record: cluster_job_operation:cortex_cassandra_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_cassandra_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation))
      - record: cluster_job_operation:cortex_cassandra_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_cassandra_request_duration_seconds_sum[1m])) by (cluster, job, operation)
          /
          sum(rate(cortex_cassandra_request_duration_seconds_count[1m])) by (cluster, job, operation)
      - record: cluster_job_operation:cortex_cassandra_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_cassandra_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation)
      - record: cluster_job_operation:cortex_cassandra_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_cassandra_request_duration_seconds_sum[1m])) by (cluster, job, operation)
      - record: cluster_job_operation:cortex_cassandra_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_cassandra_request_duration_seconds_count[1m])) by (cluster, job, operation)

      # cortex_dynamo_request_duration_seconds by (cluster, job, operation)
      - record: cluster_job_operation:cortex_dynamo_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_dynamo_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation))
      - record: cluster_job_operation:cortex_dynamo_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_dynamo_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation))
      - record: cluster_job_operation:cortex_dynamo_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_dynamo_request_duration_seconds_sum[1m])) by (cluster, job, operation)
          /
          sum(rate(cortex_dynamo_request_duration_seconds_count[1m])) by (cluster, job, operation)
      - record: cluster_job_operation:cortex_dynamo_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_dynamo_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation)
      - record: cluster_job_operation:cortex_dynamo_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_dynamo_request_duration_seconds_sum[1m])) by (cluster, job, operation)
      - record: cluster_job_operation:cortex_dynamo_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_dynamo_request_duration_seconds_count[1m])) by (cluster, job, operation)

      # cortex_chunk_store_index_lookups_per_query by (cluster, job)
      - record: cluster_job:cortex_chunk_store_index_lookups_per_query:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_chunk_store_index_lookups_per_query_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_chunk_store_index_lookups_per_query:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_chunk_store_index_lookups_per_query_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_chunk_store_index_lookups_per_query:avg
        expr: >-
          sum(rate(cortex_chunk_store_index_lookups_per_query_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_chunk_store_index_lookups_per_query_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_chunk_store_index_lookups_per_query_bucket:sum_rate
        expr: sum(rate(cortex_chunk_store_index_lookups_per_query_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_chunk_store_index_lookups_per_query_sum:sum_rate
        expr: sum(rate(cortex_chunk_store_index_lookups_per_query_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_chunk_store_index_lookups_per_query_count:sum_rate
        expr: sum(rate(cortex_chunk_store_index_lookups_per_query_count[1m])) by (cluster, job)

      # cortex_chunk_store_series_pre_intersection_per_query by (cluster, job)
      - record: cluster_job:cortex_chunk_store_series_pre_intersection_per_query:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_chunk_store_series_pre_intersection_per_query_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_chunk_store_series_pre_intersection_per_query:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_chunk_store_series_pre_intersection_per_query_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_chunk_store_series_pre_intersection_per_query:avg
        expr: >-
          sum(rate(cortex_chunk_store_series_pre_intersection_per_query_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_chunk_store_series_pre_intersection_per_query_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_chunk_store_series_pre_intersection_per_query_bucket:sum_rate
        expr: sum(rate(cortex_chunk_store_series_pre_intersection_per_query_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_chunk_store_series_pre_intersection_per_query_sum:sum_rate
        expr: sum(rate(cortex_chunk_store_series_pre_intersection_per_query_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_chunk_store_series_pre_intersection_per_query_count:sum_rate
        expr: sum(rate(cortex_chunk_store_series_pre_intersection_per_query_count[1m])) by (cluster, job)

      # cortex_chunk_store_series_post_intersection_per_query by (cluster, job)
      - record: cluster_job:cortex_chunk_store_series_post_intersection_per_query:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_chunk_store_series_post_intersection_per_query_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_chunk_store_series_post_intersection_per_query:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_chunk_store_series_post_intersection_per_query_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_chunk_store_series_post_intersection_per_query:avg
        expr: >-
          sum(rate(cortex_chunk_store_series_post_intersection_per_query_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_chunk_store_series_post_intersection_per_query_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_chunk_store_series_post_intersection_per_query_bucket:sum_rate
        expr: sum(rate(cortex_chunk_store_series_post_intersection_per_query_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_chunk_store_series_post_intersection_per_query_sum:sum_rate
        expr: sum(rate(cortex_chunk_store_series_post_intersection_per_query_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_chunk_store_series_post_intersection_per_query_count:sum_rate
        expr: sum(rate(cortex_chunk_store_series_post_intersection_per_query_count[1m])) by (cluster, job)

      # cortex_chunk_store_chunks_per_query by (cluster, job)
      - record: cluster_job:cortex_chunk_store_chunks_per_query:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_chunk_store_chunks_per_query_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_chunk_store_chunks_per_query:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_chunk_store_chunks_per_query_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_chunk_store_chunks_per_query:avg
        expr: >-
          sum(rate(cortex_chunk_store_chunks_per_query_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_chunk_store_chunks_per_query_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_chunk_store_chunks_per_query_bucket:sum_rate
        expr: sum(rate(cortex_chunk_store_chunks_per_query_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_chunk_store_chunks_per_query_sum:sum_rate
        expr: sum(rate(cortex_chunk_store_chunks_per_query_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_chunk_store_chunks_per_query_count:sum_rate
        expr: sum(rate(cortex_chunk_store_chunks_per_query_count[1m])) by (cluster, job)

      # cortex_database_request_duration_seconds by (cluster, job, method)
      - record: cluster_job_method:cortex_database_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_database_request_duration_seconds_bucket[1m])) by (le, cluster, job, method))
      - record: cluster_job_method:cortex_database_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_database_request_duration_seconds_bucket[1m])) by (le, cluster, job, method))
      - record: cluster_job_method:cortex_database_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_database_request_duration_seconds_sum[1m])) by (cluster, job, method)
          /
          sum(rate(cortex_database_request_duration_seconds_count[1m])) by (cluster, job, method)
      - record: cluster_job_method:cortex_database_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_database_request_duration_seconds_bucket[1m])) by (le, cluster, job, method)
      - record: cluster_job_method:cortex_database_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_database_request_duration_seconds_sum[1m])) by (cluster, job, method)
      - record: cluster_job_method:cortex_database_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_database_request_duration_seconds_count[1m])) by (cluster, job, method)

      # cortex_gcs_request_duration_seconds by (cluster, job, operation)
      - record: cluster_job_operation:cortex_gcs_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_gcs_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation))
      - record: cluster_job_operation:cortex_gcs_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_gcs_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation))
      - record: cluster_job_operation:cortex_gcs_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_gcs_request_duration_seconds_sum[1m])) by (cluster, job, operation)
          /
          sum(rate(cortex_gcs_request_duration_seconds_count[1m])) by (cluster, job, operation)
      - record: cluster_job_operation:cortex_gcs_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_gcs_request_duration_seconds_bucket[1m])) by (le, cluster, job, operation)
      - record: cluster_job_operation:cortex_gcs_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_gcs_request_duration_seconds_sum[1m])) by (cluster, job, operation)
      - record: cluster_job_operation:cortex_gcs_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_gcs_request_duration_seconds_count[1m])) by (cluster, job, operation)

      # cortex_kv_request_duration_seconds by (cluster, job)
      - record: cluster_job:cortex_kv_request_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_kv_request_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_kv_request_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_kv_request_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_kv_request_duration_seconds:avg
        expr: >-
          sum(rate(cortex_kv_request_duration_seconds_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_kv_request_duration_seconds_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_kv_request_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_kv_request_duration_seconds_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_kv_request_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_kv_request_duration_seconds_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_kv_request_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_kv_request_duration_seconds_count[1m])) by (cluster, job)

  # ---------------------------------------------------------------------------
  # Query-frontend and ingester query histograms, all by (cluster, job).
  # ---------------------------------------------------------------------------
  - name: cortex_queries
    rules:
      # cortex_query_frontend_retries
      - record: cluster_job:cortex_query_frontend_retries:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_query_frontend_retries_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_query_frontend_retries:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_query_frontend_retries_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_query_frontend_retries:avg
        expr: >-
          sum(rate(cortex_query_frontend_retries_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_query_frontend_retries_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_query_frontend_retries_bucket:sum_rate
        expr: sum(rate(cortex_query_frontend_retries_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_query_frontend_retries_sum:sum_rate
        expr: sum(rate(cortex_query_frontend_retries_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_query_frontend_retries_count:sum_rate
        expr: sum(rate(cortex_query_frontend_retries_count[1m])) by (cluster, job)

      # cortex_query_frontend_queue_duration_seconds
      - record: cluster_job:cortex_query_frontend_queue_duration_seconds:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_query_frontend_queue_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_query_frontend_queue_duration_seconds:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_query_frontend_queue_duration_seconds_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_query_frontend_queue_duration_seconds:avg
        expr: >-
          sum(rate(cortex_query_frontend_queue_duration_seconds_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_query_frontend_queue_duration_seconds_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_query_frontend_queue_duration_seconds_bucket:sum_rate
        expr: sum(rate(cortex_query_frontend_queue_duration_seconds_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_query_frontend_queue_duration_seconds_sum:sum_rate
        expr: sum(rate(cortex_query_frontend_queue_duration_seconds_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_query_frontend_queue_duration_seconds_count:sum_rate
        expr: sum(rate(cortex_query_frontend_queue_duration_seconds_count[1m])) by (cluster, job)

      # cortex_ingester_queried_series
      - record: cluster_job:cortex_ingester_queried_series:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_ingester_queried_series_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_ingester_queried_series:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_ingester_queried_series_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_ingester_queried_series:avg
        expr: >-
          sum(rate(cortex_ingester_queried_series_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_ingester_queried_series_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_ingester_queried_series_bucket:sum_rate
        expr: sum(rate(cortex_ingester_queried_series_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_ingester_queried_series_sum:sum_rate
        expr: sum(rate(cortex_ingester_queried_series_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_ingester_queried_series_count:sum_rate
        expr: sum(rate(cortex_ingester_queried_series_count[1m])) by (cluster, job)

      # cortex_ingester_queried_chunks
      - record: cluster_job:cortex_ingester_queried_chunks:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_ingester_queried_chunks_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_ingester_queried_chunks:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_ingester_queried_chunks_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_ingester_queried_chunks:avg
        expr: >-
          sum(rate(cortex_ingester_queried_chunks_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_ingester_queried_chunks_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_ingester_queried_chunks_bucket:sum_rate
        expr: sum(rate(cortex_ingester_queried_chunks_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_ingester_queried_chunks_sum:sum_rate
        expr: sum(rate(cortex_ingester_queried_chunks_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_ingester_queried_chunks_count:sum_rate
        expr: sum(rate(cortex_ingester_queried_chunks_count[1m])) by (cluster, job)

      # cortex_ingester_queried_samples
      - record: cluster_job:cortex_ingester_queried_samples:99quantile
        expr: histogram_quantile(0.99, sum(rate(cortex_ingester_queried_samples_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_ingester_queried_samples:50quantile
        expr: histogram_quantile(0.50, sum(rate(cortex_ingester_queried_samples_bucket[1m])) by (le, cluster, job))
      - record: cluster_job:cortex_ingester_queried_samples:avg
        expr: >-
          sum(rate(cortex_ingester_queried_samples_sum[1m])) by (cluster, job)
          /
          sum(rate(cortex_ingester_queried_samples_count[1m])) by (cluster, job)
      - record: cluster_job:cortex_ingester_queried_samples_bucket:sum_rate
        expr: sum(rate(cortex_ingester_queried_samples_bucket[1m])) by (le, cluster, job)
      - record: cluster_job:cortex_ingester_queried_samples_sum:sum_rate
        expr: sum(rate(cortex_ingester_queried_samples_sum[1m])) by (cluster, job)
      - record: cluster_job:cortex_ingester_queried_samples_count:sum_rate
        expr: sum(rate(cortex_ingester_queried_samples_count[1m])) by (cluster, job)

  # ---------------------------------------------------------------------------
  # 5m rate of samples received by distributors. The recorded series is read
  # by the sample_rate rules in cortex_scaling_rules below.
  # ---------------------------------------------------------------------------
  - name: cortex_received_samples
    rules:
      - record: cluster_namespace_job:cortex_distributor_received_samples:rate5m
        expr: |
          sum by (cluster, namespace, job) (rate(cortex_distributor_received_samples_total[5m]))

  # ---------------------------------------------------------------------------
  # Replica-count estimates. Every rule except the first writes to the same
  # record name and is distinguished by its `reason` label (and, where set,
  # its `deployment` label).
  #
  # NOTE(review): the divisors 240000, 80000 and 1500000 look like per-replica
  # capacity targets and the `* 3` factors like a replication factor; neither
  # is stated anywhere in this file, so confirm against the generator config.
  # The literal 0.59999999999999998 is the same float64 value as 0.6.
  # ---------------------------------------------------------------------------
  - name: cortex_scaling_rules
    rules:
      # Current replica count per (cluster, namespace, deployment). Deployment
      # specs are used where present; otherwise statefulsets, with the
      # `statefulset` label copied into `deployment`.
      - record: cluster_namespace_deployment:actual_replicas:count
        expr: |
          sum by (cluster, namespace, deployment) (kube_deployment_spec_replicas)
          or
          sum by (cluster, namespace, deployment) (
            label_replace(kube_statefulset_replicas, "deployment", "$1", "statefulset", "(.*)")
          )

      # Distributors: 99th percentile over 24h of the received sample rate,
      # divided by 240000.
      - record: cluster_namespace_deployment_reason:required_replicas:count
        labels:
          deployment: distributor
          reason: sample_rate
        expr: |
          ceil(
            quantile_over_time(0.99,
              sum by (cluster, namespace) (
                cluster_namespace_job:cortex_distributor_received_samples:rate5m
              )[24h:]
            )
            / 240000
          )

      # Distributors: summed ingestion_rate overrides, scaled by 0.6, divided
      # by 240000.
      - record: cluster_namespace_deployment_reason:required_replicas:count
        labels:
          deployment: distributor
          reason: sample_rate_limits
        expr: |
          ceil(
            sum by (cluster, namespace) (cortex_overrides{limit_name="ingestion_rate"})
            * 0.59999999999999998 / 240000
          )

      # Ingesters: 99th percentile over 24h of the received sample rate,
      # times 3, divided by 80000.
      - record: cluster_namespace_deployment_reason:required_replicas:count
        labels:
          deployment: ingester
          reason: sample_rate
        expr: |
          ceil(
            quantile_over_time(0.99,
              sum by (cluster, namespace) (
                cluster_namespace_job:cortex_distributor_received_samples:rate5m
              )[24h:]
            )
            * 3 / 80000
          )

      # Ingesters: 99th percentile over 24h of in-memory series, divided by
      # 1500000.
      - record: cluster_namespace_deployment_reason:required_replicas:count
        labels:
          deployment: ingester
          reason: active_series
        expr: |
          ceil(
            quantile_over_time(0.99,
              sum by(cluster, namespace) (
                cortex_ingester_memory_series
              )[24h:]
            )
            / 1500000
          )

      # Ingesters: summed max_global_series_per_user overrides, times 3,
      # scaled by 0.6, divided by 1500000.
      - record: cluster_namespace_deployment_reason:required_replicas:count
        labels:
          deployment: ingester
          reason: active_series_limits
        expr: |
          ceil(
            sum by (cluster, namespace) (cortex_overrides{limit_name="max_global_series_per_user"})
            * 3 * 0.59999999999999998 / 1500000
          )

      # Ingesters: summed ingestion_rate overrides, scaled by 0.6, divided by
      # 80000.
      - record: cluster_namespace_deployment_reason:required_replicas:count
        labels:
          deployment: ingester
          reason: sample_rate_limits
        expr: |
          ceil(
            sum by (cluster, namespace) (cortex_overrides{limit_name="ingestion_rate"})
            * 0.59999999999999998 / 80000
          )

      # Memcached: a quarter of the ingesters' TSDB block bytes divided by the
      # average memcached byte limit.
      - record: cluster_namespace_deployment_reason:required_replicas:count
        labels:
          deployment: memcached
          reason: active_series
        expr: |
          ceil(
            (sum by (cluster, namespace) (
              cortex_ingester_tsdb_storage_blocks_bytes{job=~".+/ingester"}
            ) / 4)
              /
            avg by (cluster, namespace) (
              memcached_limit_bytes{job=~".+/memcached"}
            )
          )

      # Any deployment: actual replicas scaled by (p99 CPU usage over 24h at
      # 5m resolution) / (summed CPU requests). The `deployment` label is
      # taken from capture group 1 of the pod-name regex.
      # NOTE(review): kube_pod_container_resource_requests_cpu_cores appears
      # to be the kube-state-metrics v1 metric name; confirm it is still
      # exported in the target environment.
      - record: cluster_namespace_deployment_reason:required_replicas:count
        labels:
          reason: cpu_usage
        expr: |
          ceil(
            cluster_namespace_deployment:actual_replicas:count
              *
            quantile_over_time(0.99,
              sum by (cluster, namespace, deployment) (
                label_replace(
                  node_namespace_pod_container:container_cpu_usage_seconds_total:sum_rate,
                  "deployment", "$1", "pod", "(.*)-(?:([0-9]+)|([a-z0-9]+)-([a-z0-9]+))"
                )
              )[24h:5m]
            )
              /
            sum by (cluster, namespace, deployment) (
              label_replace(
                kube_pod_container_resource_requests_cpu_cores,
                "deployment", "$1", "pod", "(.*)-(?:([0-9]+)|([a-z0-9]+)-([a-z0-9]+))"
              )
            )
          )

      # Any deployment: same shape as the CPU rule, using memory usage bytes
      # over memory requests.
      # NOTE(review): kube_pod_container_resource_requests_memory_bytes
      # appears to be the kube-state-metrics v1 metric name; confirm it is
      # still exported in the target environment.
      - record: cluster_namespace_deployment_reason:required_replicas:count
        labels:
          reason: memory_usage
        expr: |
          ceil(
            cluster_namespace_deployment:actual_replicas:count
              *
            quantile_over_time(0.99,
              sum by (cluster, namespace, deployment) (
                label_replace(
                  container_memory_usage_bytes,
                  "deployment", "$1", "pod", "(.*)-(?:([0-9]+)|([a-z0-9]+)-([a-z0-9]+))"
                )
              )[24h:5m]
            )
              /
            sum by (cluster, namespace, deployment) (
              label_replace(
                kube_pod_container_resource_requests_memory_bytes,
                "deployment", "$1", "pod", "(.*)-(?:([0-9]+)|([a-z0-9]+)-([a-z0-9]+))"
              )
            )
          )