Skip to content

Commit

Permalink
Remove alert and runbook for bucket scanning
Browse files Browse the repository at this point in the history
  • Loading branch information
leizor committed Nov 30, 2023
1 parent d746ef5 commit 91c93ef
Show file tree
Hide file tree
Showing 5 changed files with 0 additions and 63 deletions.
8 changes: 0 additions & 8 deletions docs/sources/mimir/manage/mimir-runbooks/_index.md
Original file line number Diff line number Diff line change
Expand Up @@ -522,14 +522,6 @@ How to **fix** it:
- Set the shard size of one or more tenants to `0`; this will shard the given tenant's rule groups across all rulers.
- Decrease the total number of ruler replicas by the number of idle replicas.

### MimirQuerierHasNotScanTheBucket

This alert fires when a Mimir querier is not successfully scanning blocks in the storage (bucket). A querier is expected to periodically iterate the bucket to find new and deleted blocks (defaults to every 5m), and if it has not successfully scanned the bucket for a long time, it may end up querying only a subset of blocks, thus leading to potentially partial results.

How to **investigate**:

- Look for any scan errors in the querier logs (e.g. networking or rate-limiting issues).

### MimirStoreGatewayHasNotSyncTheBucket

This alert fires when a Mimir store-gateway is not successfully scanning blocks in the storage (bucket). A store-gateway is expected to periodically iterate the bucket to find new and deleted blocks (defaults to every 5m) and if it's not successfully synching the bucket for a long time, it may end up querying only a subset of blocks, thus leading to potentially partial results.
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -772,19 +772,6 @@ spec:
for: 3m
labels:
severity: critical
- alert: MimirQuerierHasNotScanTheBucket
annotations:
message: Mimir Querier {{ $labels.pod }} in {{ $labels.cluster }}/{{ $labels.namespace
}} has not successfully scanned the bucket since {{ $value | humanizeDuration
}}.
runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimirquerierhasnotscanthebucket
expr: |
(time() - cortex_querier_blocks_last_successful_scan_timestamp_seconds > 60 * 30)
and
cortex_querier_blocks_last_successful_scan_timestamp_seconds > 0
for: 5m
labels:
severity: critical
- alert: MimirStoreGatewayHasNotSyncTheBucket
annotations:
message: Mimir store-gateway {{ $labels.pod }} in {{ $labels.cluster }}/{{ $labels.namespace
Expand Down
13 changes: 0 additions & 13 deletions operations/mimir-mixin-compiled-baremetal/alerts.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -746,19 +746,6 @@ groups:
for: 3m
labels:
severity: critical
- alert: MimirQuerierHasNotScanTheBucket
annotations:
message: Mimir Querier {{ $labels.instance }} in {{ $labels.cluster }}/{{ $labels.namespace
}} has not successfully scanned the bucket since {{ $value | humanizeDuration
}}.
runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimirquerierhasnotscanthebucket
expr: |
(time() - cortex_querier_blocks_last_successful_scan_timestamp_seconds > 60 * 30)
and
cortex_querier_blocks_last_successful_scan_timestamp_seconds > 0
for: 5m
labels:
severity: critical
- alert: MimirStoreGatewayHasNotSyncTheBucket
annotations:
message: Mimir store-gateway {{ $labels.instance }} in {{ $labels.cluster }}/{{
Expand Down
13 changes: 0 additions & 13 deletions operations/mimir-mixin-compiled/alerts.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -760,19 +760,6 @@ groups:
for: 3m
labels:
severity: critical
- alert: MimirQuerierHasNotScanTheBucket
annotations:
message: Mimir Querier {{ $labels.pod }} in {{ $labels.cluster }}/{{ $labels.namespace
}} has not successfully scanned the bucket since {{ $value | humanizeDuration
}}.
runbook_url: https://grafana.com/docs/mimir/latest/operators-guide/mimir-runbooks/#mimirquerierhasnotscanthebucket
expr: |
(time() - cortex_querier_blocks_last_successful_scan_timestamp_seconds > 60 * 30)
and
cortex_querier_blocks_last_successful_scan_timestamp_seconds > 0
for: 5m
labels:
severity: critical
- alert: MimirStoreGatewayHasNotSyncTheBucket
annotations:
message: Mimir store-gateway {{ $labels.pod }} in {{ $labels.cluster }}/{{ $labels.namespace
Expand Down
16 changes: 0 additions & 16 deletions operations/mimir-mixin/alerts/blocks.libsonnet
Original file line number Diff line number Diff line change
Expand Up @@ -183,22 +183,6 @@
message: '%(product)s Ingester %(alert_instance_variable)s in %(alert_aggregation_variables)s is failing to write to TSDB WAL.' % $._config,
},
},
{
// Alert if the querier is not successfully scanning the bucket.
alert: $.alertName('QuerierHasNotScanTheBucket'),
'for': '5m',
expr: |||
(time() - cortex_querier_blocks_last_successful_scan_timestamp_seconds > 60 * 30)
and
cortex_querier_blocks_last_successful_scan_timestamp_seconds > 0
|||,
labels: {
severity: 'critical',
},
annotations: {
message: '%(product)s Querier %(alert_instance_variable)s in %(alert_aggregation_variables)s has not successfully scanned the bucket since {{ $value | humanizeDuration }}.' % $._config,
},
},
{
// Alert if the store-gateway is not successfully synching the bucket.
alert: $.alertName('StoreGatewayHasNotSyncTheBucket'),
Expand Down

0 comments on commit 91c93ef

Please sign in to comment.