From 2175c43e3c622c52dfd3e9a3a141758aa40378ba Mon Sep 17 00:00:00 2001 From: JuArce <52429267+JuArce@users.noreply.github.com> Date: Wed, 17 Dec 2025 15:42:18 -0300 Subject: [PATCH 1/2] infra(prometheus): update rules to support multiple batchers and aggregators --- infra/ansible/playbooks/files/prometheus/rules.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/infra/ansible/playbooks/files/prometheus/rules.yml b/infra/ansible/playbooks/files/prometheus/rules.yml index 2a44b4a122..4aea4077df 100644 --- a/infra/ansible/playbooks/files/prometheus/rules.yml +++ b/infra/ansible/playbooks/files/prometheus/rules.yml @@ -17,7 +17,7 @@ groups: - alert: TaskDifferenceAggregatorBatcher # Condition for alerting - expr: floor(increase(aligned_aggregator_received_tasks{job="aligned-aggregator"}[15m])) - on() floor(increase(sent_batches{job="aligned-batcher"}[15m])) > 1 + expr: floor(max(increase(aligned_aggregator_received_tasks{job="aligned-aggregator"}[15m]))) - on() floor(max(increase(sent_batches{job="aligned-batcher"}[15m]))) > 1 for: 30s # Annotation - additional informational labels to store more information annotations: @@ -30,7 +30,7 @@ groups: - alert: TaskDifferenceAggregator # Condition for alerting - expr: floor(increase(aligned_aggregator_received_tasks{job="aligned-aggregator"}[15m])) - floor(increase(aligned_aggregated_responses{job="aligned-aggregator"}[15m])) > 1 + expr: floor(max(increase(aligned_aggregator_received_tasks{job="aligned-aggregator"}[15m]))) - floor(max(increase(aligned_aggregated_responses{job="aligned-aggregator"}[15m]))) > 1 for: 30s # Annotation - additional informational labels to store more information annotations: From b2e6fe3223a3688d5d64bc86cc5b05ccc80c3224 Mon Sep 17 00:00:00 2001 From: JuArce <52429267+JuArce@users.noreply.github.com> Date: Wed, 17 Dec 2025 15:53:54 -0300 Subject: [PATCH 2/2] infra(prometheus): update rules to support multiple batchers and aggregators --- infra/ansible/playbooks/files/prometheus/rules.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/infra/ansible/playbooks/files/prometheus/rules.yml b/infra/ansible/playbooks/files/prometheus/rules.yml index 4aea4077df..3c65592a15 100644 --- a/infra/ansible/playbooks/files/prometheus/rules.yml +++ b/infra/ansible/playbooks/files/prometheus/rules.yml @@ -17,7 +17,7 @@ groups: - alert: TaskDifferenceAggregatorBatcher # Condition for alerting - expr: floor(max(increase(aligned_aggregator_received_tasks{job="aligned-aggregator"}[15m]))) - on() floor(max(increase(sent_batches{job="aligned-batcher"}[15m]))) > 1 + expr: floor(max(increase(aligned_aggregator_received_tasks{job="aligned-aggregator"}[15m]))) - on() floor(sum(increase(sent_batches{job="aligned-batcher"}[15m]))) > 1 for: 30s # Annotation - additional informational labels to store more information annotations: @@ -30,7 +30,7 @@ groups: - alert: TaskDifferenceAggregator # Condition for alerting - expr: floor(max(increase(aligned_aggregator_received_tasks{job="aligned-aggregator"}[15m]))) - floor(max(increase(aligned_aggregated_responses{job="aligned-aggregator"}[15m]))) > 1 + expr: floor(max(increase(aligned_aggregator_received_tasks{job="aligned-aggregator"}[15m]))) - floor(sum(increase(aligned_aggregated_responses{job="aligned-aggregator"}[15m]))) > 1 for: 30s # Annotation - additional informational labels to store more information annotations: