Skip to content
Merged
Changes from all commits
Commits
Show all changes
24 commits
Select commit Hold shift + click to select a range
203d1ec
[LTBE-16] added alerts and variables
DanieleRanaldo Oct 9, 2025
bb70b7c
[LTBE-16] removed space
DanieleRanaldo Oct 9, 2025
0f604da
Merge remote-tracking branch 'origin/main' into LTBE-16-creazione-all…
and-mora Oct 9, 2025
78c460c
[LTBE-16] added condition
DanieleRanaldo Oct 9, 2025
673eccf
Merge remote-tracking branch 'origin/main' into LTBE-16-creazione-all…
and-mora Oct 9, 2025
7c0e672
[LTBE-16] added monitor_resource_group_name env
DanieleRanaldo Oct 9, 2025
220f037
[LTBE-16] added condition on alert group and fix env
DanieleRanaldo Oct 9, 2025
86e2db2
[LTBE-16] added condition uat env on count
DanieleRanaldo Oct 9, 2025
12a4f55
Merge remote-tracking branch 'origin/main' into LTBE-16-creazione-all…
and-mora Oct 9, 2025
0e7708f
[LTBE-16] added locals
DanieleRanaldo Oct 10, 2025
e8d033c
precommit
and-mora Oct 10, 2025
7e46001
[LTBE-16] fix requested changes
DanieleRanaldo Oct 10, 2025
f3dfef5
[LTBE-16] fix requested changes
DanieleRanaldo Oct 10, 2025
6c99bf9
[LTBE-16] fix requested changes
DanieleRanaldo Oct 10, 2025
3092ec4
[LTBE-16] fix requested changes
DanieleRanaldo Oct 10, 2025
7ded128
[LTBE-16] fix precommit
DanieleRanaldo Oct 10, 2025
95fc998
[LTBE-16] fix alert
DanieleRanaldo Oct 14, 2025
9f706eb
[LTBE-16] removed kafka alerts
DanieleRanaldo Oct 16, 2025
ec6eed6
Merge branch 'main' into LTBE-16-creazione-allarmi
DanieleRanaldo Oct 16, 2025
4b0696e
pre-commit
and-mora Oct 16, 2025
618f2ea
[LTBE-16] fix
DanieleRanaldo Oct 16, 2025
5ca99cb
restore file
and-mora Oct 16, 2025
a1e0309
Merge remote-tracking branch 'origin/main' into LTBE-16-creazione-all…
and-mora Oct 16, 2025
ccd7d96
restore file
and-mora Oct 16, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
80 changes: 4 additions & 76 deletions src/70_domains/idpay_common/12_alerts.tf
Original file line number Diff line number Diff line change
@@ -1,3 +1,7 @@
# =============================================================
# Alert API EIE
# =============================================================

# =============================================================
# Portal Consent – post (5xx, 401, 429 errors over 5 minutes)
# =============================================================
Expand Down Expand Up @@ -649,82 +653,6 @@ QUERY
}
}

# =======================================================
# Kafka Consumer - Absent Consumer Alert (5 min)
# =======================================================
resource "azurerm_monitor_scheduled_query_rules_alert" "pari_kafka_consumer_absent_alert" {
  # Created only when env_short is "p" or "u"; no instance exists otherwise.
  count = contains(["p", "u"], var.env_short) ? 1 : 0

  # --- Identity and placement ---
  name                = "pari-kafka-consumer-absent-alert"
  location            = var.location
  resource_group_name = local.monitor_rg
  data_source_id      = azurerm_log_analytics_workspace.log_analytics_workspace.id

  # --- Alert metadata ---
  enabled     = true
  severity    = 1
  description = "Kafka consumer 'idpay-asset-register-consumer-group' has not reported its lag metric for the last 5 minutes."

  # --- Evaluation schedule (frequency and window are both 5) ---
  frequency   = 5
  time_window = 5

  # Selects AppMetrics rows for the consumer lag metric whose Properties
  # mention the consumer group. The query does not aggregate: the trigger
  # below is evaluated against what this query returns.
  query = <<QUERY
AppMetrics
| where TimeGenerated > ago(5m)
| where Name == "kafka_consumer_fetch_manager_records_lag_max"
| where Properties has "idpay-asset-register-consumer-group"
QUERY

  # Threshold 0 with "Equal": the alert condition is met when the query
  # yields nothing, i.e. the metric is absent.
  trigger {
    threshold = 0
    operator  = "Equal"
  }

  # Notifies the first instance of the e-mail action group.
  action {
    email_subject          = "[PARI][HIGH] Kafka Consumer Absent: idpay-asset-register-consumer-group"
    action_group           = [azurerm_monitor_action_group.email[0].id]
    custom_webhook_payload = "{}"
  }
}

# =======================================================
# Kafka Consumer - Average Lag Alert (10 min)
# =======================================================
resource "azurerm_monitor_scheduled_query_rules_alert" "pari_kafka_consumer_avg_lag_alert" {
  # Created only when env_short is "p" or "u"; no instance exists otherwise.
  count = contains(["p", "u"], var.env_short) ? 1 : 0

  # --- Identity and placement ---
  name                = "pari-kafka-consumer-avg-lag-alert"
  location            = var.location
  resource_group_name = local.monitor_rg
  data_source_id      = azurerm_log_analytics_workspace.log_analytics_workspace.id

  # --- Alert metadata ---
  enabled     = true
  severity    = 1
  description = "Kafka consumer average lag is greater than 15 over the last 10 minutes. Based on the 'kafka_consumer_fetch_manager_records_lag_max' metric."

  # --- Evaluation schedule (frequency 5, window 10) ---
  frequency   = 5
  time_window = 10

  # Averages the lag metric for the consumer group and keeps the single
  # summary row only when that average exceeds 15; otherwise the query
  # returns no rows.
  query = <<QUERY
AppMetrics
| where TimeGenerated > ago(10m)
| where Name == "kafka_consumer_fetch_manager_records_lag_max"
| where Properties has "idpay-asset-register-consumer-group"
| summarize AvgLag = avg(Value)
| where AvgLag > 15
QUERY

  # The lag threshold itself lives in the query; here any returned row
  # (>= 1) satisfies the alert condition.
  trigger {
    threshold = 1
    operator  = "GreaterThanOrEqual"
  }

  # Notifies the first instance of the e-mail action group.
  action {
    email_subject          = "[PARI][HIGH] Kafka Consumer Lag Alert"
    action_group           = [azurerm_monitor_action_group.email[0].id]
    custom_webhook_payload = "{}"
  }
}

# =======================================================
# Internal dependency – E-mail service
# =======================================================
Expand Down