Skip to content

Commit

Permalink
Add alert for cloud-sql-proxy connection failures
Browse files Browse the repository at this point in the history
Add an alert to report on connection errors coming from the
cloud-sql-proxy sidecars in the trillian and rekor deployments. This
should detect when the proxy service account user has lost its
permissions to access the sql instance.

Signed-off-by: Colleen Murphy <[email protected]>
  • Loading branch information
cmurphy committed Jul 2, 2024
1 parent 41a7bd0 commit dac9b11
Showing 1 changed file with 47 additions and 1 deletion.
48 changes: 47 additions & 1 deletion terraform/gcp/modules/monitoring/infra/alerts.tf
Original file line number Diff line number Diff line change
Expand Up @@ -275,6 +275,52 @@ resource "google_monitoring_alert_policy" "cloud_sql_disk_utilization" {
}


### Cloud SQL Proxy Alerts

# Cloud SQL Proxy Connection Failures
# Alert policy that fires when the cloud-sql-proxy sidecars report failed
# dial attempts to the Cloud SQL instance, based on the Prometheus counter
# cloudsqlconn_dial_failure_count.
resource "google_monitoring_alert_policy" "cloudsqlconn_connection_failure" {
  # In the absence of data, incident will auto-close in 7 days
  alert_strategy {
    auto_close = "604800s"
  }

  combiner = "OR"

  # Connection failures are greater than 0
  conditions {
    condition_threshold {
      # Convert the cumulative failure counter into a per-second rate,
      # evaluated over 60-second windows.
      aggregations {
        alignment_period   = "60s"
        per_series_aligner = "ALIGN_RATE"
      }

      # The failure rate must stay above zero for 5 minutes before the
      # condition is considered violated.
      comparison      = "COMPARISON_GT"
      duration        = "300s"
      filter          = "metric.type=\"prometheus.googleapis.com/cloudsqlconn_dial_failure_count/counter\" resource.type=\"prometheus_target\""
      threshold_value = "0"

      # The trigger block belongs to condition_threshold (it is not a valid
      # child of conditions). A single violating time series is enough.
      trigger {
        count   = "1"
        percent = "0"
      }
    }

    display_name = "Cloud SQL Proxy connections failing"
  }

  display_name = "Cloud SQL Proxy connections failing"

  documentation {
    content   = "Cloud SQL Proxy connections have been failing for at least 5 minutes.\n"
    mime_type = "text/markdown"
  }

  enabled               = "true"
  notification_channels = local.notification_channels
  project               = var.project_id
}


### KMS Alerts

resource "google_monitoring_alert_policy" "kms_read_request_alert" {
Expand Down Expand Up @@ -352,7 +398,7 @@ resource "google_monitoring_alert_policy" "kms_crypto_request_alert" {
threshold_value = "1000"

trigger {
count = "1"
count = "0"
percent = "0"
}
}
Expand Down

0 comments on commit dac9b11

Please sign in to comment.