diff --git a/cloud/azure/README.md b/cloud/azure/README.md index 3e65051..5ba5600 100644 --- a/cloud/azure/README.md +++ b/cloud/azure/README.md @@ -31,143 +31,194 @@ Inputs | Name | Description | Type | Default | Required | |------|-------------|:----:|:-----:|:-----:| +| apimanagement_failed_requests_message | Custom message for API Management failed requests monitor | string | `` | no | | apimanagement_failed_requests_silenced | Groups to mute for API Management failed requests monitor | map | `` | no | | apimanagement_failed_requests_threshold_critical | Maximum acceptable percent of failed requests | string | `90` | no | | apimanagement_failed_requests_threshold_warning | Warning regarding acceptable percent of failed requests | string | `50` | no | +| apimanagement_other_requests_message | Custom message for API Management other requests monitor | string | `` | no | | apimanagement_other_requests_silenced | Groups to mute for API Management other requests monitor | map | `` | no | | apimanagement_other_requests_threshold_critical | Maximum acceptable percent of other requests | string | `90` | no | | apimanagement_other_requests_threshold_warning | Warning regarding acceptable percent of other requests | string | `50` | no | +| apimanagement_status_message | Custom message for API Management status monitor | string | `` | no | | apimanagement_status_silenced | Groups to mute for API Management status monitor | map | `` | no | +| apimanagement_successful_requests_message | Custom message for API Management successful requests monitor | string | `` | no | | apimanagement_successful_requests_silenced | Groups to mute for API Management successful requests monitor | map | `` | no | | apimanagement_successful_requests_threshold_critical | Minimum acceptable percent of successful requests | string | `10` | no | | apimanagement_successful_requests_threshold_warning | Warning regarding acceptable percent of successful requests | string | `30` | no | +| 
apimanagement_unauthorized_requests_message | Custom message for API Management unauthorized requests monitor | string | `` | no | | apimanagement_unauthorized_requests_silenced | Groups to mute for API Management unauthorized requests monitor | map | `` | no | | apimanagement_unauthorized_requests_threshold_critical | Maximum acceptable percent of unauthorized requests | string | `90` | no | | apimanagement_unauthorized_requests_threshold_warning | Warning regarding acceptable percent of unauthorized requests | string | `50` | no | +| appservices_http_4xx_requests_message | Custom message for App Services 4xx requests monitor | string | `` | no | | appservices_http_4xx_requests_silenced | Groups to mute for App Services 4xx requests monitor | map | `` | no | | appservices_http_4xx_requests_threshold_critical | Maximum critical acceptable percent of 4xx errors | string | `90` | no | | appservices_http_4xx_requests_threshold_warning | Warning regarding acceptable percent of 4xx errors | string | `50` | no | +| appservices_http_5xx_requests_message | Custom message for App Services 5xx requests monitor | string | `` | no | | appservices_http_5xx_requests_silenced | Groups to mute for App Services 5xx requests monitor | map | `` | no | | appservices_http_5xx_requests_threshold_critical | Maximum critical acceptable percent of 5xx errors | string | `90` | no | | appservices_http_5xx_requests_threshold_warning | Warning regarding acceptable percent of 5xx errors | string | `50` | no | +| appservices_http_successful_requests_message | Custom message for App Services successful requests monitor | string | `` | no | | appservices_http_successful_requests_silenced | Groups to mute for App Services successful requests monitor | map | `` | no | | appservices_http_successful_requests_threshold_critical | Minimum critical acceptable percent of 2xx & 3xx requests | string | `10` | no | | appservices_http_successful_requests_threshold_warning | Warning regarding acceptable 
percent of 2xx & 3xx requests | string | `30` | no | +| appservices_memory_usage_message | Custom message for App Services memory usage monitor | string | `` | no | | appservices_memory_usage_silenced | Groups to mute for App Services memory usage monitor | map | `` | no | | appservices_memory_usage_threshold_critical | Alerting threshold in Mib | string | `1073741824` | no | | appservices_memory_usage_threshold_warning | Warning threshold in MiB | string | `536870912` | no | +| appservices_response_time_message | Custom message for App Services response time monitor | string | `` | no | | appservices_response_time_silenced | Groups to mute for App Services response time monitor | map | `` | no | | appservices_response_time_threshold_critical | Alerting threshold for response time in seconds | string | `10` | no | | appservices_response_time_threshold_warning | Warning threshold for response time in seconds | string | `5` | no | | delay | Delay in seconds for the metric evaluation | string | `600` | no | | environment | Architecture environment | string | - | yes | +| eventhub_errors_rate_message | Custom message for Event Hub errors monitor | string | `` | no | | eventhub_errors_rate_silenced | Groups to mute for Event Hub errors monitor | map | `` | no | | eventhub_errors_rate_thresold_critical | Errors ratio (percentage) to trigger the critical alert | string | `90` | no | | eventhub_errors_rate_thresold_warning | Errors ratio (percentage) to trigger a warning alert | string | `50` | no | +| eventhub_failed_requests_rate_message | Custom message for Event Hub failed requests monitor | string | `` | no | | eventhub_failed_requests_rate_silenced | Groups to mute for Event Hub failed requests monitor | map | `` | no | | eventhub_failed_requests_rate_thresold_critical | Failed requests ratio (percentage) to trigger the critical alert | string | `90` | no | | eventhub_failed_requests_rate_thresold_warning | Failed requests ratio (percentage) to trigger a warning 
alert | string | `50` | no | +| eventhub_status_message | Custom message for Event Hub status monitor | string | `` | no | | eventhub_status_silenced | Groups to mute for Event Hub status monitor | map | `` | no | | filter_tags_custom | Tags used for custom filtering when filter_tags_use_defaults is false | string | `*` | no | | filter_tags_use_defaults | Use default filter tags convention | string | `true` | no | +| iothub_dropped_d2c_telemetry_egress_message | Custom message for IoT Hub dropped d2c telemetry monitor | string | `` | no | | iothub_dropped_d2c_telemetry_egress_silenced | Groups to mute for IoT Hub dropped d2c telemetry monitor | map | `` | no | | iothub_dropped_d2c_telemetry_egress_threshold_critical | D2C Telemetry Dropped limit (critical threshold) | string | `1000` | no | | iothub_dropped_d2c_telemetry_egress_threshold_warning | D2C Telemetry Dropped limit (warning threshold) | string | `500` | no | +| iothub_failed_c2d_methods_rate_message | Custom message for IoT Hub failed c2d methods monitor | string | `` | no | | iothub_failed_c2d_methods_rate_silenced | Groups to mute for IoT Hub failed c2d methods monitor | map | `` | no | | iothub_failed_c2d_methods_rate_threshold_critical | C2D Methods Failed rate limit (critical threshold) | string | `90` | no | | iothub_failed_c2d_methods_rate_threshold_warning | C2D Methods Failed rate limit (warning threshold) | string | `50` | no | +| iothub_failed_c2d_twin_read_rate_message | Custom message for IoT Hub failed c2d twin read monitor | string | `` | no | | iothub_failed_c2d_twin_read_rate_silenced | Groups to mute for IoT Hub failed c2d twin read monitor | map | `` | no | | iothub_failed_c2d_twin_read_rate_threshold_critical | C2D Twin Read Failed rate limit (critical threshold) | string | `90` | no | | iothub_failed_c2d_twin_read_rate_threshold_warning | C2D Twin Read Failed rate limit (warning threshold) | string | `50` | no | +| iothub_failed_c2d_twin_update_rate_message | Custom message for IoT Hub 
failed c2d twin update monitor | string | `` | no | | iothub_failed_c2d_twin_update_rate_silenced | Groups to mute for IoT Hub failed c2d twin update monitor | map | `` | no | | iothub_failed_c2d_twin_update_rate_threshold_critical | C2D Twin Update Failed rate limit (critical threshold) | string | `90` | no | | iothub_failed_c2d_twin_update_rate_threshold_warning | C2D Twin Update Failed rate limit (warning threshold) | string | `50` | no | +| iothub_failed_d2c_twin_read_rate_message | Custom message for IoT Hub failed d2c twin read monitor | string | `` | no | | iothub_failed_d2c_twin_read_rate_silenced | Groups to mute for IoT Hub failed d2c twin read monitor | map | `` | no | | iothub_failed_d2c_twin_read_rate_threshold_critical | D2C Twin Read Failed rate limit (critical threshold) | string | `90` | no | | iothub_failed_d2c_twin_read_rate_threshold_warning | D2C Twin Read Failed rate limit (warning threshold) | string | `50` | no | +| iothub_failed_d2c_twin_update_rate_message | Custom message for IoT Hub failed d2c twin update monitor | string | `` | no | | iothub_failed_d2c_twin_update_rate_silenced | Groups to mute for IoT Hub failed d2c twin update monitor | map | `` | no | | iothub_failed_d2c_twin_update_rate_threshold_critical | D2C Twin Update Failed rate limit (critical threshold) | string | `90` | no | | iothub_failed_d2c_twin_update_rate_threshold_warning | D2C Twin Update Failed rate limit (warning threshold) | string | `50` | no | +| iothub_failed_jobs_rate_message | Custom message for IoT Hub failed jobs monitor | string | `` | no | | iothub_failed_jobs_rate_silenced | Groups to mute for IoT Hub failed jobs monitor | map | `` | no | | iothub_failed_jobs_rate_threshold_critical | Jobs Failed rate limit (critical threshold) | string | `90` | no | | iothub_failed_jobs_rate_threshold_warning | Jobs Failed rate limit (warning threshold) | string | `50` | no | +| iothub_failed_listjobs_rate_message | Custom message for IoT Hub failed list jobs monitor | 
string | `` | no | | iothub_failed_listjobs_rate_silenced | Groups to mute for IoT Hub failed list jobs monitor | map | `` | no | | iothub_failed_listjobs_rate_threshold_critical | ListJobs Failed rate limit (critical threshold) | string | `90` | no | | iothub_failed_listjobs_rate_threshold_warning | ListJobs Failed rate limit (warning threshold) | string | `50` | no | +| iothub_failed_queryjobs_rate_message | Custom message for IoT Hub failed query jobs monitor | string | `` | no | | iothub_failed_queryjobs_rate_silenced | Groups to mute for IoT Hub failed query jobs monitor | map | `` | no | | iothub_failed_queryjobs_rate_threshold_critical | QueryJobs Failed rate limit (critical threshold) | string | `90` | no | | iothub_failed_queryjobs_rate_threshold_warning | QueryJobs Failed rate limit (warning threshold) | string | `50` | no | +| iothub_fallback_d2c_telemetry_egress_message | Custom message for IoT Hub fallback d2c telemetry monitor | string | `` | no | | iothub_fallback_d2c_telemetry_egress_silenced | Groups to mute for IoT Hub fallback d2c telemetry monitor | map | `` | no | | iothub_fallback_d2c_telemetry_egress_threshold_critical | D2C Telemetry Fallback limit (critical threshold) | string | `1000` | no | | iothub_fallback_d2c_telemetry_egress_threshold_warning | D2C Telemetry Fallback limit (warning threshold) | string | `500` | no | +| iothub_invalid_d2c_telemetry_egress_message | Custom message for IoT Hub invalid d2c telemetry monitor | string | `` | no | | iothub_invalid_d2c_telemetry_egress_silenced | Groups to mute for IoT Hub invalid d2c telemetry monitor | map | `` | no | | iothub_invalid_d2c_telemetry_egress_threshold_critical | D2C Telemetry Invalid limit (critical threshold) | string | `1000` | no | | iothub_invalid_d2c_telemetry_egress_threshold_warning | D2C Telemetry Invalid limit (warning threshold) | string | `500` | no | +| iothub_orphaned_d2c_telemetry_egress_message | Custom message for IoT Hub orphaned d2c telemetry monitor | string 
| `` | no | | iothub_orphaned_d2c_telemetry_egress_silenced | Groups to mute for IoT Hub orphaned d2c telemetry monitor | map | `` | no | | iothub_orphaned_d2c_telemetry_egress_threshold_critical | D2C Telemetry Orphaned limit (critical threshold) | string | `1000` | no | | iothub_orphaned_d2c_telemetry_egress_threshold_warning | D2C Telemetry Orphaned limit (warning threshold) | string | `500` | no | +| iothub_status_message | Custom message for IoT Hub status monitor | string | `` | no | | iothub_status_silenced | Groups to mute for IoT Hub status monitor | map | `` | no | +| iothub_too_many_d2c_telemetry_ingress_nosent_message | Custom message for IoT Hub unsent d2c telemetry monitor | string | `` | no | | iothub_too_many_d2c_telemetry_ingress_nosent_silenced | Groups to mute for IoT Hub unsent d2c telemetry monitor | map | `` | no | -| iothub_total_devices_silenced | Groups to mute for IoT Hub total device monitor | map | `` | no | +| iothub_total_devices_message | Custom message for IoT Hub total devices monitor | string | `` | no | +| iothub_total_devices_silenced | Groups to mute for IoT Hub total devices monitor | map | `` | no | | message | Message sent when a monitor is triggered | string | - | yes | | non_taggable_filter_tags | Tags used for filtering for components without tag support | string | `*` | no | +| redis_evictedkeys_limit_message | Custom message for Redis evicted keys monitor | string | `` | no | | redis_evictedkeys_limit_silenced | Groups to mute for Redis evicted keys monitor | map | `` | no | | redis_evictedkeys_limit_threshold_critical | Evicted keys limit (critical threshold) | string | `100` | no | | redis_evictedkeys_limit_threshold_warning | Evicted keys limit (warning threshold) | string | `0` | no | +| redis_percent_processor_time_message | Custom message for Redis processor monitor | string | `` | no | | redis_percent_processor_time_silenced | Groups to mute for Redis processor monitor | map | `` | no | | 
redis_percent_processor_time_threshold_critical | Processor time percent (critical threshold) | string | `80` | no | | redis_percent_processor_time_threshold_warning | Processor time percent (warning threshold) | string | `60` | no | +| redis_server_load_rate_message | Custom message for Redis server load monitor | string | `` | no | | redis_server_load_rate_silenced | Groups to mute for Redis server load monitor | map | `` | no | | redis_server_load_rate_threshold_critical | Server CPU load rate (critical threshold) | string | `90` | no | | redis_server_load_rate_threshold_warning | Server CPU load rate (warning threshold) | string | `70` | no | +| redis_status_message | Custom message for Redis status monitor | string | `` | no | +| redis_status_silenced | Groups to mute for Redis status monitor | map | `` | no | +| sqldatabase_cpu_message | Custom message for SQL CPU monitor | string | `` | no | | sqldatabase_cpu_silenced | Groups to mute for SQL CPU monitor | map | `` | no | | sqldatabase_cpu_threshold_critical | CPU usage in percent (critical threshold) | string | `90` | no | | sqldatabase_cpu_threshold_warning | CPU usage in percent (warning threshold) | string | `80` | no | +| sqldatabase_deadlock_message | Custom message for SQL Deadlock monitor | string | `` | no | | sqldatabase_deadlock_silenced | Groups to mute for SQL Deadlock monitor | map | `` | no | | sqldatabase_deadlock_threshold_critical | Amount of Deadlocks (critical threshold) | string | `1` | no | +| sqldatabase_diskspace_message | Custom message for SQL disk space monitor | string | `` | no | | sqldatabase_diskspace_silenced | Groups to mute for SQL disk space monitor | map | `` | no | | sqldatabase_diskspace_threshold_critical | Disk space used in percent (critical threshold) | string | `90` | no | | sqldatabase_diskspace_threshold_warning | Disk space used in percent (warning threshold) | string | `80` | no | +| sqldatabase_dtu_message | Custom message for SQL DTU monitor | string | `` | no 
| | sqldatabase_dtu_silenced | Groups to mute for SQL DTU monitor | map | `` | no | | sqldatabase_dtu_threshold_critical | Amount of DTU used (critical threshold) | string | `90` | no | | sqldatabase_dtu_threshold_warning | Amount of DTU used (warning threshold) | string | `85` | no | +| storage_authorization_error_requests_message | Custom message for Storage authorization errors monitor | string | `` | no | | storage_authorization_error_requests_silenced | Groups to mute for Storage authorization errors monitor | map | `` | no | | storage_authorization_error_requests_threshold_critical | Maximum acceptable percent of authorization error requests for a storage | string | `90` | no | | storage_authorization_error_requests_threshold_warning | Warning regarding acceptable percent of authorization error requests for a storage | string | `50` | no | +| storage_availability_message | Custom message for Storage availability monitor | string | `` | no | | storage_availability_silenced | Groups to mute for Storage availability monitor | map | `` | no | | storage_availability_threshold_critical | Minimum acceptable percent of availability for a storage | string | `50` | no | | storage_availability_threshold_warning | Warning regarding acceptable percent of availability for a storage | string | `90` | no | +| storage_client_other_error_requests_message | Custom message for Storage other errors monitor | string | `` | no | | storage_client_other_error_requests_silenced | Groups to mute for Storage other errors monitor | map | `` | no | | storage_client_other_error_requests_threshold_critical | Maximum acceptable percent of client other error requests for a storage | string | `90` | no | | storage_client_other_error_requests_threshold_warning | Warning regarding acceptable percent of client other error requests for a storage | string | `50` | no | +| storage_latency_message | Custom message for Storage latency monitor | string | `` | no | | storage_latency_silenced | Groups to 
mute for Storage latency monitor | map | `` | no | | storage_latency_threshold_critical | Maximum acceptable end to end latency (ms) for a storage | string | `2000` | no | | storage_latency_threshold_warning | Warning regarding acceptable end to end latency (ms) for a storage | string | `1000` | no | +| storage_network_error_requests_message | Custom message for Storage network errors monitor | string | `` | no | | storage_network_error_requests_silenced | Groups to mute for Storage network errors monitor | map | `` | no | | storage_network_error_requests_threshold_critical | Maximum acceptable percent of network error requests for a storage | string | `90` | no | | storage_network_error_requests_threshold_warning | Warning regarding acceptable percent of network error requests for a storage | string | `50` | no | +| storage_server_other_error_requests_message | Custom message for Storage server other errors monitor | string | `` | no | | storage_server_other_error_requests_silenced | Groups to mute for Storage server other errors monitor | map | `` | no | | storage_server_other_error_requests_threshold_critical | Maximum acceptable percent of server other error requests for a storage | string | `90` | no | | storage_server_other_error_requests_threshold_warning | Warning regarding acceptable percent of server other error requests for a storage | string | `50` | no | +| storage_successful_requests_message | Custom message for Storage successful requests monitor | string | `` | no | | storage_successful_requests_silenced | Groups to mute for Storage sucessful requests monitor | map | `` | no | | storage_successful_requests_threshold_critical | Minimum acceptable percent of successful requests for a storage | string | `10` | no | | storage_successful_requests_threshold_warning | Warning regarding acceptable percent of successful requests for a storage | string | `30` | no | +| storage_throttling_error_requests_message | Custom message for Storage throttling error 
monitor | string | `` | no | | storage_throttling_error_requests_silenced | Groups to mute for Storage throttling error monitor | map | `` | no | | storage_throttling_error_requests_threshold_critical | Maximum acceptable percent of throttling error requests for a storage | string | `90` | no | | storage_throttling_error_requests_threshold_warning | Warning regarding acceptable percent of throttling error requests for a storage | string | `50` | no | +| storage_timeout_error_requests_message | Custom message for Storage timeout monitor | string | `` | no | | storage_timeout_error_requests_silenced | Groups to mute for Storage timeout monitor | map | `` | no | | storage_timeout_error_requests_threshold_critical | Maximum acceptable percent of timeout error requests for a storage | string | `90` | no | | storage_timeout_error_requests_threshold_warning | Warning regarding acceptable percent of timeout error requests for a storage | string | `50` | no | +| streamanalytics_conversion_errors_message | Custom message for Stream Analytics conversion errors monitor | string | `` | no | | streamanalytics_conversion_errors_silenced | Groups to mute for Stream Analytics conversion errors monitor | map | `` | no | | streamanalytics_conversion_errors_threshold_critical | Conversion errors limit (critical threshold) | string | `10` | no | | streamanalytics_conversion_errors_threshold_warning | Conversion errors limit (warning threshold) | string | `0` | no | +| streamanalytics_failed_function_requests_message | Custom message for Stream Analytics failed requests monitor | string | `` | no | | streamanalytics_failed_function_requests_silenced | Groups to mute for Stream Analytics failed requests monitor | map | `` | no | | streamanalytics_failed_function_requests_threshold_critical | Failed Function Request rate limit (critical threshold) | string | `10` | no | | streamanalytics_failed_function_requests_threshold_warning | Failed Function Request rate limit (warning threshold) | 
string | `0` | no | +| streamanalytics_runtime_errors_message | Custom message for Stream Analytics runtime errors monitor | string | `` | no | | streamanalytics_runtime_errors_silenced | Groups to mute for Stream Analytics runtime errors monitor | map | `` | no | | streamanalytics_runtime_errors_threshold_critical | Runtime errors limit (critical threshold) | string | `10` | no | | streamanalytics_runtime_errors_threshold_warning | Runtime errors limit (warning threshold) | string | `0` | no | +| streamanalytics_status_message | Custom message for Stream Analytics status monitor | string | `` | no | | streamanalytics_status_silenced | Groups to mute for Stream Analytics status monitor | map | `` | no | +| streamanalytics_su_utilization_message | Custom message for Stream Analytics utilization monitor | string | `` | no | | streamanalytics_su_utilization_silenced | Groups to mute for Stream Analytics utilization monitor | map | `` | no | | streamanalytics_su_utilization_threshold_critical | Streaming Unit utilization rate limit (critical threshold) | string | `80` | no | | streamanalytics_su_utilization_threshold_warning | Streaming Unit utilization rate limit (warning threshold) | string | `60` | no | diff --git a/cloud/azure/apimanagement/README.md b/cloud/azure/apimanagement/README.md index 82de287..1fdf321 100644 --- a/cloud/azure/apimanagement/README.md +++ b/cloud/azure/apimanagement/README.md @@ -29,19 +29,24 @@ Inputs |------|-------------|:----:|:-----:|:-----:| | delay | Delay in seconds for the metric evaluation | string | `600` | no | | environment | Architecture environment | string | - | yes | +| failed_requests_message | Custom message for API Management failed requests monitor | string | `` | no | | failed_requests_silenced | Groups to mute for API Management failed requests monitor | map | `` | no | | failed_requests_threshold_critical | Maximum acceptable percent of failed requests | string | `90` | no | | failed_requests_threshold_warning | 
Warning regarding acceptable percent of failed requests | string | `50` | no | | filter_tags_custom | Tags used for custom filtering when filter_tags_use_defaults is false | string | `*` | no | | filter_tags_use_defaults | Use default filter tags convention | string | `true` | no | | message | Message sent when a Redis monitor is triggered | string | - | yes | +| other_requests_message | Custom message for API Management other requests monitor | string | `` | no | | other_requests_silenced | Groups to mute for API Management other requests monitor | map | `` | no | | other_requests_threshold_critical | Maximum acceptable percent of other requests | string | `90` | no | | other_requests_threshold_warning | Warning regarding acceptable percent of other requests | string | `50` | no | +| status_message | Custom message for API Management status monitor | string | `` | no | | status_silenced | Groups to mute for API Management status monitor | map | `` | no | +| successful_requests_message | Custom message for API Management successful requests monitor | string | `` | no | | successful_requests_silenced | Groups to mute for API Management successful requests monitor | map | `` | no | | successful_requests_threshold_critical | Minimum acceptable percent of successful requests | string | `10` | no | | successful_requests_threshold_warning | Warning regarding acceptable percent of successful requests | string | `30` | no | +| unauthorized_requests_message | Custom message for API Management unauthorized requests monitor | string | `` | no | | unauthorized_requests_silenced | Groups to mute for API Management unauthorized requests monitor | map | `` | no | | unauthorized_requests_threshold_critical | Maximum acceptable percent of unauthorized requests | string | `90` | no | | unauthorized_requests_threshold_warning | Warning regarding acceptable percent of unauthorized requests | string | `50` | no | diff --git a/cloud/azure/apimanagement/inputs.tf 
b/cloud/azure/apimanagement/inputs.tf index 74273b2..85d1b0a 100644 --- a/cloud/azure/apimanagement/inputs.tf +++ b/cloud/azure/apimanagement/inputs.tf @@ -31,12 +31,24 @@ variable "status_silenced" { default = {} } +variable "status_message" { + description = "Custom message for API Management status monitor" + type = "string" + default = "" +} + variable "failed_requests_silenced" { description = "Groups to mute for API Management failed requests monitor" type = "map" default = {} } +variable "failed_requests_message" { + description = "Custom message for API Management failed requests monitor" + type = "string" + default = "" +} + variable "failed_requests_threshold_critical" { description = "Maximum acceptable percent of failed requests" default = 90 @@ -53,6 +65,12 @@ variable "other_requests_silenced" { default = {} } +variable "other_requests_message" { + description = "Custom message for API Management other requests monitor" + type = "string" + default = "" +} + variable "other_requests_threshold_critical" { description = "Maximum acceptable percent of other requests" default = 90 @@ -69,6 +87,12 @@ variable "unauthorized_requests_silenced" { default = {} } +variable "unauthorized_requests_message" { + description = "Custom message for API Management unauthorized requests monitor" + type = "string" + default = "" +} + variable "unauthorized_requests_threshold_critical" { description = "Maximum acceptable percent of unauthorized requests" default = 90 @@ -85,6 +109,12 @@ variable "successful_requests_silenced" { default = {} } +variable "successful_requests_message" { + description = "Custom message for API Management successful requests monitor" + type = "string" + default = "" +} + variable "successful_requests_threshold_critical" { description = "Minimum acceptable percent of successful requests" default = 10 diff --git a/cloud/azure/apimanagement/monitors-azure-apimanagement.tf b/cloud/azure/apimanagement/monitors-azure-apimanagement.tf index 
5a17080..a8d81ca 100644 --- a/cloud/azure/apimanagement/monitors-azure-apimanagement.tf +++ b/cloud/azure/apimanagement/monitors-azure-apimanagement.tf @@ -10,7 +10,7 @@ data "template_file" "filter" { resource "datadog_monitor" "apimgt_status" { name = "[${var.environment}] API Management is down" - message = "${var.message}" + message = "${coalesce(var.status_message, var.message)}" query = <` | no | | http_4xx_requests_threshold_critical | Maximum critical acceptable percent of 4xx errors | string | `90` | no | | http_4xx_requests_threshold_warning | Warning regarding acceptable percent of 4xx errors | string | `50` | no | +| http_5xx_requests_message | Custom message for App Services 5xx requests monitor | string | `` | no | | http_5xx_requests_silenced | Groups to mute for App Services 5xx requests monitor | map | `` | no | | http_5xx_requests_threshold_critical | Maximum critical acceptable percent of 5xx errors | string | `90` | no | | http_5xx_requests_threshold_warning | Warning regarding acceptable percent of 5xx errors | string | `50` | no | +| http_successful_requests_message | Custom message for App Services successful requests monitor | string | `` | no | | http_successful_requests_silenced | Groups to mute for App Services successful requests monitor | map | `` | no | | http_successful_requests_threshold_critical | Minimum critical acceptable percent of 2xx & 3xx requests | string | `10` | no | | http_successful_requests_threshold_warning | Warning regarding acceptable percent of 2xx & 3xx requests | string | `30` | no | +| memory_usage_message | Custom message for App Services memory usage monitor | string | `` | no | | memory_usage_silenced | Groups to mute for App Services memory usage monitor | map | `` | no | | memory_usage_threshold_critical | Alerting threshold in Mib | string | `1073741824` | no | | memory_usage_threshold_warning | Warning threshold in MiB | string | `536870912` | no | | message | Message sent when a monitor is triggered | 
string | - | yes | +| response_time_message | Custom message for App Services response time monitor | string | `` | no | | response_time_silenced | Groups to mute for App Services response time monitor | map | `` | no | | response_time_threshold_critical | Alerting threshold for response time in seconds | string | `10` | no | | response_time_threshold_warning | Warning threshold for response time in seconds | string | `5` | no | diff --git a/cloud/azure/app-services/inputs.tf b/cloud/azure/app-services/inputs.tf index 8ed4216..25ca97c 100644 --- a/cloud/azure/app-services/inputs.tf +++ b/cloud/azure/app-services/inputs.tf @@ -22,12 +22,19 @@ variable "delay" { default = 600 } +# Azure App Services specific variables variable "response_time_silenced" { description = "Groups to mute for App Services response time monitor" type = "map" default = {} } +variable "response_time_message" { + description = "Custom message for App Services response time monitor" + type = "string" + default = "" +} + variable "response_time_threshold_critical" { default = 10 description = "Alerting threshold for response time in seconds" @@ -44,6 +51,12 @@ variable "memory_usage_silenced" { default = {} } +variable "memory_usage_message" { + description = "Custom message for App Services memory usage monitor" + type = "string" + default = "" +} + variable "memory_usage_threshold_critical" { default = 1073741824 # 1Gb description = "Alerting threshold in Mib" @@ -60,6 +73,12 @@ variable "http_4xx_requests_silenced" { default = {} } +variable "http_4xx_requests_message" { + description = "Custom message for App Services 4xx requests monitor" + type = "string" + default = "" +} + variable "http_4xx_requests_threshold_critical" { default = 90 description = "Maximum critical acceptable percent of 4xx errors" @@ -76,6 +95,12 @@ variable "http_5xx_requests_silenced" { default = {} } +variable "http_5xx_requests_message" { + description = "Custom message for App Services 5xx requests monitor" + type 
= "string" + default = "" +} + variable "http_5xx_requests_threshold_critical" { default = 90 description = "Maximum critical acceptable percent of 5xx errors" @@ -92,6 +117,12 @@ variable "http_successful_requests_silenced" { default = {} } +variable "http_successful_requests_message" { + description = "Custom message for App Services successful requests monitor" + type = "string" + default = "" +} + variable "http_successful_requests_threshold_critical" { default = 10 description = "Minimum critical acceptable percent of 2xx & 3xx requests" diff --git a/cloud/azure/app-services/monitors-app_services.tf b/cloud/azure/app-services/monitors-app_services.tf index 62a68a8..c501bdf 100644 --- a/cloud/azure/app-services/monitors-app_services.tf +++ b/cloud/azure/app-services/monitors-app_services.tf @@ -10,7 +10,7 @@ data "template_file" "filter" { resource "datadog_monitor" "appservices_response_time" { name = "[${var.environment}] App Services response time too high {{comparator}} {{#is_alert}}{{threshold}}s{{/is_alert}}{{#is_warning}}{{warn_threshold}}s{{/is_warning}} ({{value}}s)" type = "metric alert" - message = "${var.message}" + message = "${coalesce(var.response_time_message, var.message)}" query = <` | no | | errors_rate_thresold_critical | Errors ratio (percentage) to trigger the critical alert | string | `90` | no | | errors_rate_thresold_warning | Errors ratio (percentage) to trigger a warning alert | string | `50` | no | +| failed_requests_rate_message | Custom message for Event Hub failed requests monitor | string | `` | no | | failed_requests_rate_silenced | Groups to mute for Event Hub failed requests monitor | map | `` | no | | failed_requests_rate_thresold_critical | Failed requests ratio (percentage) to trigger the critical alert | string | `90` | no | | failed_requests_rate_thresold_warning | Failed requests ratio (percentage) to trigger a warning alert | string | `50` | no | | filter_tags_custom | Tags used for custom filtering when 
filter_tags_use_defaults is false | string | `*` | no | | filter_tags_use_defaults | Use default filter tags convention | string | `true` | no | | message | Message sent when an alert is triggered | string | - | yes | +| status_message | Custom message for Event Hub status monitor | string | `` | no | | status_silenced | Groups to mute for Event Hub status monitor | map | `` | no | Related documentation diff --git a/cloud/azure/eventhub/inputs.tf b/cloud/azure/eventhub/inputs.tf index 3d60a29..77180f0 100644 --- a/cloud/azure/eventhub/inputs.tf +++ b/cloud/azure/eventhub/inputs.tf @@ -24,18 +24,31 @@ variable "filter_tags_custom" { default = "*" } +# Azure Event Hub specific variables variable "status_silenced" { description = "Groups to mute for Event Hub status monitor" type = "map" default = {} } +variable "status_message" { + description = "Custom message for Event Hub status monitor" + type = "string" + default = "" +} + variable "failed_requests_rate_silenced" { description = "Groups to mute for Event Hub failed requests monitor" type = "map" default = {} } +variable "failed_requests_rate_message" { + description = "Custom message for Event Hub failed requests monitor" + type = "string" + default = "" +} + variable "failed_requests_rate_thresold_critical" { description = "Failed requests ratio (percentage) to trigger the critical alert" default = 90 @@ -52,6 +65,12 @@ variable "errors_rate_silenced" { default = {} } +variable "errors_rate_message" { + description = "Custom message for Event Hub errors monitor" + type = "string" + default = "" +} + variable "errors_rate_thresold_critical" { description = "Errors ratio (percentage) to trigger the critical alert" default = 90 diff --git a/cloud/azure/eventhub/monitors-eventhub.tf b/cloud/azure/eventhub/monitors-eventhub.tf index 0d93b95..c96d967 100644 --- a/cloud/azure/eventhub/monitors-eventhub.tf +++ b/cloud/azure/eventhub/monitors-eventhub.tf @@ -8,7 +8,7 @@ data "template_file" "filter" { resource 
"datadog_monitor" "eventhub_status" { name = "[${var.environment}] Event Hub is down" - message = "${var.message}" + message = "${coalesce(var.status_message, var.message)}" query = <` | no | | dropped_d2c_telemetry_egress_threshold_critical | D2C Telemetry Dropped limit (critical threshold) | string | `1000` | no | | dropped_d2c_telemetry_egress_threshold_warning | D2C Telemetry Dropped limit (warning threshold) | string | `500` | no | | environment | Architecture Environment | string | - | yes | +| failed_c2d_methods_rate_message | Custom message for IoT Hub failed c2d method monitor | string | `` | no | | failed_c2d_methods_rate_silenced | Groups to mute for IoT Hub failed c2d methods monitor | map | `` | no | | failed_c2d_methods_rate_threshold_critical | C2D Methods Failed rate limit (critical threshold) | string | `90` | no | | failed_c2d_methods_rate_threshold_warning | C2D Methods Failed rate limit (warning threshold) | string | `50` | no | +| failed_c2d_twin_read_rate_message | Custom message for IoT Hub failed c2d twin read monitor | string | `` | no | | failed_c2d_twin_read_rate_silenced | Groups to mute for IoT Hub failed c2d twin read monitor | map | `` | no | | failed_c2d_twin_read_rate_threshold_critical | C2D Twin Read Failed rate limit (critical threshold) | string | `90` | no | | failed_c2d_twin_read_rate_threshold_warning | C2D Twin Read Failed rate limit (warning threshold) | string | `50` | no | +| failed_c2d_twin_update_rate_message | Custom message for IoT Hub failed c2d twin update monitor | string | `` | no | | failed_c2d_twin_update_rate_silenced | Groups to mute for IoT Hub failed c2d twin update monitor | map | `` | no | | failed_c2d_twin_update_rate_threshold_critical | C2D Twin Update Failed rate limit (critical threshold) | string | `90` | no | | failed_c2d_twin_update_rate_threshold_warning | C2D Twin Update Failed rate limit (warning threshold) | string | `50` | no | +| failed_d2c_twin_read_rate_message | Custom message for IoT Hub 
failed d2c twin read monitor | string | `` | no | | failed_d2c_twin_read_rate_silenced | Groups to mute for IoT Hub failed d2c twin read monitor | map | `` | no | | failed_d2c_twin_read_rate_threshold_critical | D2C Twin Read Failed rate limit (critical threshold) | string | `90` | no | | failed_d2c_twin_read_rate_threshold_warning | D2C Twin Read Failed rate limit (warning threshold) | string | `50` | no | +| failed_d2c_twin_update_rate_message | Custom message for IoT Hub failed d2c twin update monitor | string | `` | no | | failed_d2c_twin_update_rate_silenced | Groups to mute for IoT Hub failed d2c twin update monitor | map | `` | no | | failed_d2c_twin_update_rate_threshold_critical | D2C Twin Update Failed rate limit (critical threshold) | string | `90` | no | | failed_d2c_twin_update_rate_threshold_warning | D2C Twin Update Failed rate limit (warning threshold) | string | `50` | no | +| failed_jobs_rate_message | Custom message for IoT Hub failed jobs monitor | string | `` | no | | failed_jobs_rate_silenced | Groups to mute for IoT Hub failed jobs monitor | map | `` | no | | failed_jobs_rate_threshold_critical | Jobs Failed rate limit (critical threshold) | string | `90` | no | | failed_jobs_rate_threshold_warning | Jobs Failed rate limit (warning threshold) | string | `50` | no | +| failed_listjobs_rate_message | Custom message for IoT Hub failed list jobs monitor | string | `` | no | | failed_listjobs_rate_silenced | Groups to mute for IoT Hub failed list jobs monitor | map | `` | no | | failed_listjobs_rate_threshold_critical | ListJobs Failed rate limit (critical threshold) | string | `90` | no | | failed_listjobs_rate_threshold_warning | ListJobs Failed rate limit (warning threshold) | string | `50` | no | +| failed_queryjobs_rate_message | Custom message for IoT Hub failed query jobs monitor | string | `` | no | | failed_queryjobs_rate_silenced | Groups to mute for IoT Hub failed query jobs monitor | map | `` | no | | 
failed_queryjobs_rate_threshold_critical | QueryJobs Failed rate limit (critical threshold) | string | `90` | no | | failed_queryjobs_rate_threshold_warning | QueryJobs Failed rate limit (warning threshold) | string | `50` | no | +| fallback_d2c_telemetry_egress_message | Custom message for IoT Hub fallback d2c telemetry monitor | string | `` | no | | fallback_d2c_telemetry_egress_silenced | Groups to mute for IoT Hub fallback d2c telemetry monitor | map | `` | no | | fallback_d2c_telemetry_egress_threshold_critical | D2C Telemetry Fallback limit (critical threshold) | string | `1000` | no | | fallback_d2c_telemetry_egress_threshold_warning | D2C Telemetry Fallback limit (warning threshold) | string | `500` | no | | filter_tags | Tags used for filtering | string | `*` | no | +| invalid_d2c_telemetry_egress_message | Custom message for IoT Hub invalid d2c telemetry monitor | string | `` | no | | invalid_d2c_telemetry_egress_silenced | Groups to mute for IoT Hub invalid d2c telemetry monitor | map | `` | no | | invalid_d2c_telemetry_egress_threshold_critical | D2C Telemetry Invalid limit (critical threshold) | string | `1000` | no | | invalid_d2c_telemetry_egress_threshold_warning | D2C Telemetry Invalid limit (warning threshold) | string | `500` | no | | message | Message sent when an alert is triggered | string | - | yes | +| orphaned_d2c_telemetry_egress_message | Custom message for IoT Hub orphaned d2c telemetry monitor | string | `` | no | | orphaned_d2c_telemetry_egress_silenced | Groups to mute for IoT Hub orphaned d2c telemetry monitor | map | `` | no | | orphaned_d2c_telemetry_egress_threshold_critical | D2C Telemetry Orphaned limit (critical threshold) | string | `1000` | no | | orphaned_d2c_telemetry_egress_threshold_warning | D2C Telemetry Orphaned limit (warning threshold) | string | `500` | no | +| status_message | Custom message for IoT Hub status monitor | string | `` | no | | status_silenced | Groups to mute for IoT Hub status monitor | map | `` | no 
| +| too_many_d2c_telemetry_ingress_nosent_message | Custom message for IoT Hub unsent d2c telemetry monitor | string | `` | no | | too_many_d2c_telemetry_ingress_nosent_silenced | Groups to mute for IoT Hub unsent d2c telemetry monitor | map | `` | no | -| total_devices_silenced | Groups to mute for IoT Hub total device monitor | map | `` | no | +| total_devices_message | Custom message for IoT Hub total devices monitor | string | `` | no | +| total_devices_silenced | Groups to mute for IoT Hub total devices monitor | map | `` | no | Related documentation --------------------- diff --git a/cloud/azure/iothubs/inputs.tf b/cloud/azure/iothubs/inputs.tf index 2eaaefc..2555636 100644 --- a/cloud/azure/iothubs/inputs.tf +++ b/cloud/azure/iothubs/inputs.tf @@ -19,31 +19,55 @@ variable "filter_tags" { default = "*" } -# Azure IOT hubs specific +# IOT Hub specific variables variable "status_silenced" { description = "Groups to mute for IoT Hub status monitor" type = "map" default = {} } +variable "status_message" { + description = "Custom message for IoT Hub status monitor" + type = "string" + default = "" +} + variable "total_devices_silenced" { - description = "Groups to mute for IoT Hub total device monitor" + description = "Groups to mute for IoT Hub total devices monitor" type = "map" default = {} } +variable "total_devices_message" { + description = "Custom message for IoT Hub total devices monitor" + type = "string" + default = "" +} + variable "too_many_d2c_telemetry_ingress_nosent_silenced" { description = "Groups to mute for IoT Hub unsent d2c telemetry monitor" type = "map" default = {} } +variable "too_many_d2c_telemetry_ingress_nosent_message" { + description = "Custom message for IoT Hub unsent d2c telemetry monitor" + type = "string" + default = "" +} + variable "failed_jobs_rate_silenced" { description = "Groups to mute for IoT Hub failed jobs monitor" type = "map" default = {} } +variable "failed_jobs_rate_message" { + description = "Custom message for 
IoT Hub failed jobs monitor" + type = "string" + default = "" +} + variable "failed_jobs_rate_threshold_warning" { description = "Jobs Failed rate limit (warning threshold)" default = 50 @@ -60,6 +84,12 @@ variable "failed_listjobs_rate_silenced" { default = {} } +variable "failed_listjobs_rate_message" { + description = "Custom message for IoT Hub failed list jobs monitor" + type = "string" + default = "" +} + variable "failed_listjobs_rate_threshold_warning" { description = "ListJobs Failed rate limit (warning threshold)" default = 50 @@ -76,6 +106,12 @@ variable "failed_queryjobs_rate_silenced" { default = {} } +variable "failed_queryjobs_rate_message" { + description = "Custom message for IoT Hub failed query jobs monitor" + type = "string" + default = "" +} + variable "failed_queryjobs_rate_threshold_warning" { description = "QueryJobs Failed rate limit (warning threshold)" default = 50 @@ -92,6 +128,12 @@ variable "failed_c2d_methods_rate_silenced" { default = {} } +variable "failed_c2d_methods_rate_message" { + description = "Custom message for IoT Hub failed c2d method monitor" + type = "string" + default = "" +} + variable "failed_c2d_methods_rate_threshold_warning" { description = "C2D Methods Failed rate limit (warning threshold)" default = 50 @@ -108,6 +150,12 @@ variable "failed_c2d_twin_read_rate_silenced" { default = {} } +variable "failed_c2d_twin_read_rate_message" { + description = "Custom message for IoT Hub failed c2d twin read monitor" + type = "string" + default = "" +} + variable "failed_c2d_twin_read_rate_threshold_warning" { description = "C2D Twin Read Failed rate limit (warning threshold)" default = 50 @@ -124,6 +172,12 @@ variable "failed_c2d_twin_update_rate_silenced" { default = {} } +variable "failed_c2d_twin_update_rate_message" { + description = "Custom message for IoT Hub failed c2d twin update monitor" + type = "string" + default = "" +} + variable "failed_c2d_twin_update_rate_threshold_warning" { description = "C2D Twin Update 
Failed rate limit (warning threshold)" default = 50 @@ -140,6 +194,12 @@ variable "failed_d2c_twin_read_rate_silenced" { default = {} } +variable "failed_d2c_twin_read_rate_message" { + description = "Custom message for IoT Hub failed d2c twin read monitor" + type = "string" + default = "" +} + variable "failed_d2c_twin_read_rate_threshold_warning" { description = "D2C Twin Read Failed rate limit (warning threshold)" default = 50 @@ -156,6 +216,12 @@ variable "failed_d2c_twin_update_rate_silenced" { default = {} } +variable "failed_d2c_twin_update_rate_message" { + description = "Custom message for IoT Hub failed d2c twin update monitor" + type = "string" + default = "" +} + variable "failed_d2c_twin_update_rate_threshold_warning" { description = "D2C Twin Update Failed rate limit (warning threshold)" default = 50 @@ -172,6 +238,12 @@ variable "dropped_d2c_telemetry_egress_silenced" { default = {} } +variable "dropped_d2c_telemetry_egress_message" { + description = "Custom message for IoT Hub dropped d2c telemetry monitor" + type = "string" + default = "" +} + variable "dropped_d2c_telemetry_egress_threshold_warning" { description = "D2C Telemetry Dropped limit (warning threshold)" default = 500 @@ -188,6 +260,12 @@ variable "orphaned_d2c_telemetry_egress_silenced" { default = {} } +variable "orphaned_d2c_telemetry_egress_message" { + description = "Custom message for IoT Hub orphaned d2c telemetry monitor" + type = "string" + default = "" +} + variable "orphaned_d2c_telemetry_egress_threshold_warning" { description = "D2C Telemetry Orphaned limit (warning threshold)" default = 500 @@ -204,6 +282,12 @@ variable "invalid_d2c_telemetry_egress_silenced" { default = {} } +variable "invalid_d2c_telemetry_egress_message" { + description = "Custom message for IoT Hub invalid d2c telemetry monitor" + type = "string" + default = "" +} + variable "invalid_d2c_telemetry_egress_threshold_warning" { description = "D2C Telemetry Invalid limit (warning threshold)" default = 500 
@@ -220,6 +304,12 @@ variable "fallback_d2c_telemetry_egress_silenced" { default = {} } +variable "fallback_d2c_telemetry_egress_message" { + description = "Custom message for IoT Hub fallback d2c telemetry monitor" + type = "string" + default = "" +} + variable "fallback_d2c_telemetry_egress_threshold_warning" { description = "D2C Telemetry Fallback limit (warning threshold)" default = 500 diff --git a/cloud/azure/iothubs/monitors-iothubs.tf b/cloud/azure/iothubs/monitors-iothubs.tf index 35cc12b..006556d 100644 --- a/cloud/azure/iothubs/monitors-iothubs.tf +++ b/cloud/azure/iothubs/monitors-iothubs.tf @@ -1,6 +1,6 @@ resource "datadog_monitor" "too_many_jobs_failed" { name = "[${var.environment}] IOT Hub Too many jobs failed {{comparator}} {{#is_alert}}{{threshold}}%{{/is_alert}}{{#is_warning}}{{warn_threshold}}%{{/is_warning}} ({{value}}%)" - message = "${var.message}" + message = "${coalesce(var.failed_jobs_rate_message, var.message)}" query = <` | no | | evictedkeys_limit_threshold_critical | Evicted keys limit (critical threshold) | string | `100` | no | | evictedkeys_limit_threshold_warning | Evicted keys limit (warning threshold) | string | `0` | no | | filter_tags_custom | Tags used for custom filtering when filter_tags_use_defaults is false | string | `*` | no | | filter_tags_use_defaults | Use default filter tags convention | string | `true` | no | | message | Message sent when a Redis monitor is triggered | string | - | yes | +| percent_processor_time_message | Custom message for Redis processor monitor | string | `` | no | | percent_processor_time_silenced | Groups to mute for Redis processor monitor | map | `` | no | | percent_processor_time_threshold_critical | Processor time percent (critical threshold) | string | `80` | no | | percent_processor_time_threshold_warning | Processor time percent (warning threshold) | string | `60` | no | +| server_load_rate_message | Custom message for Redis server load monitor | string | `` | no | | 
server_load_rate_silenced | Groups to mute for Redis server load monitor | map | `` | no | | server_load_rate_threshold_critical | Server CPU load rate (critical threshold) | string | `90` | no | | server_load_rate_threshold_warning | Server CPU load rate (warning threshold) | string | `70` | no | +| status_message | Custom message for Redis status monitor | string | `` | no | +| status_silenced | Groups to mute for Redis status monitor | map | `` | no | Related documentation --------------------- diff --git a/cloud/azure/redis/inputs.tf b/cloud/azure/redis/inputs.tf index 79a8592..bf637f5 100644 --- a/cloud/azure/redis/inputs.tf +++ b/cloud/azure/redis/inputs.tf @@ -24,19 +24,31 @@ variable "filter_tags_custom" { default = "*" } -# Azure Redis specific +# Azure Redis specific variables variable "status_silenced" { description = "Groups to mute for Redis status monitor" type = "map" default = {} } +variable "status_message" { + description = "Custom message for Redis status monitor" + type = "string" + default = "" +} + variable "evictedkeys_limit_silenced" { description = "Groups to mute for Redis evicted keys monitor" type = "map" default = {} } +variable "evictedkeys_limit_message" { + description = "Custom message for Redis evicted keys monitor" + type = "string" + default = "" +} + variable "evictedkeys_limit_threshold_warning" { description = "Evicted keys limit (warning threshold)" default = 0 @@ -53,6 +65,12 @@ variable "percent_processor_time_silenced" { default = {} } +variable "percent_processor_time_message" { + description = "Custom message for Redis processor monitor" + type = "string" + default = "" +} + variable "percent_processor_time_threshold_critical" { description = "Processor time percent (critical threshold)" default = 80 @@ -69,6 +87,12 @@ variable "server_load_rate_silenced" { default = {} } +variable "server_load_rate_message" { + description = "Custom message for Redis server load monitor" + type = "string" + default = "" +} + variable 
"server_load_rate_threshold_critical" { description = "Server CPU load rate (critical threshold)" default = 90 diff --git a/cloud/azure/redis/monitors-azure-redis.tf b/cloud/azure/redis/monitors-azure-redis.tf index 7b9ad62..b71ede9 100644 --- a/cloud/azure/redis/monitors-azure-redis.tf +++ b/cloud/azure/redis/monitors-azure-redis.tf @@ -8,7 +8,7 @@ data "template_file" "filter" { resource "datadog_monitor" "status" { name = "[${var.environment}] Redis {{name}} is down" - message = "${var.message}" + message = "${coalesce(var.status_message, var.message)}" query = <` | no | | cpu_threshold_critical | CPU usage in percent (critical threshold) | string | `90` | no | | cpu_threshold_warning | CPU usage in percent (warning threshold) | string | `80` | no | +| deadlock_message | Custom message for SQL Deadlock monitor | string | `` | no | | deadlock_silenced | Groups to mute for SQL Deadlock monitor | map | `` | no | | deadlock_threshold_critical | Amount of Deadlocks (critical threshold) | string | `1` | no | | delay | Delay in seconds for the metric evaluation | string | `600` | no | +| diskspace_message | Custom message for SQL disk space monitor | string | `` | no | | diskspace_silenced | Groups to mute for SQL disk space monitor | map | `` | no | | diskspace_threshold_critical | Disk space used in percent (critical threshold) | string | `90` | no | | diskspace_threshold_warning | Disk space used in percent (warning threshold) | string | `80` | no | +| dtu_message | Custom message for SQL DTU monitor | string | `` | no | | dtu_silenced | Groups to mute for SQL DTU monitor | map | `` | no | | dtu_threshold_critical | Amount of DTU used (critical threshold) | string | `90` | no | | dtu_threshold_warning | Amount of DTU used (warning threshold) | string | `85` | no | diff --git a/cloud/azure/sql-database/inputs.tf b/cloud/azure/sql-database/inputs.tf index 58be3d4..1d6d472 100644 --- a/cloud/azure/sql-database/inputs.tf +++ b/cloud/azure/sql-database/inputs.tf @@ 
-24,13 +24,19 @@ variable "filter_tags_custom" { default = "*" } -# Azure SQL Database specific +# Azure SQL Database specific variables variable "cpu_silenced" { description = "Groups to mute for SQL CPU monitor" type = "map" default = {} } +variable "cpu_message" { + description = "Custom message for SQL CPU monitor" + type = "string" + default = "" +} + variable "cpu_threshold_warning" { description = "CPU usage in percent (warning threshold)" default = "80" @@ -47,6 +53,12 @@ variable "diskspace_silenced" { default = {} } +variable "diskspace_message" { + description = "Custom message for SQL disk space monitor" + type = "string" + default = "" +} + variable "diskspace_threshold_warning" { description = "Disk space used in percent (warning threshold)" default = "80" @@ -63,6 +75,12 @@ variable "dtu_silenced" { default = {} } +variable "dtu_message" { + description = "Custom message for SQL DTU monitor" + type = "string" + default = "" +} + variable "dtu_threshold_warning" { description = "Amount of DTU used (warning threshold)" default = "85" @@ -79,6 +97,12 @@ variable "deadlock_silenced" { default = {} } +variable "deadlock_message" { + description = "Custom message for SQL Deadlock monitor" + type = "string" + default = "" +} + variable "deadlock_threshold_critical" { description = "Amount of Deadlocks (critical threshold)" default = "1" diff --git a/cloud/azure/sql-database/monitors-sql-database-basics.tf b/cloud/azure/sql-database/monitors-sql-database-basics.tf index 6df1cd3..76933aa 100644 --- a/cloud/azure/sql-database/monitors-sql-database-basics.tf +++ b/cloud/azure/sql-database/monitors-sql-database-basics.tf @@ -8,7 +8,7 @@ data "template_file" "filter" { resource "datadog_monitor" "sql-database_cpu_90_15min" { name = "[${var.environment}] SQL Database CPU too high {{comparator}} {{#is_alert}}{{threshold}}%{{/is_alert}}{{#is_warning}}{{warn_threshold}}%{{/is_warning}} ({{value}}%)" - message = "${var.message}" + message = 
"${coalesce(var.cpu_message, var.message)}" query = <` | no | | authorization_error_requests_threshold_critical | Maximum acceptable percent of authorization error requests for a storage | string | `90` | no | | authorization_error_requests_threshold_warning | Warning regarding acceptable percent of authorization error requests for a storage | string | `50` | no | +| availability_message | Custom message for Storage availability monitor | string | `` | no | | availability_silenced | Groups to mute for Storage availability monitor | map | `` | no | | availability_threshold_critical | Minimum acceptable percent of availability for a storage | string | `50` | no | | availability_threshold_warning | Warning regarding acceptable percent of availability for a storage | string | `90` | no | +| client_other_error_requests_message | Custom message for Storage other errors monitor | string | `` | no | | client_other_error_requests_silenced | Groups to mute for Storage other errors monitor | map | `` | no | | client_other_error_requests_threshold_critical | Maximum acceptable percent of client other error requests for a storage | string | `90` | no | | client_other_error_requests_threshold_warning | Warning regarding acceptable percent of client other error requests for a storage | string | `50` | no | @@ -45,22 +48,28 @@ Inputs | environment | Architecture environment | string | - | yes | | filter_tags_custom | Tags used for custom filtering when filter_tags_use_defaults is false | string | `*` | no | | filter_tags_use_defaults | Use default filter tags convention | string | `true` | no | +| latency_message | Custom message for Storage latency monitor | string | `` | no | | latency_silenced | Groups to mute for Storage latency monitor | map | `` | no | | latency_threshold_critical | Maximum acceptable end to end latency (ms) for a storage | string | `2000` | no | | latency_threshold_warning | Warning regarding acceptable end to end latency (ms) for a storage | string | 
`1000` | no | | message | Message sent when a Redis monitor is triggered | string | - | yes | +| network_error_requests_message | Custom message for Storage network errors monitor | string | `` | no | | network_error_requests_silenced | Groups to mute for Storage network errors monitor | map | `` | no | | network_error_requests_threshold_critical | Maximum acceptable percent of network error requests for a storage | string | `90` | no | | network_error_requests_threshold_warning | Warning regarding acceptable percent of network error requests for a storage | string | `50` | no | +| server_other_error_requests_message | Custom message for Storage server other errors monitor | string | `` | no | | server_other_error_requests_silenced | Groups to mute for Storage server other errors monitor | map | `` | no | | server_other_error_requests_threshold_critical | Maximum acceptable percent of server other error requests for a storage | string | `90` | no | | server_other_error_requests_threshold_warning | Warning regarding acceptable percent of server other error requests for a storage | string | `50` | no | +| successful_requests_message | Custom message for Storage successful requests monitor | string | `` | no | | successful_requests_silenced | Groups to mute for Storage sucessful requests monitor | map | `` | no | | successful_requests_threshold_critical | Minimum acceptable percent of successful requests for a storage | string | `10` | no | | successful_requests_threshold_warning | Warning regarding acceptable percent of successful requests for a storage | string | `30` | no | +| throttling_error_requests_message | Custom message for Storage throttling error monitor | string | `` | no | | throttling_error_requests_silenced | Groups to mute for Storage throttling error monitor | map | `` | no | | throttling_error_requests_threshold_critical | Maximum acceptable percent of throttling error requests for a storage | string | `90` | no | | 
throttling_error_requests_threshold_warning | Warning regarding acceptable percent of throttling error requests for a storage | string | `50` | no | +| timeout_error_requests_message | Custom message for Storage timeout monitor | string | `` | no | | timeout_error_requests_silenced | Groups to mute for Storage timeout monitor | map | `` | no | | timeout_error_requests_threshold_critical | Maximum acceptable percent of timeout error requests for a storage | string | `90` | no | | timeout_error_requests_threshold_warning | Warning regarding acceptable percent of timeout error requests for a storage | string | `50` | no | diff --git a/cloud/azure/storage/inputs.tf b/cloud/azure/storage/inputs.tf index f665a6e..6401007 100644 --- a/cloud/azure/storage/inputs.tf +++ b/cloud/azure/storage/inputs.tf @@ -24,13 +24,19 @@ variable "filter_tags_custom" { default = "*" } -# Azure Storage specific +# Azure Storage specific variables variable "availability_silenced" { description = "Groups to mute for Storage availability monitor" type = "map" default = {} } +variable "availability_message" { + description = "Custom message for Storage availability monitor" + type = "string" + default = "" +} + variable "availability_threshold_critical" { description = "Minimum acceptable percent of availability for a storage" default = 50 @@ -47,6 +53,12 @@ variable "successful_requests_silenced" { default = {} } +variable "successful_requests_message" { + description = "Custom message for Storage sucessful requests monitor" + type = "string" + default = "" +} + variable "successful_requests_threshold_critical" { description = "Minimum acceptable percent of successful requests for a storage" default = 10 @@ -63,6 +75,12 @@ variable "latency_silenced" { default = {} } +variable "latency_message" { + description = "Custom message for Storage latency monitor" + type = "string" + default = "" +} + variable "latency_threshold_critical" { description = "Maximum acceptable end to end latency (ms) for 
a storage" default = 2000 @@ -79,6 +97,12 @@ variable "timeout_error_requests_silenced" { default = {} } +variable "timeout_error_requests_message" { + description = "Custom message for Storage timeout monitor" + type = "string" + default = "" +} + variable "timeout_error_requests_threshold_critical" { description = "Maximum acceptable percent of timeout error requests for a storage" default = 90 @@ -95,6 +119,12 @@ variable "network_error_requests_silenced" { default = {} } +variable "network_error_requests_message" { + description = "Custom message for Storage network errors monitor" + type = "string" + default = "" +} + variable "network_error_requests_threshold_critical" { description = "Maximum acceptable percent of network error requests for a storage" default = 90 @@ -111,6 +141,12 @@ variable "throttling_error_requests_silenced" { default = {} } +variable "throttling_error_requests_message" { + description = "Custom message for Storage throttling error monitor" + type = "string" + default = "" +} + variable "throttling_error_requests_threshold_critical" { description = "Maximum acceptable percent of throttling error requests for a storage" default = 90 @@ -127,6 +163,12 @@ variable "server_other_error_requests_silenced" { default = {} } +variable "server_other_error_requests_message" { + description = "Custom message for Storage server other errors monitor" + type = "string" + default = "" +} + variable "server_other_error_requests_threshold_critical" { description = "Maximum acceptable percent of server other error requests for a storage" default = 90 @@ -143,6 +185,12 @@ variable "client_other_error_requests_silenced" { default = {} } +variable "client_other_error_requests_message" { + description = "Custom message for Storage other errors monitor" + type = "string" + default = "" +} + variable "client_other_error_requests_threshold_critical" { description = "Maximum acceptable percent of client other error requests for a storage" default = 90 @@ -159,6 
+207,12 @@ variable "authorization_error_requests_silenced" { default = {} } +variable "authorization_error_requests_message" { + description = "Custom message for Storage authorization errors monitor" + type = "string" + default = "" +} + variable "authorization_error_requests_threshold_critical" { description = "Maximum acceptable percent of authorization error requests for a storage" default = 90 diff --git a/cloud/azure/storage/monitors-azure-storage.tf b/cloud/azure/storage/monitors-azure-storage.tf index 4f072e2..df5f5c4 100644 --- a/cloud/azure/storage/monitors-azure-storage.tf +++ b/cloud/azure/storage/monitors-azure-storage.tf @@ -8,7 +8,7 @@ data "template_file" "filter" { resource "datadog_monitor" "availability" { name = "[${var.environment}] Azure Storage is down" - message = "${var.message}" + message = "${coalesce(var.availability_message, var.message)}" query = <` | no | | conversion_errors_threshold_critical | Conversion errors limit (critical threshold) | string | `10` | no | | conversion_errors_threshold_warning | Conversion errors limit (warning threshold) | string | `0` | no | | delay | Delay in seconds for the metric evaluation | string | `600` | no | | environment | Architecture environment | string | - | yes | +| failed_function_requests_message | Custom message for Stream Analytics failed requests monitor | string | `` | no | | failed_function_requests_silenced | Groups to mute for Stream Analytics failed requests monitor | map | `` | no | | failed_function_requests_threshold_critical | Failed Function Request rate limit (critical threshold) | string | `10` | no | | failed_function_requests_threshold_warning | Failed Function Request rate limit (warning threshold) | string | `0` | no | | filter_tags_custom | Tags used for custom filtering when filter_tags_use_defaults is false | string | `*` | no | | filter_tags_use_defaults | Use default filter tags convention | string | `true` | no | | message | Message sent when a Redis monitor is 
triggered | string | - | yes | +| runtime_errors_message | Custom message for Stream Analytics runtime errors monitor | string | `` | no | | runtime_errors_silenced | Groups to mute for Stream Analytics runtime errors monitor | map | `` | no | | runtime_errors_threshold_critical | Runtime errors limit (critical threshold) | string | `10` | no | | runtime_errors_threshold_warning | Runtime errors limit (warning threshold) | string | `0` | no | +| status_message | Custom message for Stream Analytics status monitor | string | `` | no | | status_silenced | Groups to mute for Stream Analytics status monitor | map | `` | no | +| su_utilization_message | Custom message for Stream Analytics utilization monitor | string | `` | no | | su_utilization_silenced | Groups to mute for Stream Analytics utilization monitor | map | `` | no | | su_utilization_threshold_critical | Streaming Unit utilization rate limit (critical threshold) | string | `80` | no | | su_utilization_threshold_warning | Streaming Unit utilization rate limit (warning threshold) | string | `60` | no | diff --git a/cloud/azure/stream-analytics/inputs.tf b/cloud/azure/stream-analytics/inputs.tf index d0e86fc..cc1f969 100644 --- a/cloud/azure/stream-analytics/inputs.tf +++ b/cloud/azure/stream-analytics/inputs.tf @@ -24,19 +24,31 @@ variable "filter_tags_custom" { default = "*" } -# Azure Stream Analytics specific +# Azure Stream Analytics specific variables variable "status_silenced" { description = "Groups to mute for Stream Analytics status monitor" type = "map" default = {} } +variable "status_message" { + description = "Custom message for Stream Analytics status monitor" + type = "string" + default = "" +} + variable "su_utilization_silenced" { description = "Groups to mute for Stream Analytics utilization monitor" type = "map" default = {} } +variable "su_utilization_message" { + description = "Custom message for Stream Analytics utilization monitor" + type = "string" + default = "" +} + variable 
"su_utilization_threshold_warning" { description = "Streaming Unit utilization rate limit (warning threshold)" default = 60 @@ -53,6 +65,12 @@ variable "failed_function_requests_silenced" { default = {} } +variable "failed_function_requests_message" { + description = "Custom message for Stream Analytics failed requests monitor" + type = "string" + default = "" +} + variable "failed_function_requests_threshold_warning" { description = "Failed Function Request rate limit (warning threshold)" default = 0 @@ -69,6 +87,12 @@ variable "conversion_errors_silenced" { default = {} } +variable "conversion_errors_message" { + description = "Custom message for Stream Analytics conversion errors monitor" + type = "string" + default = "" +} + variable "conversion_errors_threshold_warning" { description = "Conversion errors limit (warning threshold)" default = 0 @@ -85,6 +109,12 @@ variable "runtime_errors_silenced" { default = {} } +variable "runtime_errors_message" { + description = "Custom message for Stream Analytics runtime errors monitor" + type = "string" + default = "" +} + variable "runtime_errors_threshold_warning" { description = "Runtime errors limit (warning threshold)" default = 0 diff --git a/cloud/azure/stream-analytics/monitors-stream-analytics.tf b/cloud/azure/stream-analytics/monitors-stream-analytics.tf index 71068c2..caa423f 100644 --- a/cloud/azure/stream-analytics/monitors-stream-analytics.tf +++ b/cloud/azure/stream-analytics/monitors-stream-analytics.tf @@ -8,7 +8,7 @@ data "template_file" "filter" { resource "datadog_monitor" "status" { name = "[${var.environment}] Stream Analytics is down" - message = "${var.message}" + message = "${coalesce(var.status_message, var.message)}" query = <