Skip to content

Commit

Permalink
Merge pull request #2314 from newrelic/release
Browse files Browse the repository at this point in the history
Release 3/7/23
  • Loading branch information
brammerl authored Mar 7, 2024
2 parents 3db467c + 2d49e7c commit 32aa5f3
Show file tree
Hide file tree
Showing 51 changed files with 2,711 additions and 191 deletions.
31 changes: 31 additions & 0 deletions alert-policies/temporal/ActivityEexcutionFail.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,31 @@
# Name of the alert
name: Activity Execution Fails

# Description and details
# Kept in step with the condition below: latest() of the failure metric,
# strictly ABOVE 1, for ALL data points across the 300 second duration.
description: |+
  This alert is triggered if the latest Temporal activity execution failure count stays above 1 for 5 minutes.
# Type of alert
type: STATIC

# NRQL query
nrql:
  # Reads the most recent value of the activity failure metric.
  query: "SELECT latest(temporal_activity_execution_failed_total) AS 'execution failed' FROM Metric"

# Function used to aggregate the NRQL query value(s) for comparison to the terms.threshold (Default: SINGLE_VALUE)
valueFunction: SINGLE_VALUE

# List of Critical and Warning thresholds for the condition
terms:
  - priority: CRITICAL
    # Operator used to compare against the threshold.
    operator: ABOVE
    # Value that triggers a violation
    # NOTE(review): ABOVE 1 only matches values strictly greater than 1. If a
    # single failure is meant to open a violation, this probably wants a
    # threshold of 0 - confirm the intent before changing it.
    threshold: 1
    # Time in seconds; 120 - 3600
    thresholdDuration: 300
    # How many data points must be in violation for the duration
    thresholdOccurrences: ALL

# Duration after which a violation automatically closes
# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
violationTimeLimitSeconds: 86400
40 changes: 40 additions & 0 deletions alert-policies/temporal/ActivityExecutionLatency.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,40 @@
# Name of the alert
name: Activity Execution Latency

# Description and details
description: |+
  This alert is triggered if the Temporal activity execution latency exceeds 5 seconds for 5 minutes.
# Type of alert
type: STATIC

# NRQL query
nrql:
  # NOTE(review): this adds up the `_sum` series, so the compared value is a
  # total rather than a per-execution latency - confirm that is what the
  # 4 / 5 second thresholds below are meant to be measured against.
  query: "SELECT sum(temporal_activity_execution_latency_seconds_sum) FROM Metric"

# Function used to aggregate the NRQL query value(s) for comparison to the terms.threshold (Default: SINGLE_VALUE)
valueFunction: SINGLE_VALUE

# List of Critical and Warning thresholds for the condition
terms:
  - priority: CRITICAL
    # Operator used to compare against the threshold.
    operator: ABOVE
    # Value that triggers a violation
    threshold: 5
    # Time in seconds; 120 - 3600
    thresholdDuration: 300
    # How many data points must be in violation for the duration
    thresholdOccurrences: ALL
  - priority: WARNING
    # Operator used to compare against the threshold.
    operator: ABOVE
    # Value that triggers a violation
    threshold: 4
    # Time in seconds; 120 - 3600
    thresholdDuration: 300
    # How many data points must be in violation for the duration
    thresholdOccurrences: ALL

# Duration after which a violation automatically closes
# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
violationTimeLimitSeconds: 86400
40 changes: 40 additions & 0 deletions alert-policies/temporal/ActivityScheduleStartLatency.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,40 @@
# Alert condition title
name: Activity Schedule to Start Latency

# Human-readable summary of when the condition fires
description: |+
  This alert is triggered if the Temporal activity schedule to start latency exceeds 5 seconds for 5 minutes.
# Condition type
type: STATIC

# Query whose result is compared against the terms below
nrql:
  query: 'SELECT sum(temporal_activity_schedule_to_start_latency_sum) FROM Metric'

# How the query result is reduced before comparison with terms.threshold
# (Default: SINGLE_VALUE)
valueFunction: SINGLE_VALUE

# Thresholds: one CRITICAL term and one WARNING term
terms:
  # Critical: value above 5 for every data point over 300 seconds
  - priority: CRITICAL
    operator: ABOVE
    threshold: 5
    # Seconds; allowed range 120 - 3600
    thresholdDuration: 300
    thresholdOccurrences: ALL
  # Warning: value above 4 for every data point over 300 seconds
  - priority: WARNING
    operator: ABOVE
    threshold: 4
    # Seconds; allowed range 120 - 3600
    thresholdDuration: 300
    thresholdOccurrences: ALL

# Seconds after which an open violation closes automatically
# Allowed range 300 - 2592000 (Default: 86400 [1 day])
violationTimeLimitSeconds: 86400
40 changes: 40 additions & 0 deletions alert-policies/temporal/MemoryUsagePercent.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,40 @@
# Alert condition title
name: Memory Usage Percent

# Human-readable summary of when the condition fires
description: |+
  This alert is triggered if the memory usage exceeds 90% for 5 minutes.
# Condition type
type: STATIC

# Query whose result is compared against the terms below
nrql:
  query: 'SELECT average(memoryUsedPercent) AS `Memory used %` FROM SystemSample'

# How the query result is reduced before comparison with terms.threshold
# (Default: SINGLE_VALUE)
valueFunction: SINGLE_VALUE

# Thresholds: one CRITICAL term and one WARNING term
terms:
  # Critical: average above 90 for every data point over 300 seconds
  - priority: CRITICAL
    operator: ABOVE
    threshold: 90
    # Seconds; allowed range 120 - 3600
    thresholdDuration: 300
    thresholdOccurrences: ALL
  # Warning: average above 85 for every data point over 300 seconds
  - priority: WARNING
    operator: ABOVE
    threshold: 85
    # Seconds; allowed range 120 - 3600
    thresholdDuration: 300
    thresholdOccurrences: ALL

# Seconds after which an open violation closes automatically
# Allowed range 300 - 2592000 (Default: 86400 [1 day])
violationTimeLimitSeconds: 86400
4 changes: 2 additions & 2 deletions dashboards/amazon-athena/amazon-athena.json
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT average(provider.totalExecutionTime.Sum) / 1000 AS 'Average execution time (s)', max(provider.totalExecutionTime.Maximum) / 1000 AS 'Max execution time (s)', min(provider.totalExecutionTime.Minimum) / 1000 AS 'Min execution time (s)' FROM AwsAthenaWorkGroupSample WHERE providerExternalId LIKE '%' SINCE 1 hour ago"
"query": "SELECT (average(`getField`(`aws.athena.TotalExecutionTime`, `total`)) / 1000) AS `Average execution time (s)`, (max(`aws.athena.TotalExecutionTime`) / 1000) AS `Max execution time (s)`, (min(`aws.athena.TotalExecutionTime`) / 1000) AS `Min execution time (s)` FROM Metric WHERE (newrelic.cloudIntegrations.providerExternalId LIKE '%') SINCE 1 HOURS AGO"
}
]
}
Expand Down Expand Up @@ -101,7 +101,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT awsAccountId, awsRegion, providerExternalId FROM AwsAthenaWorkGroupSample SINCE 1 hour ago"
"query": "SELECT aws.accountId, aws.region, newrelic.cloudIntegrations.providerExternalId FROM Metric SINCE 1 HOURS AGO"
}
]
}
Expand Down
12 changes: 6 additions & 6 deletions dashboards/amazon-linux/amazon-linux.json
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT sum(aws.ec2.CPUCreditBalance) AS 'Total CPU Credit Balance', sum(aws.ec2.CPUCreditUsage) AS 'CPU credit used', sum(aws.ec2.CPUSurplusCreditsCharged) AS 'CPU Surplus Credit Charged' FROM Metric WHERE collector.name = 'cloudwatch-metric-streams' AND aws.Namespace = 'AWS/EC2' FACET aws.ec2.InstanceId SINCE 1 hour ago"
"query": "SELECT sum(`provider.cpuCreditBalance.Sum`) AS `Total CPU Credit Balance`, sum(`provider.cpuCreditUsage.Sum`) AS `CPU credit used`, sum(`provider.cpuSurplusCreditsCharged.Sum`) AS `CPU Surplus Credit Charged` FROM ComputeSample WHERE ((`provider` = 'Ec2Instance') AND ((`collector`.`name` = 'cloudwatch-metric-streams') AND (`aws`.`Namespace` = 'AWS/EC2'))) SINCE 1 HOURS AGO FACET (ec2InstanceId OR provider.ec2InstanceId)"
}
]
},
Expand Down Expand Up @@ -70,7 +70,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT sum(aws.ec2.StatusCheckFailed) AS 'Failed Checks' FROM Metric WHERE aws.Namespace = 'AWS/EC2' SINCE 1 hour ago"
"query": "SELECT sum(`provider.statusCheckFailed.Sum`) AS `Failed Checks` FROM ComputeSample WHERE ((`provider` = 'Ec2Instance') AND (`aws`.`Namespace` = 'AWS/EC2')) SINCE 1 HOURS AGO"
}
],
"thresholds": []
Expand Down Expand Up @@ -98,7 +98,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT average(aws.ec2.CPUUtilization) FROM Metric WHERE collector.name = 'cloudwatch-metric-streams' AND aws.Namespace = 'AWS/EC2' FACET aws.ec2.InstanceId SINCE 1 hour ago TIMESERIES 5 minutes "
"query": "SELECT average(`provider.cpuUtilization.Average`) FROM ComputeSample WHERE ((`provider` = 'Ec2Instance') AND ((`collector`.`name` = 'cloudwatch-metric-streams') AND (`aws`.`Namespace` = 'AWS/EC2'))) SINCE 1 HOURS AGO FACET (ec2InstanceId OR provider.ec2InstanceId) TIMESERIES 300000"
}
],
"yAxisLeft": {
Expand Down Expand Up @@ -128,7 +128,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT average(aws.ec2.NetworkIn), average(aws.ec2.NetworkOut) FROM Metric WHERE collector.name = 'cloudwatch-metric-streams' AND aws.Namespace = 'AWS/EC2' FACET aws.ec2.InstanceId SINCE 1 hour ago TIMESERIES 5 minutes "
"query": "SELECT average(`provider.networkInBytes.Average`), average(`provider.networkOutBytes.Average`) FROM ComputeSample WHERE ((`provider` = 'Ec2Instance') AND ((`collector`.`name` = 'cloudwatch-metric-streams') AND (`aws`.`Namespace` = 'AWS/EC2'))) SINCE 1 HOURS AGO FACET (ec2InstanceId OR provider.ec2InstanceId) TIMESERIES 300000"
}
],
"yAxisLeft": {
Expand Down Expand Up @@ -158,7 +158,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT average(aws.ec2.DiskReadOps), average(aws.ec2.DiskWriteOps) FROM Metric WHERE collector.name = 'cloudwatch-metric-streams' AND aws.Namespace = 'AWS/EC2' FACET aws.ec2.InstanceId SINCE 1 hour ago TIMESERIES 5 minutes "
"query": "SELECT average(`provider.diskReadOps.Average`), average(`provider.diskWriteOps.Average`) FROM ComputeSample WHERE ((`provider` = 'Ec2Instance') AND ((`collector`.`name` = 'cloudwatch-metric-streams') AND (`aws`.`Namespace` = 'AWS/EC2'))) SINCE 1 HOURS AGO FACET (ec2InstanceId OR provider.ec2InstanceId) TIMESERIES 300000"
}
],
"yAxisLeft": {
Expand Down Expand Up @@ -188,7 +188,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT average(aws.ec2.DiskReadBytes), average(aws.ec2.DiskWriteBytes) FROM Metric WHERE collector.name = 'cloudwatch-metric-streams' AND aws.Namespace = 'AWS/EC2' FACET aws.ec2.InstanceId SINCE 1 hour ago TIMESERIES 5 minutes "
"query": "SELECT average(`provider.diskReadBytes.Average`), average(`provider.diskWriteBytes.Average`) FROM ComputeSample WHERE ((`provider` = 'Ec2Instance') AND ((`collector`.`name` = 'cloudwatch-metric-streams') AND (`aws`.`Namespace` = 'AWS/EC2'))) SINCE 1 HOURS AGO FACET (ec2InstanceId OR provider.ec2InstanceId) TIMESERIES 300000"
}
],
"yAxisLeft": {
Expand Down
14 changes: 7 additions & 7 deletions dashboards/aws-billing/aws-billing.json
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT latest(`aws.billing.EstimatedCharges.byServiceCost`) FROM Metric since 1 day ago facet `aws.billing.ServiceName` limit 100"
"query": "SELECT latest(`provider.estimatedCharges.Maximum`) FROM FinanceSample WHERE (`provider` = 'BillingServiceCost') SINCE 1 DAYS AGO FACET provider.serviceName LIMIT 100"
}
]
}
Expand Down Expand Up @@ -56,7 +56,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT latest(`aws.billing.EstimatedCharges.byAccountCost`) FROM Metric since 1 day ago facet `provider.accountId` limit 100"
"query": "SELECT latest(`provider.estimatedCharges.Maximum`) FROM FinanceSample WHERE (`provider` = 'BillingAccountCost') SINCE 1 DAYS AGO FACET provider.accountId LIMIT 100"
}
]
}
Expand All @@ -82,7 +82,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT latest(`aws.billing.budgetType`) as 'Budget Type', max(`aws.billing.actualAmount.byBudget`) as 'Actual Amount', max(`aws.billing.limitAmount.byBudget`) as 'Budget Limit', latest(`aws.billing.forecastedAmount.byBudget`) as 'Forecast' FROM Metric facet `aws.billing.budgetName` since 1 day ago"
"query": "SELECT latest(provider.budgetType) AS `Budget Type`, max(provider.actualAmount) AS `Actual Amount`, max(provider.limitAmount) AS `Budget Limit`, latest(provider.forecastedAmount) AS `Forecast` FROM FinanceSample WHERE (`provider` = 'BillingBudget') SINCE 1 DAYS AGO FACET provider.budgetName"
}
]
}
Expand Down Expand Up @@ -117,7 +117,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT max(`aws.billing.actualAmount.byBudget`) FROM Metric where `aws.billing.budgetType` = 'COST' TIMESERIES auto since 4 days ago facet `aws.billing.budgetName`"
"query": "SELECT max(provider.actualAmount) FROM FinanceSample WHERE ((`provider` = 'BillingBudget') AND (provider.budgetType = 'COST')) SINCE 4 DAYS AGO FACET provider.budgetName TIMESERIES AUTO"
}
]
}
Expand All @@ -137,7 +137,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT max(`aws.billing.actualAmount.byBudget`) FROM Metric where `aws.billing.budgetType`='USAGE' TIMESERIES auto since 4 days ago facet `aws.billing.budgetName`"
"query": "SELECT max(provider.actualAmount) FROM FinanceSample WHERE ((`provider` = 'BillingBudget') AND (provider.budgetType = 'USAGE')) SINCE 4 DAYS AGO FACET provider.budgetName TIMESERIES AUTO"
}
]
}
Expand All @@ -157,7 +157,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT max(`aws.billing.forecastedAmount.byBudget`) FROM Metric where `aws.billing.budgetType`='COST' TIMESERIES auto since 4 days ago facet `aws.billing.budgetName`"
"query": "SELECT max(provider.forecastedAmount) FROM FinanceSample WHERE ((`provider` = 'BillingBudget') AND (provider.budgetType = 'COST')) SINCE 4 DAYS AGO FACET provider.budgetName TIMESERIES AUTO"
}
]
}
Expand All @@ -177,7 +177,7 @@
"nrqlQueries": [
{
"accountId": 0,
"query": "SELECT max(`aws.billing.forecastedAmount.byBudget`) FROM Metric where `aws.billing.budgetType`='USAGE' TIMESERIES auto since 4 days ago facet `aws.billing.budgetName`"
"query": "SELECT max(provider.forecastedAmount) FROM FinanceSample WHERE ((`provider` = 'BillingBudget') AND (provider.budgetType = 'USAGE')) SINCE 4 DAYS AGO FACET provider.budgetName TIMESERIES AUTO"
}
]
}
Expand Down
Binary file modified dashboards/aws-network-firewall/aws-network-firewall.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading

0 comments on commit 32aa5f3

Please sign in to comment.