Skip to content
5 changes: 5 additions & 0 deletions packages/azure_openai/changelog.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,9 @@
# newer versions go on top
- version: "1.10.0"
changes:
- description: Add Alerting Rule Templates.
type: enhancement
link: https://github.com/elastic/integrations/pull/15412
- version: "1.9.0"
changes:
- description: Add a flag `fips_compatible` to control whether the package is allowed in the ECH FedRAMP High environment.
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
{
"id": "latency_spike",
"type": "alerting_rule_template",
"attributes": {
"name": "[Azure OpenAI] Latency Spike",
"tags": ["Azure OpenAI",
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
"tags": ["Azure OpenAI",
"tags": ["azure", "openai", "latency"]

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This integration is specific to Azure OpenAI monitoring, so it's good to keep the "Azure OpenAI" tag.

"Latency Spike"],
"ruleTypeId": ".es-query",
"schedule": {
"interval": "1m"
},
"params": {
"searchType": "esqlQuery",
"timeWindowSize": 15,
"timeWindowUnit": "m",
"threshold": [
0
],
"thresholdComparator": ">",
"size": 100,
"esqlQuery": {
"esql": "FROM metrics-azure.ai_foundry-default\n| STATS time_to_response = AVG(azure.ai_foundry.time_to_response.avg) by azure.dimensions.model_deployment_name\n| WHERE time_to_response > 5000"
},
"aggType": "count",
"groupBy": "all",
"termSize": 5,
"sourceFields": [],
"timeField": "@timestamp",
"excludeHitsFromPreviousRun": true
},
"alertDelay": {
"active": 1
}
},
"managed": true,
"coreMigrationVersion": "8.8.0",
"typeMigrationVersion": "10.1.0"
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
{
  "id": "provisioned_utilization",
  "type": "alerting_rule_template",
  "attributes": {
    "name": "[Azure OpenAI] Provisioned Utilization",
    "tags": [
      "Azure OpenAI",
      "Provisioned Utilization"
    ],
    "ruleTypeId": ".es-query",
    "schedule": {
      "interval": "1m"
    },
    "params": {
      "searchType": "esqlQuery",
      "timeWindowSize": 15,
      "timeWindowUnit": "m",
      "threshold": [
        0
      ],
      "thresholdComparator": ">",
      "size": 100,
      "esqlQuery": {
        "esql": "FROM metrics-azure.ai_foundry-default\n| STATS provisioned_utilization = MAX(azure.ai_foundry.provisioned_utilization.avg) * 100 by azure.dimensions.model_deployment_name\n| WHERE provisioned_utilization > 85"
      },
      "aggType": "count",
      "groupBy": "all",
      "termSize": 5,
      "sourceFields": [],
      "timeField": "@timestamp",
      "excludeHitsFromPreviousRun": true
    },
    "alertDelay": {
      "active": 1
    }
  },
  "managed": true,
  "coreMigrationVersion": "8.8.0",
  "typeMigrationVersion": "10.1.0"
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
{
  "id": "quota_error_rates",
  "type": "alerting_rule_template",
  "attributes": {
    "name": "[Azure OpenAI] Quota Error Rates",
    "tags": [
      "Azure OpenAI",
      "Quota Error Rates"
    ],
    "ruleTypeId": ".es-query",
    "schedule": {
      "interval": "1m"
    },
    "params": {
      "searchType": "esqlQuery",
      "timeWindowSize": 15,
      "timeWindowUnit": "m",
      "threshold": [
        0
      ],
      "thresholdComparator": ">",
      "size": 100,
      "esqlQuery": {
        "esql": "FROM logs-azure_openai.logs-default\n| WHERE http.response.status_code == 429\n| STATS quota_error = COUNT(*) by azure.dimensions.model_deployment_name\n| WHERE quota_error > 0"
      },
      "aggType": "count",
      "groupBy": "all",
      "termSize": 5,
      "sourceFields": [],
      "timeField": "@timestamp",
      "excludeHitsFromPreviousRun": true
    },
    "alertDelay": {
      "active": 1
    }
  },
  "managed": true,
  "coreMigrationVersion": "8.8.0",
  "typeMigrationVersion": "10.1.0"
}
4 changes: 2 additions & 2 deletions packages/azure_openai/manifest.yml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
format_version: 3.1.3
format_version: 3.5.0
name: azure_openai
title: "Azure OpenAI"
version: "1.9.0"
version: "1.10.0"
source:
license: "Elastic-2.0"
description: "Collects Azure OpenAI Logs and Metrics"
Expand Down