diff --git a/services/CognitiveServices/accounts/alerts.yaml b/services/CognitiveServices/accounts/alerts.yaml index 9d8a784db..2105993ce 100644 --- a/services/CognitiveServices/accounts/alerts.yaml +++ b/services/CognitiveServices/accounts/alerts.yaml @@ -308,19 +308,19 @@ - name: AzureOpenAIContextTokensCacheMatchRate description: Percentage of the prompt tokens hit the cache, available for PTU-managed. type: Metric - verified: false - visible: false + verified: true + visible: true tags: manual-ck properties: metricName: AzureOpenAIContextTokensCacheMatchRate metricNamespace: Microsoft.CognitiveServices/accounts - severity: 0 + severity: 2 windowSize: PT5M evaluationFrequency: PT1M timeAggregation: Total operator: GreaterThan criterionType: StaticThresholdCriterion - threshold: 0.0 + threshold: 75 guid: 81f8369c-65bf-4194-bfd2-ffdfa2470577 - name: AzureOpenAIProvisionedManagedUtilization description: Utilization % for a provisioned-managed deployment, calculated as (PTUs consumed / PTUs deployed) x 100. @@ -342,19 +342,19 @@ - name: AzureOpenAIProvisionedManagedUtilizationV2 description: Utilization % for a provisioned-managed deployment, calculated as (PTUs consumed / PTUs deployed) x 100. type: Metric - verified: false - visible: false + verified: true + visible: true tags: manual-ck properties: metricName: AzureOpenAIProvisionedManagedUtilizationV2 metricNamespace: Microsoft.CognitiveServices/accounts - severity: 0 + severity: 2 windowSize: PT5M evaluationFrequency: PT1M timeAggregation: Total operator: GreaterThan criterionType: StaticThresholdCriterion - threshold: 0.0 + threshold: 80 guid: 693a3b37-1e2a-42d1-aaed-b1f374276d1c - name: AzureOpenAIRequests description: Number of calls made to the Azure OpenAI API over a period of time. @@ -374,21 +374,21 @@ threshold: 0.0 guid: a1528d17-f288-46b1-b084-8b8fe3af90fa - name: AzureOpenAITimeToResponse - description: Recommended latency (responsiveness) measure for streaming requests. 
+ description: Recommended latency (responsiveness) measure for streaming requests. Time in milliseconds. type: Metric - verified: false - visible: false + verified: true + visible: true tags: manual-ck properties: metricName: AzureOpenAITimeToResponse metricNamespace: Microsoft.CognitiveServices/accounts - severity: 0 + severity: 2 windowSize: PT5M evaluationFrequency: PT1M timeAggregation: Total operator: GreaterThan criterionType: StaticThresholdCriterion - threshold: 0.0 + threshold: 200 guid: 995cc12a-1887-4669-92c5-70a6ca8bfe70 - name: BaselineEstimatorOverallReward description: Baseline Estimator Overall Reward.