2019-09-27 21:51:53 +00:00
|
|
|
// +build !providerless
|
|
|
|
|
|
|
|
/*
|
|
|
|
Copyright 2018 The Kubernetes Authors.
|
|
|
|
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
you may not use this file except in compliance with the License.
|
|
|
|
You may obtain a copy of the License at
|
|
|
|
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
See the License for the specific language governing permissions and
|
|
|
|
limitations under the License.
|
|
|
|
*/
|
|
|
|
|
2020-03-26 21:07:15 +00:00
|
|
|
package metrics
|
2019-09-27 21:51:53 +00:00
|
|
|
|
|
|
|
import (
|
|
|
|
"strings"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"k8s.io/component-base/metrics"
|
|
|
|
"k8s.io/component-base/metrics/legacyregistry"
|
|
|
|
)
|
|
|
|
|
2020-12-01 01:06:26 +00:00
|
|
|
// azureMetricsNamespace is the Namespace value used by every metric
// definition in this file.
const azureMetricsNamespace = "cloudprovider_azure"
|
2019-09-27 21:51:53 +00:00
|
|
|
|
|
|
|
var (
|
|
|
|
metricLabels = []string{
|
|
|
|
"request", // API function that is being invoked
|
|
|
|
"resource_group", // Resource group of the resource being monitored
|
|
|
|
"subscription_id", // Subscription ID of the resource being monitored
|
2020-12-01 01:06:26 +00:00
|
|
|
"source", // Operation source(optional)
|
2019-09-27 21:51:53 +00:00
|
|
|
}
|
|
|
|
|
2020-12-01 01:06:26 +00:00
|
|
|
apiMetrics = registerAPIMetrics(metricLabels...)
|
|
|
|
operationMetrics = registerOperationMetrics(metricLabels...)
|
2019-09-27 21:51:53 +00:00
|
|
|
)
|
|
|
|
|
2020-12-01 01:06:26 +00:00
|
|
|
// apiCallMetrics is the metrics measuring the performance of a single API call
|
|
|
|
// e.g., GET, POST ...
|
|
|
|
type apiCallMetrics struct {
|
|
|
|
latency *metrics.HistogramVec
|
|
|
|
errors *metrics.CounterVec
|
|
|
|
rateLimitedCount *metrics.CounterVec
|
|
|
|
throttledCount *metrics.CounterVec
|
|
|
|
}
|
|
|
|
|
|
|
|
// operationCallMetrics is the metrics measuring the performance of a whole operation
|
|
|
|
// e.g., the create / update / delete process of a loadbalancer or route.
|
|
|
|
type operationCallMetrics struct {
|
|
|
|
operationLatency *metrics.HistogramVec
|
|
|
|
operationFailureCount *metrics.CounterVec
|
|
|
|
}
|
|
|
|
|
2020-03-26 21:07:15 +00:00
|
|
|
// MetricContext carries the state needed to record Azure client metrics for
// one request or operation.
type MetricContext struct {
	// start is the reference instant from which latencies are measured.
	start time.Time
	// attributes are the label values passed to WithLabelValues on every
	// metric recorded through this context.
	attributes []string
}
|
|
|
|
|
2020-03-26 21:07:15 +00:00
|
|
|
// NewMetricContext creates a new MetricContext.
|
|
|
|
func NewMetricContext(prefix, request, resourceGroup, subscriptionID, source string) *MetricContext {
|
|
|
|
return &MetricContext{
|
2019-09-27 21:51:53 +00:00
|
|
|
start: time.Now(),
|
|
|
|
attributes: []string{prefix + "_" + request, strings.ToLower(resourceGroup), subscriptionID, source},
|
|
|
|
}
|
|
|
|
}
|
2020-03-26 21:07:15 +00:00
|
|
|
|
|
|
|
// RateLimitedCount records the metrics for rate limited request count.
|
|
|
|
func (mc *MetricContext) RateLimitedCount() {
|
2019-12-12 01:27:03 +00:00
|
|
|
apiMetrics.rateLimitedCount.WithLabelValues(mc.attributes...).Inc()
|
|
|
|
}
|
2019-09-27 21:51:53 +00:00
|
|
|
|
2020-03-26 21:07:15 +00:00
|
|
|
// ThrottledCount records the metrics for throttled request count.
|
|
|
|
func (mc *MetricContext) ThrottledCount() {
|
|
|
|
apiMetrics.throttledCount.WithLabelValues(mc.attributes...).Inc()
|
|
|
|
}
|
|
|
|
|
|
|
|
// Observe observes the request latency and failed requests.
|
|
|
|
func (mc *MetricContext) Observe(err error) error {
|
2019-09-27 21:51:53 +00:00
|
|
|
apiMetrics.latency.WithLabelValues(mc.attributes...).Observe(
|
|
|
|
time.Since(mc.start).Seconds())
|
|
|
|
if err != nil {
|
|
|
|
apiMetrics.errors.WithLabelValues(mc.attributes...).Inc()
|
|
|
|
}
|
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2020-12-01 01:06:26 +00:00
|
|
|
// ObserveOperationWithResult observes the request latency and failed requests of an operation.
|
|
|
|
func (mc *MetricContext) ObserveOperationWithResult(isOperationSucceeded bool) {
|
|
|
|
operationMetrics.operationLatency.WithLabelValues(mc.attributes...).Observe(
|
|
|
|
time.Since(mc.start).Seconds())
|
|
|
|
if !isOperationSucceeded {
|
|
|
|
mc.CountFailedOperation()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// CountFailedOperation increase the number of failed operations
|
|
|
|
func (mc *MetricContext) CountFailedOperation() {
|
|
|
|
operationMetrics.operationFailureCount.WithLabelValues(mc.attributes...).Inc()
|
|
|
|
}
|
|
|
|
|
2020-03-26 21:07:15 +00:00
|
|
|
// registerAPIMetrics registers the API metrics.
|
2019-09-27 21:51:53 +00:00
|
|
|
func registerAPIMetrics(attributes ...string) *apiCallMetrics {
|
|
|
|
metrics := &apiCallMetrics{
|
|
|
|
latency: metrics.NewHistogramVec(
|
|
|
|
&metrics.HistogramOpts{
|
2020-12-01 01:06:26 +00:00
|
|
|
Namespace: azureMetricsNamespace,
|
|
|
|
Name: "api_request_duration_seconds",
|
2019-09-27 21:51:53 +00:00
|
|
|
Help: "Latency of an Azure API call",
|
2020-10-14 19:03:41 +00:00
|
|
|
Buckets: []float64{.1, .25, .5, 1, 2.5, 5, 10, 15, 25, 50, 120, 300, 600, 1200},
|
2019-09-27 21:51:53 +00:00
|
|
|
StabilityLevel: metrics.ALPHA,
|
|
|
|
},
|
|
|
|
attributes,
|
|
|
|
),
|
|
|
|
errors: metrics.NewCounterVec(
|
|
|
|
&metrics.CounterOpts{
|
2020-12-01 01:06:26 +00:00
|
|
|
Namespace: azureMetricsNamespace,
|
|
|
|
Name: "api_request_errors",
|
2019-09-27 21:51:53 +00:00
|
|
|
Help: "Number of errors for an Azure API call",
|
|
|
|
StabilityLevel: metrics.ALPHA,
|
|
|
|
},
|
|
|
|
attributes,
|
|
|
|
),
|
2019-12-12 01:27:03 +00:00
|
|
|
rateLimitedCount: metrics.NewCounterVec(
|
|
|
|
&metrics.CounterOpts{
|
2020-12-01 01:06:26 +00:00
|
|
|
Namespace: azureMetricsNamespace,
|
|
|
|
Name: "api_request_ratelimited_count",
|
2019-12-12 01:27:03 +00:00
|
|
|
Help: "Number of rate limited Azure API calls",
|
|
|
|
StabilityLevel: metrics.ALPHA,
|
|
|
|
},
|
|
|
|
attributes,
|
|
|
|
),
|
2020-03-26 21:07:15 +00:00
|
|
|
throttledCount: metrics.NewCounterVec(
|
|
|
|
&metrics.CounterOpts{
|
2020-12-01 01:06:26 +00:00
|
|
|
Namespace: azureMetricsNamespace,
|
|
|
|
Name: "api_request_throttled_count",
|
2020-03-26 21:07:15 +00:00
|
|
|
Help: "Number of throttled Azure API calls",
|
|
|
|
StabilityLevel: metrics.ALPHA,
|
|
|
|
},
|
|
|
|
attributes,
|
|
|
|
),
|
2019-09-27 21:51:53 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
legacyregistry.MustRegister(metrics.latency)
|
|
|
|
legacyregistry.MustRegister(metrics.errors)
|
2019-12-12 01:27:03 +00:00
|
|
|
legacyregistry.MustRegister(metrics.rateLimitedCount)
|
2020-03-26 21:07:15 +00:00
|
|
|
legacyregistry.MustRegister(metrics.throttledCount)
|
2019-09-27 21:51:53 +00:00
|
|
|
|
|
|
|
return metrics
|
|
|
|
}
|
2020-12-01 01:06:26 +00:00
|
|
|
|
|
|
|
// registerOperationMetrics registers the operation metrics.
|
|
|
|
func registerOperationMetrics(attributes ...string) *operationCallMetrics {
|
|
|
|
metrics := &operationCallMetrics{
|
|
|
|
operationLatency: metrics.NewHistogramVec(
|
|
|
|
&metrics.HistogramOpts{
|
|
|
|
Namespace: azureMetricsNamespace,
|
|
|
|
Name: "op_duration_seconds",
|
|
|
|
Help: "Latency of an Azure service operation",
|
|
|
|
StabilityLevel: metrics.ALPHA,
|
|
|
|
Buckets: []float64{0.1, 0.2, 0.5, 1, 10, 20, 30, 40, 50, 60, 100, 200, 300},
|
|
|
|
},
|
|
|
|
attributes,
|
|
|
|
),
|
|
|
|
operationFailureCount: metrics.NewCounterVec(
|
|
|
|
&metrics.CounterOpts{
|
|
|
|
Namespace: azureMetricsNamespace,
|
|
|
|
Name: "op_failure_count",
|
|
|
|
Help: "Number of failed Azure service operations",
|
|
|
|
StabilityLevel: metrics.ALPHA,
|
|
|
|
},
|
|
|
|
attributes,
|
|
|
|
),
|
|
|
|
}
|
|
|
|
|
|
|
|
legacyregistry.MustRegister(metrics.operationLatency)
|
|
|
|
legacyregistry.MustRegister(metrics.operationFailureCount)
|
|
|
|
|
|
|
|
return metrics
|
|
|
|
}
|