mirror of
				https://github.com/k3s-io/kubernetes.git
				synced 2025-10-31 05:40:42 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			163 lines
		
	
	
		
			6.0 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			163 lines
		
	
	
		
			6.0 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| /*
 | |
| Copyright 2017 The Kubernetes Authors.
 | |
| 
 | |
| Licensed under the Apache License, Version 2.0 (the "License");
 | |
| you may not use this file except in compliance with the License.
 | |
| You may obtain a copy of the License at
 | |
| 
 | |
|     http://www.apache.org/licenses/LICENSE-2.0
 | |
| 
 | |
| Unless required by applicable law or agreed to in writing, software
 | |
| distributed under the License is distributed on an "AS IS" BASIS,
 | |
| WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
| See the License for the specific language governing permissions and
 | |
| limitations under the License.
 | |
| */
 | |
| 
 | |
| package util
 | |
| 
 | |
| import (
 | |
| 	"fmt"
 | |
| 	"strconv"
 | |
| 	"time"
 | |
| 
 | |
| 	"google.golang.org/grpc/codes"
 | |
| 	"google.golang.org/grpc/status"
 | |
| 	utilfeature "k8s.io/apiserver/pkg/util/feature"
 | |
| 	"k8s.io/component-base/metrics"
 | |
| 	"k8s.io/component-base/metrics/legacyregistry"
 | |
| 	"k8s.io/kubernetes/pkg/features"
 | |
| 	"k8s.io/kubernetes/pkg/volume"
 | |
| 	"k8s.io/kubernetes/pkg/volume/util/types"
 | |
| )
 | |
| 
 | |
| const (
 | |
| 	statusSuccess     = "success"
 | |
| 	statusFailUnknown = "fail-unknown"
 | |
| )
 | |
| 
 | |
| /*
 | |
|  * By default, all the following metrics are defined as falling under
 | |
|  * ALPHA stability level https://github.com/kubernetes/enhancements/blob/master/keps/sig-instrumentation/1209-metrics-stability/kubernetes-control-plane-metrics-stability.md#stability-classes)
 | |
|  *
 | |
|  * Promoting the stability level of the metric is a responsibility of the component owner, since it
 | |
|  * involves explicitly acknowledging support for the metric across multiple releases, in accordance with
 | |
|  * the metric stability policy.
 | |
|  */
 | |
| var storageOperationMetric = metrics.NewHistogramVec(
 | |
| 	&metrics.HistogramOpts{
 | |
| 		Name:           "storage_operation_duration_seconds",
 | |
| 		Help:           "Storage operation duration",
 | |
| 		Buckets:        []float64{.1, .25, .5, 1, 2.5, 5, 10, 15, 25, 50, 120, 300, 600},
 | |
| 		StabilityLevel: metrics.ALPHA,
 | |
| 	},
 | |
| 	[]string{"volume_plugin", "operation_name", "status", "migrated"},
 | |
| )
 | |
| 
 | |
| var storageOperationEndToEndLatencyMetric = metrics.NewHistogramVec(
 | |
| 	&metrics.HistogramOpts{
 | |
| 		Name:           "volume_operation_total_seconds",
 | |
| 		Help:           "Storage operation end to end duration in seconds",
 | |
| 		Buckets:        []float64{.1, .25, .5, 1, 2.5, 5, 10, 15, 25, 50, 120, 300, 600},
 | |
| 		StabilityLevel: metrics.ALPHA,
 | |
| 	},
 | |
| 	[]string{"plugin_name", "operation_name"},
 | |
| )
 | |
| 
 | |
| var csiOperationsLatencyMetric = metrics.NewHistogramVec(
 | |
| 	&metrics.HistogramOpts{
 | |
| 		Subsystem:      "csi",
 | |
| 		Name:           "operations_seconds",
 | |
| 		Help:           "Container Storage Interface operation duration with gRPC error code status total",
 | |
| 		Buckets:        []float64{.1, .25, .5, 1, 2.5, 5, 10, 15, 25, 50, 120, 300, 600},
 | |
| 		StabilityLevel: metrics.ALPHA,
 | |
| 	},
 | |
| 	[]string{"driver_name", "method_name", "grpc_status_code", "migrated"},
 | |
| )
 | |
| 
 | |
| func init() {
 | |
| 	registerMetrics()
 | |
| }
 | |
| 
 | |
| func registerMetrics() {
 | |
| 	// legacyregistry is the internal k8s wrapper around the prometheus
 | |
| 	// global registry, used specifically for metric stability enforcement
 | |
| 	legacyregistry.MustRegister(storageOperationMetric)
 | |
| 	legacyregistry.MustRegister(storageOperationEndToEndLatencyMetric)
 | |
| 	legacyregistry.MustRegister(csiOperationsLatencyMetric)
 | |
| }
 | |
| 
 | |
| // OperationCompleteHook returns a hook to call when an operation is completed
 | |
| func OperationCompleteHook(plugin, operationName string) func(types.CompleteFuncParam) {
 | |
| 	requestTime := time.Now()
 | |
| 	opComplete := func(c types.CompleteFuncParam) {
 | |
| 		timeTaken := time.Since(requestTime).Seconds()
 | |
| 		// Create metric with operation name and plugin name
 | |
| 		status := statusSuccess
 | |
| 		if *c.Err != nil {
 | |
| 			// TODO: Establish well-known error codes to be able to distinguish
 | |
| 			// user configuration errors from system errors.
 | |
| 			status = statusFailUnknown
 | |
| 		}
 | |
| 		migrated := false
 | |
| 		if c.Migrated != nil {
 | |
| 			migrated = *c.Migrated
 | |
| 		}
 | |
| 		storageOperationMetric.WithLabelValues(plugin, operationName, status, strconv.FormatBool(migrated)).Observe(timeTaken)
 | |
| 	}
 | |
| 	return opComplete
 | |
| }
 | |
| 
 | |
| // FSGroupCompleteHook returns a hook to call when volume recursive permission is changed
 | |
| func FSGroupCompleteHook(plugin volume.VolumePlugin, spec *volume.Spec) func(types.CompleteFuncParam) {
 | |
| 	return OperationCompleteHook(GetFullQualifiedPluginNameForVolume(plugin.GetPluginName(), spec), "volume_apply_access_control")
 | |
| }
 | |
| 
 | |
| // GetFullQualifiedPluginNameForVolume returns full qualified plugin name for
 | |
| // given volume. For CSI plugin, it appends plugin driver name at the end of
 | |
| // plugin name, e.g. kubernetes.io/csi:csi-hostpath. It helps to distinguish
 | |
| // between metrics emitted for CSI volumes which may be handled by different
 | |
| // CSI plugin drivers.
 | |
| func GetFullQualifiedPluginNameForVolume(pluginName string, spec *volume.Spec) string {
 | |
| 	if spec != nil {
 | |
| 		if spec.Volume != nil && spec.Volume.CSI != nil && utilfeature.DefaultFeatureGate.Enabled(features.CSIInlineVolume) {
 | |
| 			return fmt.Sprintf("%s:%s", pluginName, spec.Volume.CSI.Driver)
 | |
| 		}
 | |
| 		if spec.PersistentVolume != nil && spec.PersistentVolume.Spec.CSI != nil {
 | |
| 			return fmt.Sprintf("%s:%s", pluginName, spec.PersistentVolume.Spec.CSI.Driver)
 | |
| 		}
 | |
| 	}
 | |
| 	return pluginName
 | |
| }
 | |
| 
 | |
| // RecordOperationLatencyMetric records the end to end latency for certain operation
 | |
| // into metric volume_operation_total_seconds
 | |
| func RecordOperationLatencyMetric(plugin, operationName string, secondsTaken float64) {
 | |
| 	storageOperationEndToEndLatencyMetric.WithLabelValues(plugin, operationName).Observe(secondsTaken)
 | |
| }
 | |
| 
 | |
| // RecordCSIOperationLatencyMetrics records the CSI operation latency and grpc status
 | |
| // into metric csi_kubelet_operations_seconds
 | |
| func RecordCSIOperationLatencyMetrics(driverName string,
 | |
| 	operationName string,
 | |
| 	operationErr error,
 | |
| 	operationDuration time.Duration,
 | |
| 	migrated string) {
 | |
| 	csiOperationsLatencyMetric.WithLabelValues(driverName, operationName, getErrorCode(operationErr), migrated).Observe(operationDuration.Seconds())
 | |
| }
 | |
| 
 | |
| func getErrorCode(err error) string {
 | |
| 	if err == nil {
 | |
| 		return codes.OK.String()
 | |
| 	}
 | |
| 
 | |
| 	st, ok := status.FromError(err)
 | |
| 	if !ok {
 | |
| 		// This is not gRPC error. The operation must have failed before gRPC
 | |
| 		// method was called, otherwise we would get gRPC error.
 | |
| 		return "unknown-non-grpc"
 | |
| 	}
 | |
| 
 | |
| 	return st.Code().String()
 | |
| }
 |