Add network plugin metrics. The metrics are the same ones that were used in dockershim/kubelet until it was deprecated in Kubernetes 1.23: https://github.com/kubernetes/kubernetes/blob/release-1.23/pkg/kubelet/dockershim/network/metrics/metrics.go Signed-off-by: Antonio Ojea <aojea@google.com>
		
			
				
	
	
		
			91 lines
		
	
	
		
			3.9 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			91 lines
		
	
	
		
			3.9 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
/*
 | 
						|
   Copyright The containerd Authors.
 | 
						|
 | 
						|
   Licensed under the Apache License, Version 2.0 (the "License");
 | 
						|
   you may not use this file except in compliance with the License.
 | 
						|
   You may obtain a copy of the License at
 | 
						|
 | 
						|
       http://www.apache.org/licenses/LICENSE-2.0
 | 
						|
 | 
						|
   Unless required by applicable law or agreed to in writing, software
 | 
						|
   distributed under the License is distributed on an "AS IS" BASIS,
 | 
						|
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | 
						|
   See the License for the specific language governing permissions and
 | 
						|
   limitations under the License.
 | 
						|
*/
 | 
						|
 | 
						|
package server
 | 
						|
 | 
						|
import (
 | 
						|
	metrics "github.com/docker/go-metrics"
 | 
						|
	prom "github.com/prometheus/client_golang/prometheus"
 | 
						|
)
 | 
						|
 | 
						|
var (
 | 
						|
	sandboxListTimer          metrics.Timer
 | 
						|
	sandboxCreateNetworkTimer metrics.Timer
 | 
						|
	sandboxDeleteNetwork      metrics.Timer
 | 
						|
 | 
						|
	sandboxRuntimeCreateTimer metrics.LabeledTimer
 | 
						|
	sandboxRuntimeStopTimer   metrics.LabeledTimer
 | 
						|
	sandboxRemoveTimer        metrics.LabeledTimer
 | 
						|
 | 
						|
	containerListTimer   metrics.Timer
 | 
						|
	containerRemoveTimer metrics.LabeledTimer
 | 
						|
	containerCreateTimer metrics.LabeledTimer
 | 
						|
	containerStopTimer   metrics.LabeledTimer
 | 
						|
	containerStartTimer  metrics.LabeledTimer
 | 
						|
 | 
						|
	networkPluginOperations        metrics.LabeledCounter
 | 
						|
	networkPluginOperationsErrors  metrics.LabeledCounter
 | 
						|
	networkPluginOperationsLatency metrics.LabeledTimer
 | 
						|
 | 
						|
	imagePulls           metrics.LabeledCounter
 | 
						|
	inProgressImagePulls metrics.Gauge
 | 
						|
	//  pull duration / (image size / 1MBi)
 | 
						|
	imagePullThroughput prom.Histogram
 | 
						|
)
 | 
						|
 | 
						|
func init() {
 | 
						|
	// these CRI metrics record latencies for successful operations around a sandbox and container's lifecycle.
 | 
						|
	ns := metrics.NewNamespace("containerd", "cri", nil)
 | 
						|
 | 
						|
	sandboxListTimer = ns.NewTimer("sandbox_list", "time to list sandboxes")
 | 
						|
	sandboxCreateNetworkTimer = ns.NewTimer("sandbox_create_network", "time to create the network for a sandbox")
 | 
						|
	sandboxDeleteNetwork = ns.NewTimer("sandbox_delete_network", "time to delete a sandbox's network")
 | 
						|
 | 
						|
	sandboxRuntimeCreateTimer = ns.NewLabeledTimer("sandbox_runtime_create", "time to create a sandbox in the runtime", "runtime")
 | 
						|
	sandboxRuntimeStopTimer = ns.NewLabeledTimer("sandbox_runtime_stop", "time to stop a sandbox", "runtime")
 | 
						|
	sandboxRemoveTimer = ns.NewLabeledTimer("sandbox_remove", "time to remove a sandbox", "runtime")
 | 
						|
 | 
						|
	containerListTimer = ns.NewTimer("container_list", "time to list containers")
 | 
						|
	containerRemoveTimer = ns.NewLabeledTimer("container_remove", "time to remove a container", "runtime")
 | 
						|
	containerCreateTimer = ns.NewLabeledTimer("container_create", "time to create a container", "runtime")
 | 
						|
	containerStopTimer = ns.NewLabeledTimer("container_stop", "time to stop a container", "runtime")
 | 
						|
	containerStartTimer = ns.NewLabeledTimer("container_start", "time to start a container", "runtime")
 | 
						|
 | 
						|
	networkPluginOperations = ns.NewLabeledCounter("network_plugin_operations_total", "cumulative number of network plugin operations by operation type", "operation_type")
 | 
						|
	networkPluginOperationsErrors = ns.NewLabeledCounter("network_plugin_operations_errors_total", "cumulative number of network plugin operations by operation type", "operation_type")
 | 
						|
	networkPluginOperationsLatency = ns.NewLabeledTimer("network_plugin_operations_duration_seconds", "latency in seconds of network plugin operations. Broken down by operation type", "operation_type")
 | 
						|
 | 
						|
	imagePulls = ns.NewLabeledCounter("image_pulls", "succeeded and failed counters", "status")
 | 
						|
	inProgressImagePulls = ns.NewGauge("in_progress_image_pulls", "in progress pulls", metrics.Total)
 | 
						|
	imagePullThroughput = prom.NewHistogram(
 | 
						|
		prom.HistogramOpts{
 | 
						|
			Name:    "image_pulling_throughput",
 | 
						|
			Help:    "image pull throughput",
 | 
						|
			Buckets: prom.DefBuckets,
 | 
						|
		},
 | 
						|
	)
 | 
						|
 | 
						|
	metrics.Register(ns)
 | 
						|
}
 | 
						|
 | 
						|
// Network plugin operation names. The values are kept for backwards
// compatibility with the kubelet/dockershim metrics; see
// https://github.com/containerd/containerd/issues/7801
const (
	// networkStatusOp names the "get pod network status" operation.
	networkStatusOp = "get_pod_network_status"

	// networkSetUpOp names the "set up pod" operation.
	networkSetUpOp = "set_up_pod"

	// networkTearDownOp names the "tear down pod" operation.
	networkTearDownOp = "tear_down_pod"
)
 |