Add runtime label to metrics

Signed-off-by: Maksym Pavlenko <pavlenko.maksym@gmail.com>
This commit is contained in:
Maksym Pavlenko 2021-07-23 10:04:46 -07:00
parent 34fb8d8967
commit efa8ab7158
6 changed files with 65 additions and 31 deletions

View File

@ -29,7 +29,7 @@ import (
"github.com/containerd/containerd/namespaces" "github.com/containerd/containerd/namespaces"
"github.com/containerd/containerd/runtime" "github.com/containerd/containerd/runtime"
"github.com/containerd/containerd/runtime/v1/linux" "github.com/containerd/containerd/runtime/v1/linux"
metrics "github.com/docker/go-metrics" "github.com/docker/go-metrics"
"github.com/sirupsen/logrus" "github.com/sirupsen/logrus"
) )
@ -55,8 +55,8 @@ type cgroupsMonitor struct {
publisher events.Publisher publisher events.Publisher
} }
func (m *cgroupsMonitor) Monitor(c runtime.Task) error { func (m *cgroupsMonitor) Monitor(c runtime.Task, labels map[string]string) error {
if err := m.collector.Add(c); err != nil { if err := m.collector.Add(c, labels); err != nil {
return err return err
} }
t, ok := c.(*linux.Task) t, ok := c.(*linux.Task)

View File

@ -28,7 +28,7 @@ import (
v1 "github.com/containerd/containerd/metrics/types/v1" v1 "github.com/containerd/containerd/metrics/types/v1"
"github.com/containerd/containerd/namespaces" "github.com/containerd/containerd/namespaces"
"github.com/containerd/typeurl" "github.com/containerd/typeurl"
metrics "github.com/docker/go-metrics" "github.com/docker/go-metrics"
"github.com/gogo/protobuf/types" "github.com/gogo/protobuf/types"
"github.com/prometheus/client_golang/prometheus" "github.com/prometheus/client_golang/prometheus"
) )
@ -53,7 +53,7 @@ func NewCollector(ns *metrics.Namespace) *Collector {
// add machine cpus and memory info // add machine cpus and memory info
c := &Collector{ c := &Collector{
ns: ns, ns: ns,
tasks: make(map[string]Statable), tasks: make(map[string]entry),
} }
c.metrics = append(c.metrics, pidMetrics...) c.metrics = append(c.metrics, pidMetrics...)
c.metrics = append(c.metrics, cpuMetrics...) c.metrics = append(c.metrics, cpuMetrics...)
@ -69,12 +69,19 @@ func taskID(id, namespace string) string {
return fmt.Sprintf("%s-%s", id, namespace) return fmt.Sprintf("%s-%s", id, namespace)
} }
type entry struct {
task Statable
// ns is an optional child namespace that contains additional to parent labels.
// This can be used to append task specific labels to be able to differentiate the different containerd metrics.
ns *metrics.Namespace
}
// Collector provides the ability to collect container stats and export // Collector provides the ability to collect container stats and export
// them in the prometheus format // them in the prometheus format
type Collector struct { type Collector struct {
mu sync.RWMutex mu sync.RWMutex
tasks map[string]Statable tasks map[string]entry
ns *metrics.Namespace ns *metrics.Namespace
metrics []*metric metrics []*metric
storedMetrics chan prometheus.Metric storedMetrics chan prometheus.Metric
@ -109,10 +116,11 @@ storedLoop:
wg.Wait() wg.Wait()
} }
func (c *Collector) collect(t Statable, ch chan<- prometheus.Metric, block bool, wg *sync.WaitGroup) { func (c *Collector) collect(entry entry, ch chan<- prometheus.Metric, block bool, wg *sync.WaitGroup) {
if wg != nil { if wg != nil {
defer wg.Done() defer wg.Done()
} }
t := entry.task
ctx := namespaces.WithNamespace(context.Background(), t.Namespace()) ctx := namespaces.WithNamespace(context.Background(), t.Namespace())
stats, err := t.Stats(ctx) stats, err := t.Stats(ctx)
if err != nil { if err != nil {
@ -129,13 +137,17 @@ func (c *Collector) collect(t Statable, ch chan<- prometheus.Metric, block bool,
log.L.WithError(err).Errorf("invalid metric type for %s", t.ID()) log.L.WithError(err).Errorf("invalid metric type for %s", t.ID())
return return
} }
ns := entry.ns
if ns == nil {
ns = c.ns
}
for _, m := range c.metrics { for _, m := range c.metrics {
m.collect(t.ID(), t.Namespace(), s, c.ns, ch, block) m.collect(t.ID(), t.Namespace(), s, ns, ch, block)
} }
} }
// Add adds the provided cgroup and id so that metrics are collected and exported // Add adds the provided cgroup and id so that metrics are collected and exported
func (c *Collector) Add(t Statable) error { func (c *Collector) Add(t Statable, labels map[string]string) error {
if c.ns == nil { if c.ns == nil {
return nil return nil
} }
@ -145,7 +157,11 @@ func (c *Collector) Add(t Statable) error {
if _, ok := c.tasks[id]; ok { if _, ok := c.tasks[id]; ok {
return nil // requests to collect metrics should be idempotent return nil // requests to collect metrics should be idempotent
} }
c.tasks[id] = t entry := entry{task: t}
if labels != nil {
entry.ns = c.ns.WithConstLabels(labels)
}
c.tasks[id] = entry
return nil return nil
} }
@ -165,6 +181,6 @@ func (c *Collector) RemoveAll() {
return return
} }
c.mu.Lock() c.mu.Lock()
c.tasks = make(map[string]Statable) c.tasks = make(map[string]entry)
c.mu.Unlock() c.mu.Unlock()
} }

View File

@ -23,7 +23,7 @@ import (
"github.com/containerd/containerd/events" "github.com/containerd/containerd/events"
"github.com/containerd/containerd/runtime" "github.com/containerd/containerd/runtime"
metrics "github.com/docker/go-metrics" "github.com/docker/go-metrics"
) )
// NewTaskMonitor returns a new cgroups monitor // NewTaskMonitor returns a new cgroups monitor
@ -42,8 +42,8 @@ type cgroupsMonitor struct {
publisher events.Publisher publisher events.Publisher
} }
func (m *cgroupsMonitor) Monitor(c runtime.Task) error { func (m *cgroupsMonitor) Monitor(c runtime.Task, labels map[string]string) error {
if err := m.collector.Add(c); err != nil { if err := m.collector.Add(c, labels); err != nil {
return err return err
} }
return nil return nil

View File

@ -27,7 +27,7 @@ import (
v2 "github.com/containerd/containerd/metrics/types/v2" v2 "github.com/containerd/containerd/metrics/types/v2"
"github.com/containerd/containerd/namespaces" "github.com/containerd/containerd/namespaces"
"github.com/containerd/typeurl" "github.com/containerd/typeurl"
metrics "github.com/docker/go-metrics" "github.com/docker/go-metrics"
"github.com/gogo/protobuf/types" "github.com/gogo/protobuf/types"
"github.com/prometheus/client_golang/prometheus" "github.com/prometheus/client_golang/prometheus"
) )
@ -47,7 +47,7 @@ func NewCollector(ns *metrics.Namespace) *Collector {
} }
c := &Collector{ c := &Collector{
ns: ns, ns: ns,
tasks: make(map[string]Statable), tasks: make(map[string]entry),
} }
c.metrics = append(c.metrics, pidMetrics...) c.metrics = append(c.metrics, pidMetrics...)
c.metrics = append(c.metrics, cpuMetrics...) c.metrics = append(c.metrics, cpuMetrics...)
@ -62,12 +62,19 @@ func taskID(id, namespace string) string {
return fmt.Sprintf("%s-%s", id, namespace) return fmt.Sprintf("%s-%s", id, namespace)
} }
type entry struct {
task Statable
// ns is an optional child namespace that contains additional to parent labels.
// This can be used to append task specific labels to be able to differentiate the different containerd metrics.
ns *metrics.Namespace
}
// Collector provides the ability to collect container stats and export // Collector provides the ability to collect container stats and export
// them in the prometheus format // them in the prometheus format
type Collector struct { type Collector struct {
mu sync.RWMutex mu sync.RWMutex
tasks map[string]Statable tasks map[string]entry
ns *metrics.Namespace ns *metrics.Namespace
metrics []*metric metrics []*metric
storedMetrics chan prometheus.Metric storedMetrics chan prometheus.Metric
@ -102,10 +109,11 @@ storedLoop:
wg.Wait() wg.Wait()
} }
func (c *Collector) collect(t Statable, ch chan<- prometheus.Metric, block bool, wg *sync.WaitGroup) { func (c *Collector) collect(entry entry, ch chan<- prometheus.Metric, block bool, wg *sync.WaitGroup) {
if wg != nil { if wg != nil {
defer wg.Done() defer wg.Done()
} }
t := entry.task
ctx := namespaces.WithNamespace(context.Background(), t.Namespace()) ctx := namespaces.WithNamespace(context.Background(), t.Namespace())
stats, err := t.Stats(ctx) stats, err := t.Stats(ctx)
if err != nil { if err != nil {
@ -122,13 +130,17 @@ func (c *Collector) collect(t Statable, ch chan<- prometheus.Metric, block bool,
log.L.WithError(err).Errorf("invalid metric type for %s", t.ID()) log.L.WithError(err).Errorf("invalid metric type for %s", t.ID())
return return
} }
ns := entry.ns
if ns == nil {
ns = c.ns
}
for _, m := range c.metrics { for _, m := range c.metrics {
m.collect(t.ID(), t.Namespace(), s, c.ns, ch, block) m.collect(t.ID(), t.Namespace(), s, ns, ch, block)
} }
} }
// Add adds the provided cgroup and id so that metrics are collected and exported // Add adds the provided cgroup and id so that metrics are collected and exported
func (c *Collector) Add(t Statable) error { func (c *Collector) Add(t Statable, labels map[string]string) error {
if c.ns == nil { if c.ns == nil {
return nil return nil
} }
@ -138,7 +150,11 @@ func (c *Collector) Add(t Statable) error {
if _, ok := c.tasks[id]; ok { if _, ok := c.tasks[id]; ok {
return nil // requests to collect metrics should be idempotent return nil // requests to collect metrics should be idempotent
} }
c.tasks[id] = t entry := entry{task: t}
if labels != nil {
entry.ns = c.ns.WithConstLabels(labels)
}
c.tasks[id] = entry
return nil return nil
} }
@ -158,6 +174,6 @@ func (c *Collector) RemoveAll() {
return return
} }
c.mu.Lock() c.mu.Lock()
c.tasks = make(map[string]Statable) c.tasks = make(map[string]entry)
c.mu.Unlock() c.mu.Unlock()
} }

View File

@ -18,10 +18,11 @@ package runtime
// TaskMonitor provides an interface for monitoring of containers within containerd // TaskMonitor provides an interface for monitoring of containers within containerd
type TaskMonitor interface { type TaskMonitor interface {
// Monitor adds the provided container to the monitor // Monitor adds the provided container to the monitor.
Monitor(Task) error // Labels are optional (can be nil) key value pairs to be added to the metrics namespace.
Monitor(task Task, labels map[string]string) error
// Stop stops and removes the provided container from the monitor // Stop stops and removes the provided container from the monitor
Stop(Task) error Stop(task Task) error
} }
// NewMultiTaskMonitor returns a new TaskMonitor broadcasting to the provided monitors // NewMultiTaskMonitor returns a new TaskMonitor broadcasting to the provided monitors
@ -39,7 +40,7 @@ func NewNoopMonitor() TaskMonitor {
type noopTaskMonitor struct { type noopTaskMonitor struct {
} }
func (mm *noopTaskMonitor) Monitor(c Task) error { func (mm *noopTaskMonitor) Monitor(c Task, labels map[string]string) error {
return nil return nil
} }
@ -51,9 +52,9 @@ type multiTaskMonitor struct {
monitors []TaskMonitor monitors []TaskMonitor
} }
func (mm *multiTaskMonitor) Monitor(c Task) error { func (mm *multiTaskMonitor) Monitor(task Task, labels map[string]string) error {
for _, m := range mm.monitors { for _, m := range mm.monitors {
if err := m.Monitor(c); err != nil { if err := m.Monitor(task, labels); err != nil {
return err return err
} }
} }

View File

@ -115,7 +115,7 @@ func initFunc(ic *plugin.InitContext) (interface{}, error) {
return nil, err return nil, err
} }
for _, t := range tasks { for _, t := range tasks {
l.monitor.Monitor(t) l.monitor.Monitor(t, nil)
} }
} }
v2Tasks, err := l.v2Runtime.Tasks(ic.Context, true) v2Tasks, err := l.v2Runtime.Tasks(ic.Context, true)
@ -123,7 +123,7 @@ func initFunc(ic *plugin.InitContext) (interface{}, error) {
return nil, err return nil, err
} }
for _, t := range v2Tasks { for _, t := range v2Tasks {
l.monitor.Monitor(t) l.monitor.Monitor(t, nil)
} }
return l, nil return l, nil
} }
@ -211,7 +211,8 @@ func (l *local) Create(ctx context.Context, r *api.CreateTaskRequest, _ ...grpc.
if err != nil { if err != nil {
return nil, errdefs.ToGRPC(err) return nil, errdefs.ToGRPC(err)
} }
if err := l.monitor.Monitor(c); err != nil { labels := map[string]string{"runtime": container.Runtime.Name}
if err := l.monitor.Monitor(c, labels); err != nil {
return nil, errors.Wrap(err, "monitor task") return nil, errors.Wrap(err, "monitor task")
} }
return &api.CreateTaskResponse{ return &api.CreateTaskResponse{