-
Notifications
You must be signed in to change notification settings - Fork 28
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
implemented GetStatsSummary and GetMetricsResource for Virtual Kubelet
- Loading branch information
Showing
4 changed files
with
366 additions
and
20 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
196 changes: 196 additions & 0 deletions
196
k3k-kubelet/provider/collectors/kubelet_resource_metrics.go
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,196 @@ | ||
/* | ||
Copyright (c) Microsoft Corporation. | ||
Licensed under the Apache 2.0 license. | ||
See https://github.com/virtual-kubelet/azure-aci/tree/master/pkg/metrics/collectors | ||
*/ | ||
|
||
package collectors | ||
|
||
import ( | ||
"time" | ||
|
||
stats "github.com/virtual-kubelet/virtual-kubelet/node/api/statsv1alpha1" | ||
compbasemetrics "k8s.io/component-base/metrics" | ||
) | ||
|
||
// defining metrics | ||
var ( | ||
nodeCPUUsageDesc = compbasemetrics.NewDesc("node_cpu_usage_seconds_total", | ||
"Cumulative cpu time consumed by the node in core-seconds", | ||
nil, | ||
nil, | ||
compbasemetrics.ALPHA, | ||
"") | ||
|
||
nodeMemoryUsageDesc = compbasemetrics.NewDesc("node_memory_working_set_bytes", | ||
"Current working set of the node in bytes", | ||
nil, | ||
nil, | ||
compbasemetrics.ALPHA, | ||
"") | ||
|
||
containerCPUUsageDesc = compbasemetrics.NewDesc("container_cpu_usage_seconds_total", | ||
"Cumulative cpu time consumed by the container in core-seconds", | ||
[]string{"container", "pod", "namespace"}, | ||
nil, | ||
compbasemetrics.ALPHA, | ||
"") | ||
|
||
containerMemoryUsageDesc = compbasemetrics.NewDesc("container_memory_working_set_bytes", | ||
"Current working set of the container in bytes", | ||
[]string{"container", "pod", "namespace"}, | ||
nil, | ||
compbasemetrics.ALPHA, | ||
"") | ||
|
||
podCPUUsageDesc = compbasemetrics.NewDesc("pod_cpu_usage_seconds_total", | ||
"Cumulative cpu time consumed by the pod in core-seconds", | ||
[]string{"pod", "namespace"}, | ||
nil, | ||
compbasemetrics.ALPHA, | ||
"") | ||
|
||
podMemoryUsageDesc = compbasemetrics.NewDesc("pod_memory_working_set_bytes", | ||
"Current working set of the pod in bytes", | ||
[]string{"pod", "namespace"}, | ||
nil, | ||
compbasemetrics.ALPHA, | ||
"") | ||
|
||
resourceScrapeResultDesc = compbasemetrics.NewDesc("scrape_error", | ||
"1 if there was an error while getting container metrics, 0 otherwise", | ||
nil, | ||
nil, | ||
compbasemetrics.ALPHA, | ||
"") | ||
|
||
containerStartTimeDesc = compbasemetrics.NewDesc("container_start_time_seconds", | ||
"Start time of the container since unix epoch in seconds", | ||
[]string{"container", "pod", "namespace"}, | ||
nil, | ||
compbasemetrics.ALPHA, | ||
"") | ||
) | ||
|
||
// NewResourceMetricsCollector returns a metrics.StableCollector which exports resource metrics | ||
func NewKubeletResourceMetricsCollector(podStats *stats.Summary) compbasemetrics.StableCollector { | ||
return &resourceMetricsCollector{ | ||
providerPodStats: podStats, | ||
} | ||
} | ||
|
||
type resourceMetricsCollector struct { | ||
compbasemetrics.BaseStableCollector | ||
|
||
providerPodStats *stats.Summary | ||
} | ||
|
||
// Check if resourceMetricsCollector implements necessary interface | ||
var _ compbasemetrics.StableCollector = &resourceMetricsCollector{} | ||
|
||
// DescribeWithStability implements compbasemetrics.StableCollector | ||
func (rc *resourceMetricsCollector) DescribeWithStability(ch chan<- *compbasemetrics.Desc) { | ||
ch <- nodeCPUUsageDesc | ||
ch <- nodeMemoryUsageDesc | ||
ch <- containerStartTimeDesc | ||
ch <- containerCPUUsageDesc | ||
ch <- containerMemoryUsageDesc | ||
ch <- podCPUUsageDesc | ||
ch <- podMemoryUsageDesc | ||
ch <- resourceScrapeResultDesc | ||
} | ||
|
||
// CollectWithStability implements compbasemetrics.StableCollector | ||
// Since new containers are frequently created and removed, using the Gauge would | ||
// leak metric collectors for containers or pods that no longer exist. Instead, implement | ||
// custom collector in a way that only collects metrics for active containers. | ||
func (rc *resourceMetricsCollector) CollectWithStability(ch chan<- compbasemetrics.Metric) { | ||
var errorCount float64 | ||
defer func() { | ||
ch <- compbasemetrics.NewLazyConstMetric(resourceScrapeResultDesc, compbasemetrics.GaugeValue, errorCount) | ||
}() | ||
|
||
statsSummary := *rc.providerPodStats | ||
rc.collectNodeCPUMetrics(ch, statsSummary.Node) | ||
rc.collectNodeMemoryMetrics(ch, statsSummary.Node) | ||
|
||
for _, pod := range statsSummary.Pods { | ||
for _, container := range pod.Containers { | ||
rc.collectContainerStartTime(ch, pod, container) | ||
rc.collectContainerCPUMetrics(ch, pod, container) | ||
rc.collectContainerMemoryMetrics(ch, pod, container) | ||
} | ||
rc.collectPodCPUMetrics(ch, pod) | ||
rc.collectPodMemoryMetrics(ch, pod) | ||
} | ||
} | ||
|
||
// implement collector methods and validate that correct data is used | ||
|
||
func (rc *resourceMetricsCollector) collectNodeCPUMetrics(ch chan<- compbasemetrics.Metric, s stats.NodeStats) { | ||
if s.CPU == nil || s.CPU.UsageCoreNanoSeconds == nil { | ||
return | ||
} | ||
|
||
ch <- compbasemetrics.NewLazyMetricWithTimestamp(s.CPU.Time.Time, | ||
compbasemetrics.NewLazyConstMetric(nodeCPUUsageDesc, compbasemetrics.CounterValue, float64(*s.CPU.UsageCoreNanoSeconds)/float64(time.Second))) | ||
} | ||
|
||
func (rc *resourceMetricsCollector) collectNodeMemoryMetrics(ch chan<- compbasemetrics.Metric, s stats.NodeStats) { | ||
if s.Memory == nil || s.Memory.WorkingSetBytes == nil { | ||
return | ||
} | ||
|
||
ch <- compbasemetrics.NewLazyMetricWithTimestamp(s.Memory.Time.Time, | ||
compbasemetrics.NewLazyConstMetric(nodeMemoryUsageDesc, compbasemetrics.GaugeValue, float64(*s.Memory.WorkingSetBytes))) | ||
} | ||
|
||
func (rc *resourceMetricsCollector) collectContainerStartTime(ch chan<- compbasemetrics.Metric, pod stats.PodStats, s stats.ContainerStats) { | ||
if s.StartTime.Unix() <= 0 { | ||
return | ||
} | ||
|
||
ch <- compbasemetrics.NewLazyMetricWithTimestamp(s.StartTime.Time, | ||
compbasemetrics.NewLazyConstMetric(containerStartTimeDesc, compbasemetrics.GaugeValue, float64(s.StartTime.UnixNano())/float64(time.Second), s.Name, pod.PodRef.Name, pod.PodRef.Namespace)) | ||
} | ||
|
||
func (rc *resourceMetricsCollector) collectContainerCPUMetrics(ch chan<- compbasemetrics.Metric, pod stats.PodStats, s stats.ContainerStats) { | ||
if s.CPU == nil || s.CPU.UsageCoreNanoSeconds == nil { | ||
return | ||
} | ||
|
||
ch <- compbasemetrics.NewLazyMetricWithTimestamp(s.CPU.Time.Time, | ||
compbasemetrics.NewLazyConstMetric(containerCPUUsageDesc, compbasemetrics.CounterValue, | ||
float64(*s.CPU.UsageCoreNanoSeconds)/float64(time.Second), s.Name, pod.PodRef.Name, pod.PodRef.Namespace)) | ||
} | ||
|
||
func (rc *resourceMetricsCollector) collectContainerMemoryMetrics(ch chan<- compbasemetrics.Metric, pod stats.PodStats, s stats.ContainerStats) { | ||
if s.Memory == nil || s.Memory.WorkingSetBytes == nil { | ||
return | ||
} | ||
|
||
ch <- compbasemetrics.NewLazyMetricWithTimestamp(s.Memory.Time.Time, | ||
compbasemetrics.NewLazyConstMetric(containerMemoryUsageDesc, compbasemetrics.GaugeValue, | ||
float64(*s.Memory.WorkingSetBytes), s.Name, pod.PodRef.Name, pod.PodRef.Namespace)) | ||
} | ||
|
||
func (rc *resourceMetricsCollector) collectPodCPUMetrics(ch chan<- compbasemetrics.Metric, pod stats.PodStats) { | ||
if pod.CPU == nil || pod.CPU.UsageCoreNanoSeconds == nil { | ||
return | ||
} | ||
|
||
ch <- compbasemetrics.NewLazyMetricWithTimestamp(pod.CPU.Time.Time, | ||
compbasemetrics.NewLazyConstMetric(podCPUUsageDesc, compbasemetrics.CounterValue, | ||
float64(*pod.CPU.UsageCoreNanoSeconds)/float64(time.Second), pod.PodRef.Name, pod.PodRef.Namespace)) | ||
} | ||
|
||
func (rc *resourceMetricsCollector) collectPodMemoryMetrics(ch chan<- compbasemetrics.Metric, pod stats.PodStats) { | ||
if pod.Memory == nil || pod.Memory.WorkingSetBytes == nil { | ||
return | ||
} | ||
|
||
ch <- compbasemetrics.NewLazyMetricWithTimestamp(pod.Memory.Time.Time, | ||
compbasemetrics.NewLazyConstMetric(podMemoryUsageDesc, compbasemetrics.GaugeValue, | ||
float64(*pod.Memory.WorkingSetBytes), pod.PodRef.Name, pod.PodRef.Namespace)) | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.