456 lines
14 KiB
Go
456 lines
14 KiB
Go
/*
|
|
Copyright 2020 KubeSphere Authors
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package metricsserver
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"time"
|
|
|
|
"k8s.io/api/core/v1"
|
|
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
|
|
"k8s.io/client-go/kubernetes"
|
|
"k8s.io/client-go/tools/clientcmd"
|
|
"k8s.io/klog"
|
|
|
|
promlabels "github.com/prometheus/prometheus/pkg/labels"
|
|
metricsapi "k8s.io/metrics/pkg/apis/metrics"
|
|
metricsV1beta1 "k8s.io/metrics/pkg/apis/metrics/v1beta1"
|
|
metricsclient "k8s.io/metrics/pkg/client/clientset/versioned"
|
|
|
|
"kubesphere.io/kubesphere/pkg/simple/client/k8s"
|
|
"kubesphere.io/kubesphere/pkg/simple/client/monitoring"
|
|
)
|
|
|
|
// metricsServer implements monitoring interface backend by metrics-server
|
|
type metricsServer struct {
|
|
metricsAPIAvailable bool
|
|
metricsClient metricsclient.Interface
|
|
k8s kubernetes.Interface
|
|
}
|
|
|
|
var (
|
|
supportedMetricsAPIs = map[string]bool{
|
|
"v1beta1": true,
|
|
}
|
|
)
|
|
|
|
const edgeNodeLabel = "node-role.kubernetes.io/edge"
|
|
|
|
func metricsAPISupported(discoveredAPIGroups *metav1.APIGroupList) bool {
|
|
for _, discoveredAPIGroup := range discoveredAPIGroups.Groups {
|
|
if discoveredAPIGroup.Name != metricsapi.GroupName {
|
|
continue
|
|
}
|
|
for _, version := range discoveredAPIGroup.Versions {
|
|
if _, found := supportedMetricsAPIs[version.Version]; found {
|
|
return true
|
|
}
|
|
}
|
|
}
|
|
return false
|
|
}
|
|
|
|
func (m metricsServer) listEdgeNodes() (map[string]v1.Node, error) {
|
|
nodes := make(map[string]v1.Node)
|
|
|
|
nodeClient := m.k8s.CoreV1()
|
|
|
|
nodeList, err := nodeClient.Nodes().List(context.TODO(), metav1.ListOptions{
|
|
LabelSelector: edgeNodeLabel,
|
|
})
|
|
if err != nil {
|
|
return nodes, err
|
|
}
|
|
|
|
for _, n := range nodeList.Items {
|
|
nodes[n.Name] = n
|
|
}
|
|
|
|
return nodes, nil
|
|
}
|
|
|
|
func (m metricsServer) filterEdgeNodeNames(edgeNodes map[string]v1.Node, opts *monitoring.QueryOptions) map[string]bool {
|
|
edgeNodeNamesFiltered := make(map[string]bool)
|
|
|
|
regexMatcher, err := promlabels.NewMatcher(promlabels.MatchRegexp, "edgenodefilter", opts.ResourceFilter)
|
|
|
|
if err != nil {
|
|
klog.Errorf("Edge node filter regexp error %v\n", err)
|
|
return edgeNodeNamesFiltered
|
|
}
|
|
|
|
for _, n := range edgeNodes {
|
|
if regexMatcher.Matches(n.Name) {
|
|
edgeNodeNamesFiltered[n.Name] = true
|
|
}
|
|
}
|
|
|
|
return edgeNodeNamesFiltered
|
|
}
|
|
|
|
func (m metricsServer) getNodeMetricsFromMetricsAPI() (*metricsapi.NodeMetricsList, error) {
|
|
var err error
|
|
versionedMetrics := &metricsV1beta1.NodeMetricsList{}
|
|
mc := m.metricsClient.MetricsV1beta1()
|
|
nm := mc.NodeMetricses()
|
|
versionedMetrics, err = nm.List(context.TODO(), metav1.ListOptions{LabelSelector: edgeNodeLabel})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
metrics := &metricsapi.NodeMetricsList{}
|
|
err = metricsV1beta1.Convert_v1beta1_NodeMetricsList_To_metrics_NodeMetricsList(versionedMetrics, metrics, nil)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return metrics, nil
|
|
}
|
|
|
|
func NewMetricsClient(k kubernetes.Interface, options *k8s.KubernetesOptions) monitoring.Interface {
|
|
config, err := clientcmd.BuildConfigFromFlags("", options.KubeConfig)
|
|
if err != nil {
|
|
klog.Error(err)
|
|
return nil
|
|
}
|
|
|
|
discoveryClient := k.Discovery()
|
|
apiGroups, err := discoveryClient.ServerGroups()
|
|
if err != nil {
|
|
klog.Error(err)
|
|
return nil
|
|
}
|
|
|
|
metricsAPIAvailable := metricsAPISupported(apiGroups)
|
|
|
|
if !metricsAPIAvailable {
|
|
klog.Warningf("Metrics API not available.")
|
|
return nil
|
|
}
|
|
|
|
metricsClient, err := metricsclient.NewForConfig(config)
|
|
if err != nil {
|
|
klog.Error(err)
|
|
return nil
|
|
}
|
|
|
|
return NewMetricsServer(k, metricsAPIAvailable, metricsClient)
|
|
}
|
|
|
|
func NewMetricsServer(k kubernetes.Interface, a bool, m metricsclient.Interface) monitoring.Interface {
|
|
var metricsServer metricsServer
|
|
|
|
metricsServer.k8s = k
|
|
metricsServer.metricsAPIAvailable = a
|
|
metricsServer.metricsClient = m
|
|
|
|
return metricsServer
|
|
}
|
|
|
|
func (m metricsServer) GetMetric(expr string, ts time.Time) monitoring.Metric {
|
|
var parsedResp monitoring.Metric
|
|
|
|
return parsedResp
|
|
}
|
|
|
|
func (m metricsServer) GetMetricOverTime(expr string, start, end time.Time, step time.Duration) monitoring.Metric {
|
|
var parsedResp monitoring.Metric
|
|
|
|
return parsedResp
|
|
}
|
|
|
|
const (
|
|
metricsNodeCPUUsage = "node_cpu_usage"
|
|
metricsNodeCPUTotal = "node_cpu_total"
|
|
metricsNodeCPUUltilisation = "node_cpu_utilisation"
|
|
metricsNodeMemoryUsageWoCache = "node_memory_usage_wo_cache"
|
|
metricsNodeMemoryTotal = "node_memory_total"
|
|
metricsNodeMemoryUltilisation = "node_memory_utilisation"
|
|
)
|
|
|
|
var edgeNodeMetrics = []string{metricsNodeCPUUsage, metricsNodeCPUTotal, metricsNodeCPUUltilisation, metricsNodeMemoryUsageWoCache, metricsNodeMemoryTotal, metricsNodeMemoryUltilisation}
|
|
|
|
func (m metricsServer) parseErrorResp(metrics []string, err error) []monitoring.Metric {
|
|
var res []monitoring.Metric
|
|
|
|
for _, metric := range metrics {
|
|
parsedResp := monitoring.Metric{MetricName: metric}
|
|
parsedResp.Error = err.Error()
|
|
}
|
|
|
|
return res
|
|
}
|
|
|
|
func (m metricsServer) GetNamedMetrics(metrics []string, ts time.Time, o monitoring.QueryOption) []monitoring.Metric {
|
|
var res []monitoring.Metric
|
|
|
|
opts := monitoring.NewQueryOptions()
|
|
o.Apply(opts)
|
|
if opts.Level == monitoring.LevelNode {
|
|
if !m.metricsAPIAvailable {
|
|
klog.Warningf("Metrics API not available.")
|
|
return m.parseErrorResp(metrics, errors.New("Metrics API not available."))
|
|
}
|
|
|
|
edgeNodes, err := m.listEdgeNodes()
|
|
if err != nil {
|
|
klog.Errorf("List edge nodes error %v\n", err)
|
|
return m.parseErrorResp(metrics, err)
|
|
}
|
|
|
|
edgeNodeNamesFiltered := m.filterEdgeNodeNames(edgeNodes, opts)
|
|
if len(edgeNodeNamesFiltered) == 0 {
|
|
klog.V(4).Infof("No edge node metrics is requested")
|
|
return res
|
|
}
|
|
|
|
metricsResult, err := m.getNodeMetricsFromMetricsAPI()
|
|
if err != nil {
|
|
klog.Errorf("Get edge node metrics error %v\n", err)
|
|
return m.parseErrorResp(metrics, err)
|
|
}
|
|
|
|
metricsMap := make(map[string]bool)
|
|
for _, m := range metrics {
|
|
metricsMap[m] = true
|
|
}
|
|
|
|
status := make(map[string]v1.NodeStatus)
|
|
for n, _ := range edgeNodeNamesFiltered {
|
|
status[n] = edgeNodes[n].Status
|
|
}
|
|
|
|
nodeMetrics := make(map[string]*monitoring.MetricData)
|
|
for _, enm := range edgeNodeMetrics {
|
|
_, ok := metricsMap[enm]
|
|
if ok {
|
|
nodeMetrics[enm] = &monitoring.MetricData{MetricType: monitoring.MetricTypeVector}
|
|
}
|
|
}
|
|
|
|
var usage v1.ResourceList
|
|
var cap v1.ResourceList
|
|
for _, m := range metricsResult.Items {
|
|
_, ok := edgeNodeNamesFiltered[m.Name]
|
|
if !ok {
|
|
continue
|
|
}
|
|
|
|
m.Usage.DeepCopyInto(&usage)
|
|
status[m.Name].Capacity.DeepCopyInto(&cap)
|
|
|
|
metricValues := make(map[string]*monitoring.MetricValue)
|
|
|
|
for _, enm := range edgeNodeMetrics {
|
|
metricValues[enm] = &monitoring.MetricValue{
|
|
Metadata: make(map[string]string),
|
|
}
|
|
metricValues[enm].Metadata["node"] = m.Name
|
|
metricValues[enm].Metadata["role"] = "edge"
|
|
}
|
|
for _, addr := range status[m.Name].Addresses {
|
|
if addr.Type == v1.NodeInternalIP {
|
|
for _, enm := range edgeNodeMetrics {
|
|
metricValues[enm].Metadata["host_ip"] = addr.Address
|
|
}
|
|
break
|
|
}
|
|
}
|
|
|
|
_, ok = metricsMap[metricsNodeCPUUsage]
|
|
if ok {
|
|
metricValues[metricsNodeCPUUsage].Sample = &monitoring.Point{float64(m.Timestamp.Unix()), float64(usage.Cpu().MilliValue()) / 1000}
|
|
}
|
|
_, ok = metricsMap[metricsNodeCPUTotal]
|
|
if ok {
|
|
metricValues[metricsNodeCPUTotal].Sample = &monitoring.Point{float64(m.Timestamp.Unix()), float64(cap.Cpu().MilliValue()) / 1000}
|
|
}
|
|
_, ok = metricsMap[metricsNodeCPUUltilisation]
|
|
if ok {
|
|
metricValues[metricsNodeCPUUltilisation].Sample = &monitoring.Point{float64(m.Timestamp.Unix()), float64(usage.Cpu().MilliValue()) / float64(cap.Cpu().MilliValue())}
|
|
}
|
|
_, ok = metricsMap[metricsNodeMemoryUsageWoCache]
|
|
if ok {
|
|
metricValues[metricsNodeMemoryUsageWoCache].Sample = &monitoring.Point{float64(m.Timestamp.Unix()), float64(usage.Memory().Value())}
|
|
}
|
|
_, ok = metricsMap[metricsNodeMemoryTotal]
|
|
if ok {
|
|
metricValues[metricsNodeMemoryTotal].Sample = &monitoring.Point{float64(m.Timestamp.Unix()), float64(cap.Memory().Value())}
|
|
}
|
|
_, ok = metricsMap[metricsNodeMemoryUltilisation]
|
|
if ok {
|
|
metricValues[metricsNodeMemoryUltilisation].Sample = &monitoring.Point{float64(m.Timestamp.Unix()), float64(usage.Memory().Value()) / float64(cap.Memory().Value())}
|
|
}
|
|
|
|
for _, enm := range edgeNodeMetrics {
|
|
_, ok = metricsMap[enm]
|
|
if ok {
|
|
nodeMetrics[enm].MetricValues = append(nodeMetrics[enm].MetricValues, *metricValues[enm])
|
|
}
|
|
}
|
|
}
|
|
|
|
for _, enm := range edgeNodeMetrics {
|
|
_, ok := metricsMap[enm]
|
|
if ok {
|
|
res = append(res, monitoring.Metric{MetricName: enm, MetricData: *nodeMetrics[enm]})
|
|
}
|
|
}
|
|
}
|
|
|
|
return res
|
|
}
|
|
|
|
func (m metricsServer) GetNamedMetricsOverTime(metrics []string, start, end time.Time, step time.Duration, o monitoring.QueryOption) []monitoring.Metric {
|
|
var res []monitoring.Metric
|
|
|
|
opts := monitoring.NewQueryOptions()
|
|
o.Apply(opts)
|
|
if opts.Level == monitoring.LevelNode {
|
|
if !m.metricsAPIAvailable {
|
|
klog.Warningf("Metrics API not available.")
|
|
return m.parseErrorResp(metrics, errors.New("Metrics API not available."))
|
|
}
|
|
|
|
edgeNodes, err := m.listEdgeNodes()
|
|
if err != nil {
|
|
klog.Errorf("List edge nodes error %v\n", err)
|
|
return m.parseErrorResp(metrics, err)
|
|
}
|
|
|
|
edgeNodeNamesFiltered := m.filterEdgeNodeNames(edgeNodes, opts)
|
|
if len(edgeNodeNamesFiltered) == 0 {
|
|
klog.V(4).Infof("No edge node metrics is requested")
|
|
return res
|
|
}
|
|
|
|
metricsResult, err := m.getNodeMetricsFromMetricsAPI()
|
|
if err != nil {
|
|
klog.Errorf("Get edge node metrics error %v\n", err)
|
|
return m.parseErrorResp(metrics, err)
|
|
}
|
|
|
|
metricsMap := make(map[string]bool)
|
|
for _, m := range metrics {
|
|
metricsMap[m] = true
|
|
}
|
|
|
|
status := make(map[string]v1.NodeStatus)
|
|
for n, _ := range edgeNodeNamesFiltered {
|
|
status[n] = edgeNodes[n].Status
|
|
}
|
|
|
|
nodeMetrics := make(map[string]*monitoring.MetricData)
|
|
for _, enm := range edgeNodeMetrics {
|
|
_, ok := metricsMap[enm]
|
|
if ok {
|
|
nodeMetrics[enm] = &monitoring.MetricData{MetricType: monitoring.MetricTypeMatrix}
|
|
}
|
|
}
|
|
|
|
var usage v1.ResourceList
|
|
var cap v1.ResourceList
|
|
for _, m := range metricsResult.Items {
|
|
_, ok := edgeNodeNamesFiltered[m.Name]
|
|
if !ok {
|
|
continue
|
|
}
|
|
|
|
m.Usage.DeepCopyInto(&usage)
|
|
status[m.Name].Capacity.DeepCopyInto(&cap)
|
|
|
|
metricValues := make(map[string]*monitoring.MetricValue)
|
|
|
|
for _, enm := range edgeNodeMetrics {
|
|
metricValues[enm] = &monitoring.MetricValue{
|
|
Metadata: make(map[string]string),
|
|
}
|
|
metricValues[enm].Metadata["node"] = m.Name
|
|
metricValues[enm].Metadata["role"] = "edge"
|
|
}
|
|
for _, addr := range status[m.Name].Addresses {
|
|
if addr.Type == v1.NodeInternalIP {
|
|
for _, enm := range edgeNodeMetrics {
|
|
metricValues[enm].Metadata["host_ip"] = addr.Address
|
|
}
|
|
break
|
|
}
|
|
}
|
|
|
|
_, ok = metricsMap[metricsNodeCPUUsage]
|
|
if ok {
|
|
metricValues[metricsNodeCPUUsage].Series = append(metricValues[metricsNodeCPUUsage].Series, monitoring.Point{float64(m.Timestamp.Unix()), float64(usage.Cpu().MilliValue()) / 1000})
|
|
}
|
|
_, ok = metricsMap[metricsNodeCPUTotal]
|
|
if ok {
|
|
metricValues[metricsNodeCPUTotal].Series = append(metricValues[metricsNodeCPUTotal].Series, monitoring.Point{float64(m.Timestamp.Unix()), float64(cap.Cpu().MilliValue()) / 1000})
|
|
}
|
|
_, ok = metricsMap[metricsNodeCPUUltilisation]
|
|
if ok {
|
|
metricValues[metricsNodeCPUUltilisation].Series = append(metricValues[metricsNodeCPUUltilisation].Series, monitoring.Point{float64(m.Timestamp.Unix()), float64(usage.Cpu().MilliValue()) / float64(cap.Cpu().MilliValue())})
|
|
}
|
|
_, ok = metricsMap[metricsNodeMemoryUsageWoCache]
|
|
if ok {
|
|
metricValues[metricsNodeMemoryUsageWoCache].Series = append(metricValues[metricsNodeMemoryUsageWoCache].Series, monitoring.Point{float64(m.Timestamp.Unix()), float64(usage.Memory().Value())})
|
|
}
|
|
_, ok = metricsMap[metricsNodeMemoryTotal]
|
|
if ok {
|
|
metricValues[metricsNodeMemoryTotal].Series = append(metricValues[metricsNodeMemoryTotal].Series, monitoring.Point{float64(m.Timestamp.Unix()), float64(cap.Memory().Value())})
|
|
}
|
|
_, ok = metricsMap[metricsNodeMemoryUltilisation]
|
|
if ok {
|
|
metricValues[metricsNodeMemoryUltilisation].Series = append(metricValues[metricsNodeMemoryUltilisation].Series, monitoring.Point{float64(m.Timestamp.Unix()), float64(usage.Memory().Value()) / float64(cap.Memory().Value())})
|
|
}
|
|
|
|
for _, enm := range edgeNodeMetrics {
|
|
_, ok = metricsMap[enm]
|
|
if ok {
|
|
nodeMetrics[enm].MetricValues = append(nodeMetrics[enm].MetricValues, *metricValues[enm])
|
|
}
|
|
}
|
|
}
|
|
|
|
for _, enm := range edgeNodeMetrics {
|
|
_, ok := metricsMap[enm]
|
|
if ok {
|
|
res = append(res, monitoring.Metric{MetricName: enm, MetricData: *nodeMetrics[enm]})
|
|
}
|
|
}
|
|
}
|
|
|
|
return res
|
|
}
|
|
|
|
func (m metricsServer) GetMetadata(namespace string) []monitoring.Metadata {
|
|
var meta []monitoring.Metadata
|
|
|
|
return meta
|
|
}
|
|
|
|
func (m metricsServer) GetMetricLabelSet(expr string, start, end time.Time) []map[string]string {
|
|
var res []map[string]string
|
|
|
|
return res
|
|
}
|
|
|
|
// meter
|
|
func (m metricsServer) GetNamedMeters(meters []string, time time.Time, opts []monitoring.QueryOption) []monitoring.Metric {
|
|
return nil
|
|
}
|
|
func (m metricsServer) GetNamedMetersOverTime(metrics []string, start, end time.Time, step time.Duration, opts []monitoring.QueryOption) []monitoring.Metric {
|
|
return nil
|
|
}
|