linkerd2/viz/metrics-api/grpc_server.go

241 lines
6.6 KiB
Go

package api
import (
"context"
"errors"
"fmt"
"time"
"github.com/golang/protobuf/ptypes/duration"
healthcheckPb "github.com/linkerd/linkerd2/controller/gen/common/healthcheck"
"github.com/linkerd/linkerd2/controller/k8s"
pkgK8s "github.com/linkerd/linkerd2/pkg/k8s"
"github.com/linkerd/linkerd2/pkg/prometheus"
pb "github.com/linkerd/linkerd2/viz/metrics-api/gen/viz"
"github.com/linkerd/linkerd2/viz/metrics-api/util"
promv1 "github.com/prometheus/client_golang/api/prometheus/v1"
log "github.com/sirupsen/logrus"
corev1 "k8s.io/api/core/v1"
"k8s.io/apimachinery/pkg/labels"
)
// Server specifies the interface the Viz metric API server should implement
type Server interface {
pb.ApiServer
}
type grpcServer struct {
prometheusAPI promv1.API
k8sAPI *k8s.API
controllerNamespace string
clusterDomain string
ignoredNamespaces []string
}
type podReport struct {
lastReport time.Time
processStartTimeSeconds time.Time
}
const (
podQuery = "max(process_start_time_seconds{%s}) by (pod, namespace)"
k8sClientSubsystemName = "kubernetes"
k8sClientCheckDescription = "linkerd viz can talk to Kubernetes"
promClientSubsystemName = "prometheus"
promClientCheckDescription = "linkerd viz can talk to Prometheus"
)
func newGrpcServer(
promAPI promv1.API,
k8sAPI *k8s.API,
controllerNamespace string,
clusterDomain string,
ignoredNamespaces []string,
) *grpcServer {
grpcServer := &grpcServer{
prometheusAPI: promAPI,
k8sAPI: k8sAPI,
controllerNamespace: controllerNamespace,
clusterDomain: clusterDomain,
ignoredNamespaces: ignoredNamespaces,
}
pb.RegisterApiServer(prometheus.NewGrpcServer(), grpcServer)
return grpcServer
}
func (s *grpcServer) ListPods(ctx context.Context, req *pb.ListPodsRequest) (*pb.ListPodsResponse, error) {
log.Debugf("ListPods request: %+v", req)
targetOwner := req.GetSelector().GetResource()
// Reports is a map from instance name to the absolute time of the most recent
// report from that instance and its process start time
reports := make(map[string]podReport)
if req.GetNamespace() != "" && req.GetSelector() != nil {
return nil, errors.New("cannot set both namespace and resource in the request. These are mutually exclusive")
}
labelSelector := labels.Everything()
if s := req.GetSelector().GetLabelSelector(); s != "" {
var err error
labelSelector, err = labels.Parse(s)
if err != nil {
return nil, fmt.Errorf("invalid label selector \"%s\": %s", s, err)
}
}
nsQuery := ""
namespace := ""
if req.GetNamespace() != "" {
namespace = req.GetNamespace()
} else if targetOwner.GetNamespace() != "" {
namespace = targetOwner.GetNamespace()
} else if targetOwner.GetType() == pkgK8s.Namespace {
namespace = targetOwner.GetName()
}
if namespace != "" {
nsQuery = fmt.Sprintf("namespace=\"%s\"", namespace)
}
processStartTimeQuery := fmt.Sprintf(podQuery, nsQuery)
// Query Prometheus for all pods present
vec, err := s.queryProm(ctx, processStartTimeQuery)
if err != nil && !errors.Is(err, ErrNoPrometheusInstance) {
return nil, err
}
for _, sample := range vec {
pod := string(sample.Metric["pod"])
timestamp := sample.Timestamp
reports[pod] = podReport{
lastReport: time.Unix(0, int64(timestamp)*int64(time.Millisecond)),
processStartTimeSeconds: time.Unix(0, int64(sample.Value)*int64(time.Second)),
}
}
var pods []*corev1.Pod
if namespace != "" {
pods, err = s.k8sAPI.Pod().Lister().Pods(namespace).List(labelSelector)
} else {
pods, err = s.k8sAPI.Pod().Lister().List(labelSelector)
}
if err != nil {
return nil, err
}
podList := make([]*pb.Pod, 0)
for _, pod := range pods {
if s.shouldIgnore(pod) {
continue
}
ownerKind, ownerName := s.k8sAPI.GetOwnerKindAndName(ctx, pod, false)
// filter out pods without matching owner
if targetOwner.GetNamespace() != "" && targetOwner.GetNamespace() != pod.GetNamespace() {
continue
}
if targetOwner.GetType() != "" && targetOwner.GetType() != ownerKind {
continue
}
if targetOwner.GetName() != "" && targetOwner.GetName() != ownerName {
continue
}
updated, added := reports[pod.Name]
item := util.K8sPodToPublicPod(*pod, ownerKind, ownerName)
item.Added = added
if added {
since := time.Since(updated.lastReport)
item.SinceLastReport = &duration.Duration{
Seconds: int64(since / time.Second),
Nanos: int32(since % time.Second),
}
sinceStarting := time.Since(updated.processStartTimeSeconds)
item.Uptime = &duration.Duration{
Seconds: int64(sinceStarting / time.Second),
Nanos: int32(sinceStarting % time.Second),
}
}
podList = append(podList, item)
}
rsp := pb.ListPodsResponse{Pods: podList}
log.Debugf("ListPods response: %s", rsp.String())
return &rsp, nil
}
func (s *grpcServer) SelfCheck(ctx context.Context, in *healthcheckPb.SelfCheckRequest) (*healthcheckPb.SelfCheckResponse, error) {
k8sClientCheck := &healthcheckPb.CheckResult{
SubsystemName: k8sClientSubsystemName,
CheckDescription: k8sClientCheckDescription,
Status: healthcheckPb.CheckStatus_OK,
}
_, err := s.k8sAPI.Pod().Lister().List(labels.Everything())
if err != nil {
k8sClientCheck.Status = healthcheckPb.CheckStatus_ERROR
k8sClientCheck.FriendlyMessageToUser = fmt.Sprintf("Error calling the Kubernetes API: %s", err)
}
response := &healthcheckPb.SelfCheckResponse{
Results: []*healthcheckPb.CheckResult{
k8sClientCheck,
},
}
if s.prometheusAPI != nil {
promClientCheck := &healthcheckPb.CheckResult{
SubsystemName: promClientSubsystemName,
CheckDescription: promClientCheckDescription,
Status: healthcheckPb.CheckStatus_OK,
}
_, err = s.queryProm(ctx, fmt.Sprintf(podQuery, ""))
if err != nil {
promClientCheck.Status = healthcheckPb.CheckStatus_ERROR
promClientCheck.FriendlyMessageToUser = fmt.Sprintf("Error calling Prometheus from the control plane: %s", err)
}
response.Results = append(response.Results, promClientCheck)
}
return response, nil
}
func (s *grpcServer) shouldIgnore(pod *corev1.Pod) bool {
for _, namespace := range s.ignoredNamespaces {
if pod.Namespace == namespace {
return true
}
}
return false
}
func (s *grpcServer) ListServices(ctx context.Context, req *pb.ListServicesRequest) (*pb.ListServicesResponse, error) {
log.Debugf("ListServices request: %+v", req)
services, err := s.k8sAPI.GetServices(req.Namespace, "")
if err != nil {
return nil, err
}
svcs := make([]*pb.Service, 0)
for _, svc := range services {
svcs = append(svcs, &pb.Service{
Name: svc.GetName(),
Namespace: svc.GetNamespace(),
})
}
return &pb.ListServicesResponse{Services: svcs}, nil
}