linkerd2/controller/api/public/grpc_server.go

276 lines
7.8 KiB
Go

package public
import (
"context"
"fmt"
"runtime"
"strings"
"time"
"github.com/golang/protobuf/ptypes/duration"
healthcheckPb "github.com/linkerd/linkerd2/controller/gen/common/healthcheck"
tapPb "github.com/linkerd/linkerd2/controller/gen/controller/tap"
pb "github.com/linkerd/linkerd2/controller/gen/public"
"github.com/linkerd/linkerd2/controller/k8s"
pkgK8s "github.com/linkerd/linkerd2/pkg/k8s"
"github.com/linkerd/linkerd2/pkg/version"
promv1 "github.com/prometheus/client_golang/api/prometheus/v1"
log "github.com/sirupsen/logrus"
"google.golang.org/grpc/codes"
"google.golang.org/grpc/status"
k8sV1 "k8s.io/api/core/v1"
"k8s.io/apimachinery/pkg/labels"
)
// grpcServer implements the public API on top of Prometheus, the tap service
// and the Kubernetes API.
type grpcServer struct {
	// prometheusAPI is the Prometheus client handed to newGrpcServer.
	// NOTE(review): presumably what queryProm uses; confirm at its definition.
	prometheusAPI promv1.API
	// tapClient is the tap service client that TapByResource forwards to.
	tapClient tapPb.TapClient
	// k8sAPI provides the pod lister, service lookup and owner resolution.
	k8sAPI *k8s.API
	// controllerNamespace is stored as passed to newGrpcServer.
	controllerNamespace string
	// ignoredNamespaces lists namespaces whose pods ListPods skips.
	ignoredNamespaces []string
}
// podReport holds what a single Prometheus sample says about a pod:
// lastReport is the time derived from the sample's timestamp, and
// processStartTimeSeconds is the time derived from the sample's
// process_start_time_seconds value.
type podReport struct {
	lastReport, processStartTimeSeconds time.Time
}
// podQuery is the PromQL template used to discover pods: the %s verb is
// replaced by an optional label matcher, and the query yields the maximum
// process_start_time_seconds per (pod, namespace).
const podQuery = "max(process_start_time_seconds{%s}) by (pod, namespace)"

// Subsystem names and check descriptions reported by SelfCheck.
const (
	k8sClientSubsystemName  = "kubernetes"
	promClientSubsystemName = "prometheus"

	k8sClientCheckDescription  = "control plane can talk to Kubernetes"
	promClientCheckDescription = "control plane can talk to Prometheus"
)
// newGrpcServer builds a grpcServer that holds the given Prometheus client,
// tap client, Kubernetes API handle, controller namespace and list of
// namespaces to ignore. The arguments are stored as-is; nothing is copied or
// validated.
func newGrpcServer(
	promAPI promv1.API,
	tapClient tapPb.TapClient,
	k8sAPI *k8s.API,
	controllerNamespace string,
	ignoredNamespaces []string,
) *grpcServer {
	srv := new(grpcServer)
	srv.prometheusAPI = promAPI
	srv.tapClient = tapClient
	srv.k8sAPI = k8sAPI
	srv.controllerNamespace = controllerNamespace
	srv.ignoredNamespaces = ignoredNamespaces
	return srv
}
// Version reports the Go runtime version and the release version of this
// build. BuildDate is a fixed literal, not the actual build time. The error
// is always nil.
func (*grpcServer) Version(ctx context.Context, req *pb.Empty) (*pb.VersionInfo, error) {
	info := &pb.VersionInfo{
		GoVersion:      runtime.Version(),
		ReleaseVersion: version.Version,
		BuildDate:      "1970-01-01T00:00:00Z",
	}
	return info, nil
}
// ListPods returns the pods known to the Kubernetes pod lister, restricted to
// req's namespace when one is given, and skipping pods for which shouldIgnore
// reports true.
//
// Each returned pod is named "<namespace>/<name>". A pod for which Prometheus
// returned a process_start_time_seconds sample is marked Added and carries
// SinceLastReport and Uptime; other pods leave those fields unset.
//
// An error from the Prometheus query or from the pod lister is returned as-is
// together with a nil response.
func (s *grpcServer) ListPods(ctx context.Context, req *pb.ListPodsRequest) (*pb.ListPodsResponse, error) {
	log.Debugf("ListPods request: %+v", req)

	namespace := req.GetNamespace()

	// Restrict the Prometheus query to the requested namespace, if any. %q
	// quotes and escapes the value so that it cannot terminate the label
	// matcher early; for ordinary namespace names the output is unchanged.
	nsQuery := ""
	if namespace != "" {
		nsQuery = fmt.Sprintf("namespace=%q", namespace)
	}

	// Query Prometheus for all pods present.
	vec, err := s.queryProm(ctx, fmt.Sprintf(podQuery, nsQuery))
	if err != nil {
		return nil, err
	}

	// reports maps "<namespace>/<pod>" to the time of the sample and the
	// process start time it carries. The query groups by both labels, so the
	// key must include both: keying on the pod name alone would let same-named
	// pods in different namespaces overwrite each other.
	reports := make(map[string]podReport, len(vec))
	for _, sample := range vec {
		key := string(sample.Metric["namespace"]) + "/" + string(sample.Metric["pod"])
		reports[key] = podReport{
			// The sample timestamp is scaled from milliseconds.
			lastReport:              time.Unix(0, int64(sample.Timestamp)*int64(time.Millisecond)),
			processStartTimeSeconds: time.Unix(int64(sample.Value), 0),
		}
	}

	var pods []*k8sV1.Pod
	if namespace != "" {
		pods, err = s.k8sAPI.Pod().Lister().Pods(namespace).List(labels.Everything())
	} else {
		pods, err = s.k8sAPI.Pod().Lister().List(labels.Everything())
	}
	if err != nil {
		return nil, err
	}

	// toProto splits a Go duration into whole seconds and leftover nanoseconds.
	toProto := func(d time.Duration) *duration.Duration {
		return &duration.Duration{
			Seconds: int64(d / time.Second),
			Nanos:   int32(d % time.Second),
		}
	}

	podList := make([]*pb.Pod, 0, len(pods))
	for _, pod := range pods {
		if s.shouldIgnore(pod) {
			continue
		}

		namespacedName := pod.Namespace + "/" + pod.Name
		report, added := reports[namespacedName]

		// Named podStatus so the imported grpc status package is not shadowed.
		podStatus := string(pod.Status.Phase)
		if pod.DeletionTimestamp != nil {
			podStatus = "Terminating"
		}

		controllerComponent := pod.Labels[pkgK8s.ControllerComponentLabel]
		controllerNS := pod.Labels[pkgK8s.ControllerNSLabel]

		proxyReady := false
		for _, container := range pod.Status.ContainerStatuses {
			if container.Name == pkgK8s.ProxyContainerName {
				proxyReady = container.Ready
			}
		}

		proxyVersion := ""
		for _, container := range pod.Spec.Containers {
			if container.Name == pkgK8s.ProxyContainerName {
				proxyVersion = proxyVersionFromImage(container.Image)
			}
		}

		item := &pb.Pod{
			Name:                namespacedName,
			Status:              podStatus,
			PodIP:               pod.Status.PodIP,
			Added:               added,
			ControllerNamespace: controllerNS,
			ControlPlane:        controllerComponent != "",
			ProxyReady:          proxyReady,
			ProxyVersion:        proxyVersion,
		}

		// Owner stays unset for owner kinds not listed here.
		ownerKind, ownerName := s.k8sAPI.GetOwnerKindAndName(pod)
		namespacedOwnerName := pod.Namespace + "/" + ownerName
		switch ownerKind {
		case "deployment":
			item.Owner = &pb.Pod_Deployment{Deployment: namespacedOwnerName}
		case "replicaset":
			item.Owner = &pb.Pod_ReplicaSet{ReplicaSet: namespacedOwnerName}
		case "replicationcontroller":
			item.Owner = &pb.Pod_ReplicationController{ReplicationController: namespacedOwnerName}
		case "statefulset":
			item.Owner = &pb.Pod_StatefulSet{StatefulSet: namespacedOwnerName}
		case "daemonset":
			item.Owner = &pb.Pod_DaemonSet{DaemonSet: namespacedOwnerName}
		case "job":
			item.Owner = &pb.Pod_Job{Job: namespacedOwnerName}
		}

		if added {
			item.SinceLastReport = toProto(time.Since(report.lastReport))
			item.Uptime = toProto(time.Since(report.processStartTimeSeconds))
		}

		podList = append(podList, item)
	}

	rsp := pb.ListPodsResponse{Pods: podList}
	log.Debugf("ListPods response: %+v", rsp)
	return &rsp, nil
}

// proxyVersionFromImage returns the tag of a container image reference, or ""
// when the reference carries no tag. Unlike splitting on every ':' and taking
// the second element, it neither panics on an untagged image nor mistakes a
// registry port ("host:5000/name:tag") or a digest ("name@sha256:...") for
// the tag.
func proxyVersionFromImage(image string) string {
	// Drop a trailing "@<digest>" so the colon inside it is not read as a tag
	// separator.
	if at := strings.Index(image, "@"); at >= 0 {
		image = image[:at]
	}
	// Only a colon in the last path component separates a tag; LastIndex
	// returns -1 when there is no slash, which keeps the whole string.
	name := image[strings.LastIndex(image, "/")+1:]
	if colon := strings.LastIndex(name, ":"); colon >= 0 {
		return name[colon+1:]
	}
	return ""
}
// SelfCheck reports whether the control plane can list pods through the
// Kubernetes lister and can run a query against Prometheus. The response
// always holds two results, Kubernetes first and Prometheus second; a failed
// check has status ERROR and a message containing the underlying error. The
// returned error is always nil.
func (s *grpcServer) SelfCheck(ctx context.Context, in *healthcheckPb.SelfCheckRequest) (*healthcheckPb.SelfCheckResponse, error) {
	k8sResult := &healthcheckPb.CheckResult{
		SubsystemName:    k8sClientSubsystemName,
		CheckDescription: k8sClientCheckDescription,
		Status:           healthcheckPb.CheckStatus_OK,
	}
	if _, listErr := s.k8sAPI.Pod().Lister().List(labels.Everything()); listErr != nil {
		k8sResult.Status = healthcheckPb.CheckStatus_ERROR
		k8sResult.FriendlyMessageToUser = fmt.Sprintf("Error calling the Kubernetes API: %s", listErr)
	}

	promResult := &healthcheckPb.CheckResult{
		SubsystemName:    promClientSubsystemName,
		CheckDescription: promClientCheckDescription,
		Status:           healthcheckPb.CheckStatus_OK,
	}
	// The pod query with no label matcher serves as the connectivity probe.
	if _, queryErr := s.queryProm(ctx, fmt.Sprintf(podQuery, "")); queryErr != nil {
		promResult.Status = healthcheckPb.CheckStatus_ERROR
		promResult.FriendlyMessageToUser = fmt.Sprintf("Error calling Prometheus from the control plane: %s", queryErr)
	}

	return &healthcheckPb.SelfCheckResponse{
		Results: []*healthcheckPb.CheckResult{k8sResult, promResult},
	}, nil
}
// Tap is no longer supported: it always fails with an Unimplemented status
// that points callers at TapByResource.
func (s *grpcServer) Tap(req *pb.TapRequest, stream pb.Api_TapServer) error {
	const deprecationMsg = "Tap is deprecated, use TapByResource"
	return status.Error(codes.Unimplemented, deprecationMsg)
}
// TapByResource passes req through to the tap service and relays every event
// it receives back over stream.
//
// It returns nil if the stream's context is found done between events.
// Otherwise it returns the first error from opening the upstream tap, from
// receiving an event, or from sending an event to the caller. A stream that
// is not a tapServer yields an Internal status error instead of a panic.
func (s *grpcServer) TapByResource(req *pb.TapByResourceRequest, stream pb.Api_TapByResourceServer) error {
	tapStream, ok := stream.(tapServer)
	if !ok {
		return status.Errorf(codes.Internal, "unexpected tap stream type %T", stream)
	}

	upstream, err := s.tapClient.TapByResource(tapStream.Context(), req)
	if err != nil {
		log.Errorf("Unexpected error tapping [%v]: %v", req, err)
		return err
	}

	for {
		select {
		case <-tapStream.Context().Done():
			return nil
		default:
			event, err := upstream.Recv()
			if err != nil {
				return err
			}
			// Stop relaying as soon as the caller's stream rejects an event,
			// rather than dropping the error and continuing to read upstream.
			if err := tapStream.Send(event); err != nil {
				return err
			}
		}
	}
}
// shouldIgnore reports whether pod lives in one of the server's ignored
// namespaces.
func (s *grpcServer) shouldIgnore(pod *k8sV1.Pod) bool {
	for i := range s.ignoredNamespaces {
		if s.ignoredNamespaces[i] == pod.Namespace {
			return true
		}
	}
	return false
}
// ListServices returns the name and namespace of every service that the
// Kubernetes API handle reports for req.Namespace. A lookup error is returned
// as-is with a nil response; with no services the response holds an empty,
// non-nil list.
func (s *grpcServer) ListServices(ctx context.Context, req *pb.ListServicesRequest) (*pb.ListServicesResponse, error) {
	log.Debugf("ListServices request: %+v", req)

	found, err := s.k8sAPI.GetServices(req.Namespace, "")
	if err != nil {
		return nil, err
	}

	out := make([]*pb.Service, len(found))
	for i, svc := range found {
		out[i] = &pb.Service{
			Name:      svc.GetName(),
			Namespace: svc.GetNamespace(),
		}
	}

	return &pb.ListServicesResponse{Services: out}, nil
}