notebooks/components/notebook-controller/controllers/notebook_controller.go

671 lines
21 KiB
Go

/*
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package controllers
import (
"context"
"encoding/json"
"fmt"
"os"
"strings"
"github.com/go-logr/logr"
reconcilehelper "github.com/kubeflow/kubeflow/components/common/reconcilehelper"
"github.com/kubeflow/kubeflow/components/notebook-controller/api/v1beta1"
"github.com/kubeflow/kubeflow/components/notebook-controller/pkg/culler"
"github.com/kubeflow/kubeflow/components/notebook-controller/pkg/metrics"
appsv1 "k8s.io/api/apps/v1"
corev1 "k8s.io/api/core/v1"
apierrs "k8s.io/apimachinery/pkg/api/errors"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
"k8s.io/apimachinery/pkg/apis/meta/v1/unstructured"
"k8s.io/apimachinery/pkg/runtime"
"k8s.io/apimachinery/pkg/types"
"k8s.io/apimachinery/pkg/util/intstr"
"k8s.io/client-go/tools/record"
ctrl "sigs.k8s.io/controller-runtime"
"sigs.k8s.io/controller-runtime/pkg/client"
"sigs.k8s.io/controller-runtime/pkg/event"
"sigs.k8s.io/controller-runtime/pkg/handler"
"sigs.k8s.io/controller-runtime/pkg/predicate"
"sigs.k8s.io/controller-runtime/pkg/reconcile"
"sigs.k8s.io/controller-runtime/pkg/source"
)
const (
	// DefaultContainerPort is the container port declared on the notebook
	// container when the Notebook spec lists none; it is also the default
	// target port of the generated Service.
	DefaultContainerPort = 8888

	// DefaultServingPort is the port exposed by the generated Service and
	// referenced as the destination port of the Istio VirtualService.
	DefaultServingPort = 80

	// AnnotationRewriteURI is the Notebook annotation whose non-empty value
	// replaces the default rewrite URI of the VirtualService.
	AnnotationRewriteURI = "notebooks.kubeflow.org/http-rewrite-uri"

	// AnnotationHeadersRequestSet is the Notebook annotation holding a JSON
	// object of headers placed under "headers.request.set" of the
	// VirtualService.
	AnnotationHeadersRequestSet = "notebooks.kubeflow.org/http-headers-request-set"

	// DefaultFSGroup is the default fsGroup of PodSecurityContext.
	// https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.11/#podsecuritycontext-v1-core
	DefaultFSGroup = int64(100)
)
// ignoreNotFound returns nil when err is a Kubernetes NotFound error and
// returns err unchanged otherwise.
//
// We generally want to ignore (not requeue) NotFound errors, since we'll get
// a reconciliation request once the object exists, and requeuing in the
// meantime won't help.
func ignoreNotFound(err error) error {
	if !apierrs.IsNotFound(err) {
		return err
	}
	return nil
}
// NotebookReconciler reconciles a Notebook object.
type NotebookReconciler struct {
// Client is the embedded Kubernetes client used to get, create and update
// the objects handled by the reconciler.
client.Client
// Log is the base logger; the reconciler derives per-notebook loggers from it.
Log logr.Logger
// Scheme is passed to ctrl.SetControllerReference when the Notebook is set
// as controller owner of the generated objects.
Scheme *runtime.Scheme
// Metrics holds the counters incremented on notebook creation, failed
// creation and culling.
Metrics *metrics.Metrics
// EventRecorder re-emits Pod and StatefulSet events on the involved Notebook.
EventRecorder record.EventRecorder
}
// +kubebuilder:rbac:groups=core,resources=pods,verbs=get;list;watch
// +kubebuilder:rbac:groups=core,resources=events,verbs=get;list;watch;create
// +kubebuilder:rbac:groups=core,resources=services,verbs="*"
// +kubebuilder:rbac:groups=apps,resources=statefulsets,verbs="*"
// +kubebuilder:rbac:groups=kubeflow.org,resources=notebooks;notebooks/status;notebooks/finalizers,verbs="*"
// +kubebuilder:rbac:groups="networking.istio.io",resources=virtualservices,verbs="*"

// Reconcile handles a single request from the work queue. The request key may
// name either an Event or a Notebook, because both share the same queue.
//
// When the key resolves to an Event, the event is re-emitted on the Notebook
// it relates to. Processing then continues and tries to load a Notebook with
// the same key; a NotFound at that point ends the reconciliation without
// error.
//
// For a Notebook the method, in order:
//  1. creates or updates the StatefulSet generated from the Notebook,
//  2. creates or updates the Service generated from the Notebook,
//  3. reconciles the Istio VirtualService when USE_ISTIO is "true",
//  4. copies the StatefulSet's ReadyReplicas into the Notebook status,
//  5. mirrors the state of the container named after the Notebook (in pod
//     "<name>-0") into the Notebook status and conditions,
//  6. sets the stop annotation when the culler reports the Notebook needs
//     culling, or asks to be requeued after culler.GetRequeueTime() when the
//     pod exists and the stop annotation is not set.
//
// Any error other than the ignored NotFound cases is returned to the caller.
func (r *NotebookReconciler) Reconcile(req ctrl.Request) (ctrl.Result, error) {
	ctx := context.Background()
	log := r.Log.WithValues("notebook", req.NamespacedName)

	// TODO(yanniszark): Can we avoid reconciling Events and Notebook in the same queue?
	event := &corev1.Event{}
	getEventErr := r.Get(ctx, req.NamespacedName, event)
	if getEventErr == nil {
		involvedNotebook := &v1beta1.Notebook{}
		nbName, err := nbNameFromInvolvedObject(r.Client, &event.InvolvedObject)
		if err != nil {
			return ctrl.Result{}, err
		}
		involvedNotebookKey := types.NamespacedName{Name: nbName, Namespace: req.Namespace}
		if err := r.Get(ctx, involvedNotebookKey, involvedNotebook); err != nil {
			log.Error(err, "unable to fetch Notebook by looking at event")
			return ctrl.Result{}, ignoreNotFound(err)
		}
		// Surface the Pod/StatefulSet event on the Notebook itself.
		r.EventRecorder.Eventf(involvedNotebook, event.Type, event.Reason,
			"Reissued from %s/%s: %s", strings.ToLower(event.InvolvedObject.Kind), event.InvolvedObject.Name, event.Message)
	}
	if getEventErr != nil && !apierrs.IsNotFound(getEventErr) {
		return ctrl.Result{}, getEventErr
	}
	// If not found, continue. Is not an event.

	instance := &v1beta1.Notebook{}
	if err := r.Get(ctx, req.NamespacedName, instance); err != nil {
		log.Error(err, "unable to fetch Notebook")
		return ctrl.Result{}, ignoreNotFound(err)
	}

	// Reconcile StatefulSet
	ss := generateStatefulSet(instance)
	if err := ctrl.SetControllerReference(instance, ss, r.Scheme); err != nil {
		return ctrl.Result{}, err
	}
	// Check if the StatefulSet already exists
	foundStateful := &appsv1.StatefulSet{}
	justCreated := false
	err := r.Get(ctx, types.NamespacedName{Name: ss.Name, Namespace: ss.Namespace}, foundStateful)
	if err != nil && apierrs.IsNotFound(err) {
		log.Info("Creating StatefulSet", "namespace", ss.Namespace, "name", ss.Name)
		r.Metrics.NotebookCreation.WithLabelValues(ss.Namespace).Inc()
		err = r.Create(ctx, ss)
		justCreated = true
		if err != nil {
			log.Error(err, "unable to create Statefulset")
			r.Metrics.NotebookFailCreation.WithLabelValues(ss.Namespace).Inc()
			return ctrl.Result{}, err
		}
	} else if err != nil {
		log.Error(err, "error getting Statefulset")
		return ctrl.Result{}, err
	}
	// Update the foundStateful object and write the result back if there are any changes
	if !justCreated && reconcilehelper.CopyStatefulSetFields(ss, foundStateful) {
		log.Info("Updating StatefulSet", "namespace", ss.Namespace, "name", ss.Name)
		err = r.Update(ctx, foundStateful)
		if err != nil {
			log.Error(err, "unable to update Statefulset")
			return ctrl.Result{}, err
		}
	}

	// Reconcile service
	service := generateService(instance)
	if err := ctrl.SetControllerReference(instance, service, r.Scheme); err != nil {
		return ctrl.Result{}, err
	}
	// Check if the Service already exists
	foundService := &corev1.Service{}
	justCreated = false
	err = r.Get(ctx, types.NamespacedName{Name: service.Name, Namespace: service.Namespace}, foundService)
	if err != nil && apierrs.IsNotFound(err) {
		log.Info("Creating Service", "namespace", service.Namespace, "name", service.Name)
		err = r.Create(ctx, service)
		justCreated = true
		if err != nil {
			log.Error(err, "unable to create Service")
			return ctrl.Result{}, err
		}
	} else if err != nil {
		log.Error(err, "error getting Service")
		return ctrl.Result{}, err
	}
	// Update the foundService object and write the result back if there are any changes
	if !justCreated && reconcilehelper.CopyServiceFields(service, foundService) {
		log.Info("Updating Service", "namespace", service.Namespace, "name", service.Name)
		err = r.Update(ctx, foundService)
		if err != nil {
			log.Error(err, "unable to update Service")
			return ctrl.Result{}, err
		}
	}

	// Reconcile virtual service if we use ISTIO.
	if os.Getenv("USE_ISTIO") == "true" {
		err = r.reconcileVirtualService(instance)
		if err != nil {
			return ctrl.Result{}, err
		}
	}

	// Update the readyReplicas if the status is changed
	if foundStateful.Status.ReadyReplicas != instance.Status.ReadyReplicas {
		log.Info("Updating Status", "namespace", instance.Namespace, "name", instance.Name)
		instance.Status.ReadyReplicas = foundStateful.Status.ReadyReplicas
		err = r.Status().Update(ctx, instance)
		if err != nil {
			return ctrl.Result{}, err
		}
	}

	// Check the pod status
	pod := &corev1.Pod{}
	podFound := false
	err = r.Get(ctx, types.NamespacedName{Name: ss.Name + "-0", Namespace: ss.Namespace}, pod)
	if err != nil && apierrs.IsNotFound(err) {
		// This should be reconciled by the StatefulSet
		log.Info("Pod not found...")
	} else if err != nil {
		return ctrl.Result{}, err
	} else {
		// Got the pod
		podFound = true
		// Update status of the CR using the ContainerState of
		// the container that has the same name as the CR.
		// If no container of same name is found, the state of the CR is not updated.
		if len(pod.Status.ContainerStatuses) > 0 {
			notebookContainerFound := false
			for i := range pod.Status.ContainerStatuses {
				if pod.Status.ContainerStatuses[i].Name != instance.Name {
					continue
				}
				// The container exists; record that before deciding whether
				// its state changed, so an unchanged state is not reported
				// below as a missing container.
				notebookContainerFound = true
				cs := pod.Status.ContainerStatuses[i].State
				// NOTE(review): ContainerState appears to hold pointer fields,
				// so == would compare addresses rather than contents - confirm
				// whether a deep comparison is intended here.
				if cs == instance.Status.ContainerState {
					break
				}
				log.Info("Updating Notebook CR state: ", "namespace", instance.Namespace, "name", instance.Name)
				instance.Status.ContainerState = cs
				oldConditions := instance.Status.Conditions
				newCondition := getNextCondition(cs)
				// Prepend the new condition unless it repeats the most recent one.
				if len(oldConditions) == 0 || oldConditions[0].Type != newCondition.Type ||
					oldConditions[0].Reason != newCondition.Reason ||
					oldConditions[0].Message != newCondition.Message {
					log.Info("Appending to conditions: ", "namespace", instance.Namespace, "name", instance.Name, "type", newCondition.Type, "reason", newCondition.Reason, "message", newCondition.Message)
					instance.Status.Conditions = append([]v1beta1.NotebookCondition{newCondition}, oldConditions...)
				}
				err = r.Status().Update(ctx, instance)
				if err != nil {
					return ctrl.Result{}, err
				}
				break
			}
			if !notebookContainerFound {
				log.Error(nil, "Could not find the Notebook container, will not update the status of the CR. No container has the same name as the CR.", "CR name:", instance.Name)
			}
		}
	}

	// Check if the Notebook needs to be stopped
	if podFound && culler.NotebookNeedsCulling(instance.ObjectMeta) {
		log.Info(fmt.Sprintf(
			"Notebook %s/%s needs culling. Setting annotations",
			instance.Namespace, instance.Name))
		// Set annotations to the Notebook
		culler.SetStopAnnotation(&instance.ObjectMeta, r.Metrics)
		r.Metrics.NotebookCullingCount.WithLabelValues(instance.Namespace, instance.Name).Inc()
		err = r.Update(ctx, instance)
		if err != nil {
			return ctrl.Result{}, err
		}
	} else if podFound && !culler.StopAnnotationIsSet(instance.ObjectMeta) {
		// The Pod is either too fresh, or the idle time has passed and it has
		// received traffic. In this case we will be periodically checking if
		// it needs culling.
		return ctrl.Result{RequeueAfter: culler.GetRequeueTime()}, nil
	}
	return ctrl.Result{}, nil
}
// getNextCondition builds the NotebookCondition describing the container
// state cs.
//
// The condition type is "Running", "Waiting" or "Terminated" depending on
// which member of cs is set, checked in that order. Reason and Message are
// copied from the Waiting or Terminated details; they stay empty for Running.
// When no member is set the state is reported as "Waiting" with empty reason
// and message, following the Kubernetes API convention that an unspecified
// container state defaults to waiting. LastProbeTime is set to the current
// time.
func getNextCondition(cs corev1.ContainerState) v1beta1.NotebookCondition {
	var nbtype, nbreason, nbmsg string

	switch {
	case cs.Running != nil:
		nbtype = "Running"
	case cs.Waiting != nil:
		nbtype = "Waiting"
		nbreason = cs.Waiting.Reason
		nbmsg = cs.Waiting.Message
	case cs.Terminated != nil:
		nbtype = "Terminated"
		nbreason = cs.Terminated.Reason
		nbmsg = cs.Terminated.Message
	default:
		// Nothing is set: avoid dereferencing a nil Terminated pointer.
		nbtype = "Waiting"
	}

	return v1beta1.NotebookCondition{
		Type:          nbtype,
		LastProbeTime: metav1.Now(),
		Reason:        nbreason,
		Message:       nbmsg,
	}
}
// generateStatefulSet builds the desired StatefulSet for the given Notebook.
//
// The StatefulSet has the Notebook's name and namespace and runs one replica,
// or zero when the culler's stop annotation is set. The pod template carries
// the "statefulset" and "notebook-name" labels plus every label of the
// Notebook, and a deep copy of the Notebook's pod spec, so the defaults
// applied below never leak back into the Notebook object itself.
//
// Defaults applied to the first container (when one exists): working
// directory "/home/jovyan", a single "notebook-port" TCP port on
// DefaultContainerPort when no ports are declared, and an NB_PREFIX
// environment variable set to "/notebook/<namespace>/<name>".
func generateStatefulSet(instance *v1beta1.Notebook) *appsv1.StatefulSet {
	replicas := int32(1)
	if culler.StopAnnotationIsSet(instance.ObjectMeta) {
		replicas = 0
	}

	ss := &appsv1.StatefulSet{
		ObjectMeta: metav1.ObjectMeta{
			Name:      instance.Name,
			Namespace: instance.Namespace,
		},
		Spec: appsv1.StatefulSetSpec{
			Replicas: &replicas,
			Selector: &metav1.LabelSelector{
				MatchLabels: map[string]string{
					"statefulset": instance.Name,
				},
			},
			Template: corev1.PodTemplateSpec{
				ObjectMeta: metav1.ObjectMeta{Labels: map[string]string{
					"statefulset":   instance.Name,
					"notebook-name": instance.Name,
				}},
				// A plain struct copy would share the Containers slice with
				// the Notebook, and the defaulting below would then modify
				// the Notebook's own spec.
				Spec: *instance.Spec.Template.Spec.DeepCopy(),
			},
		},
	}

	// copy all of the Notebook labels to the pod including poddefault related labels
	podLabels := ss.Spec.Template.ObjectMeta.Labels
	for k, v := range instance.ObjectMeta.Labels {
		podLabels[k] = v
	}

	podSpec := &ss.Spec.Template.Spec
	// Guard against a spec without containers instead of panicking on the
	// index; such a StatefulSet is returned without container defaults.
	if len(podSpec.Containers) > 0 {
		container := &podSpec.Containers[0]
		if container.WorkingDir == "" {
			container.WorkingDir = "/home/jovyan"
		}
		if len(container.Ports) == 0 {
			container.Ports = []corev1.ContainerPort{
				{
					ContainerPort: DefaultContainerPort,
					Name:          "notebook-port",
					Protocol:      "TCP",
				},
			}
		}
		container.Env = append(container.Env, corev1.EnvVar{
			Name:  "NB_PREFIX",
			Value: "/notebook/" + instance.Namespace + "/" + instance.Name,
		})
	}

	// For some platforms (like OpenShift), adding fsGroup: 100 is troublesome.
	// This allows for those platforms to bypass the automatic addition of the fsGroup
	// and will allow for the Pod Security Policy controller to make an appropriate choice
	// https://github.com/kubernetes-sigs/controller-runtime/issues/4617
	if value, exists := os.LookupEnv("ADD_FSGROUP"); !exists || value == "true" {
		if podSpec.SecurityContext == nil {
			fsGroup := DefaultFSGroup
			podSpec.SecurityContext = &corev1.PodSecurityContext{
				FSGroup: &fsGroup,
			}
		}
	}
	return ss
}
// generateService builds the desired ClusterIP Service for the given
// Notebook.
//
// The Service has the Notebook's name and namespace, selects pods labelled
// "statefulset=<name>" and exposes DefaultServingPort. Traffic is forwarded
// to the first port declared on the first container of the Notebook's pod
// spec, or to DefaultContainerPort when the spec has no container or the
// container declares no ports.
func generateService(instance *v1beta1.Notebook) *corev1.Service {
	// Define the desired Service object
	port := DefaultContainerPort
	// Length checks (rather than nil checks) keep an empty container or port
	// list from causing an index-out-of-range panic.
	if containers := instance.Spec.Template.Spec.Containers; len(containers) > 0 && len(containers[0].Ports) > 0 {
		port = int(containers[0].Ports[0].ContainerPort)
	}

	svc := &corev1.Service{
		ObjectMeta: metav1.ObjectMeta{
			Name:      instance.Name,
			Namespace: instance.Namespace,
		},
		Spec: corev1.ServiceSpec{
			Type:     "ClusterIP",
			Selector: map[string]string{"statefulset": instance.Name},
			Ports: []corev1.ServicePort{
				{
					// Make port name follow Istio pattern so it can be managed by istio rbac
					Name:       "http-" + instance.Name,
					Port:       DefaultServingPort,
					TargetPort: intstr.FromInt(port),
					Protocol:   "TCP",
				},
			},
		},
	}
	return svc
}
// virtualServiceName returns the name of the VirtualService that belongs to
// the notebook kfName in the given namespace, in the form
// "notebook-<namespace>-<kfName>".
func virtualServiceName(kfName string, namespace string) string {
	const prefix = "notebook"
	return fmt.Sprintf("%s-%s-%s", prefix, namespace, kfName)
}
// generateVirtualService builds the desired Istio VirtualService
// (networking.istio.io/v1alpha3) for the given Notebook as an unstructured
// object.
//
// The VirtualService matches the URI prefix "/notebook/<namespace>/<name>/"
// on all hosts, attaches to the gateway named by ISTIO_GATEWAY (default
// "kubeflow/kubeflow-gateway") and routes to the notebook Service at
// "<name>.<namespace>.svc.<cluster domain>" on DefaultServingPort with a
// "300s" timeout. The cluster domain comes from CLUSTER_DOMAIN when that
// variable is set and is "cluster.local" otherwise.
//
// Two Notebook annotations customise the result: a non-empty
// AnnotationRewriteURI replaces the rewrite URI (which otherwise equals the
// match prefix), and AnnotationHeadersRequestSet supplies a JSON object of
// request headers to set. An annotation that fails to decode yields an empty
// header set rather than an error.
//
// An error is returned only when a field cannot be set on the unstructured
// object.
func generateVirtualService(instance *v1beta1.Notebook) (*unstructured.Unstructured, error) {
	name, namespace := instance.Name, instance.Namespace
	annotations := instance.ObjectMeta.Annotations

	prefix := fmt.Sprintf("/notebook/%s/%s/", namespace, name)

	// The rewrite target defaults to the match prefix unless the annotation
	// carries a non-empty override.
	rewrite := prefix
	if uri := annotations[AnnotationRewriteURI]; len(uri) > 0 {
		rewrite = uri
	}

	clusterDomain, found := os.LookupEnv("CLUSTER_DOMAIN")
	if !found {
		clusterDomain = "cluster.local"
	}
	service := fmt.Sprintf("%s.%s.svc.%s", name, namespace, clusterDomain)

	vsvc := &unstructured.Unstructured{}
	vsvc.SetAPIVersion("networking.istio.io/v1alpha3")
	vsvc.SetKind("VirtualService")
	vsvc.SetName(virtualServiceName(name, namespace))
	vsvc.SetNamespace(namespace)

	if err := unstructured.SetNestedStringSlice(vsvc.Object, []string{"*"}, "spec", "hosts"); err != nil {
		return nil, fmt.Errorf("Set .spec.hosts error: %v", err)
	}

	istioGateway := os.Getenv("ISTIO_GATEWAY")
	if istioGateway == "" {
		istioGateway = "kubeflow/kubeflow-gateway"
	}
	if err := unstructured.SetNestedStringSlice(vsvc.Object, []string{istioGateway},
		"spec", "gateways"); err != nil {
		return nil, fmt.Errorf("Set .spec.gateways error: %v", err)
	}

	// Decode the optional "headers.request.set" annotation.
	headersRequestSet := make(map[string]string)
	if raw := annotations[AnnotationHeadersRequestSet]; len(raw) > 0 {
		if err := json.Unmarshal([]byte(raw), &headersRequestSet); err != nil {
			// if JSON decoding fails, set an empty map
			headersRequestSet = make(map[string]string)
		}
	}
	// SetNestedSlice needs map[string]interface{} rather than map[string]string.
	headers := make(map[string]interface{}, len(headersRequestSet))
	for header, value := range headersRequestSet {
		headers[header] = value
	}

	match := []interface{}{
		map[string]interface{}{
			"uri": map[string]interface{}{
				"prefix": prefix,
			},
		},
	}
	route := []interface{}{
		map[string]interface{}{
			"destination": map[string]interface{}{
				"host": service,
				"port": map[string]interface{}{
					"number": int64(DefaultServingPort),
				},
			},
		},
	}
	// the http section of the istio VirtualService spec
	httpRoutes := []interface{}{
		map[string]interface{}{
			"headers": map[string]interface{}{
				"request": map[string]interface{}{
					"set": headers,
				},
			},
			"match": match,
			"rewrite": map[string]interface{}{
				"uri": rewrite,
			},
			"route":   route,
			"timeout": "300s",
		},
	}

	// add http section to istio VirtualService spec
	if err := unstructured.SetNestedSlice(vsvc.Object, httpRoutes, "spec", "http"); err != nil {
		return nil, fmt.Errorf("Set .spec.http error: %v", err)
	}
	return vsvc, nil
}
// reconcileVirtualService makes sure the Istio VirtualService of the given
// Notebook exists and matches the generated one.
//
// The generated VirtualService gets the Notebook as controller owner. It is
// created when no VirtualService with the expected name exists in the
// Notebook's namespace; otherwise the existing object is updated when
// reconcilehelper.CopyVirtualService reports a difference. Any error from
// generating, fetching, creating or updating the object is returned.
func (r *NotebookReconciler) reconcileVirtualService(instance *v1beta1.Notebook) error {
	log := r.Log.WithValues("notebook", instance.Namespace)
	vsName := virtualServiceName(instance.Name, instance.Namespace)

	virtualService, err := generateVirtualService(instance)
	if err != nil {
		// Stop here: virtualService is nil when generation fails.
		return err
	}
	if err := ctrl.SetControllerReference(instance, virtualService, r.Scheme); err != nil {
		return err
	}

	// Check if the virtual service already exists.
	foundVirtual := &unstructured.Unstructured{}
	justCreated := false
	foundVirtual.SetAPIVersion("networking.istio.io/v1alpha3")
	foundVirtual.SetKind("VirtualService")
	err = r.Get(context.TODO(), types.NamespacedName{Name: vsName, Namespace: instance.Namespace}, foundVirtual)
	if err != nil && apierrs.IsNotFound(err) {
		log.Info("Creating virtual service", "namespace", instance.Namespace, "name", vsName)
		err = r.Create(context.TODO(), virtualService)
		justCreated = true
		if err != nil {
			return err
		}
	} else if err != nil {
		return err
	}

	if !justCreated && reconcilehelper.CopyVirtualService(virtualService, foundVirtual) {
		log.Info("Updating virtual service", "namespace", instance.Namespace, "name", vsName)
		err = r.Update(context.TODO(), foundVirtual)
		if err != nil {
			return err
		}
	}
	return nil
}
// isStsOrPodEvent reports whether the event's involved object is a Pod or a
// StatefulSet.
func isStsOrPodEvent(event *corev1.Event) bool {
	switch event.InvolvedObject.Kind {
	case "Pod", "StatefulSet":
		return true
	default:
		return false
	}
}
// nbNameFromInvolvedObject resolves the name of the Notebook that the
// referenced object belongs to.
//
// A StatefulSet reference yields its own name. A Pod reference is resolved
// by fetching the Pod with c and reading its "notebook-name" label; a failed
// fetch returns the fetch error. Every other case, including a Pod without
// the label, returns an error stating that the object is not related to a
// Notebook.
func nbNameFromInvolvedObject(c client.Client, object *corev1.ObjectReference) (string, error) {
	switch object.Kind {
	case "StatefulSet":
		return object.Name, nil
	case "Pod":
		key := types.NamespacedName{
			Namespace: object.Namespace,
			Name:      object.Name,
		}
		pod := &corev1.Pod{}
		if err := c.Get(context.TODO(), key, pod); err != nil {
			return "", err
		}
		if nbName, ok := pod.Labels["notebook-name"]; ok {
			return nbName, nil
		}
	}
	return "", fmt.Errorf("object isn't related to a Notebook")
}
// nbNameExists reports whether a Notebook called nbName may exist in the
// given namespace. It returns false only when the lookup fails with a
// NotFound error.
func nbNameExists(client client.Client, nbName string, namespace string) bool {
	key := types.NamespacedName{Namespace: namespace, Name: nbName}
	err := client.Get(context.Background(), key, &v1beta1.Notebook{})
	if err == nil {
		return true
	}
	// If error != NotFound, trigger the reconcile call anyway to avoid losing
	// a potentially relevant event.
	return !apierrs.IsNotFound(err)
}
// SetupWithManager registers the reconciler with mgr.
//
// The controller reconciles Notebooks and owns StatefulSets and Services,
// plus Istio VirtualServices when USE_ISTIO is "true". It additionally
// watches:
//   - Pods, mapped to the Notebook named by their "notebook-name" label;
//     create and update events are dropped for Pods without that label.
//   - Events, enqueued under their own name and namespace; create and update
//     events pass only when the involved object is a Pod or StatefulSet that
//     resolves to a Notebook which is not reported as NotFound.
func (r *NotebookReconciler) SetupWithManager(mgr ctrl.Manager) error {
	builder := ctrl.NewControllerManagedBy(mgr).
		For(&v1beta1.Notebook{}).
		Owns(&appsv1.StatefulSet{}).
		Owns(&corev1.Service{})

	// watch Istio virtual service
	if os.Getenv("USE_ISTIO") == "true" {
		virtualService := &unstructured.Unstructured{}
		virtualService.SetAPIVersion("networking.istio.io/v1alpha3")
		virtualService.SetKind("VirtualService")
		builder.Owns(virtualService)
	}

	// TODO(lunkai): After this is fixed:
	// https://github.com/kubernetes-sigs/controller-runtime/issues/572
	// We don't have to call Build to get the controller.
	c, err := builder.Build(r)
	if err != nil {
		return err
	}

	// watch underlying pod
	podToRequest := handler.ToRequestsFunc(
		func(obj handler.MapObject) []ctrl.Request {
			key := types.NamespacedName{
				Name:      obj.Meta.GetLabels()["notebook-name"],
				Namespace: obj.Meta.GetNamespace(),
			}
			return []ctrl.Request{{NamespacedName: key}}
		})

	podPredicates := predicate.Funcs{
		UpdateFunc: func(e event.UpdateEvent) bool {
			_, labelled := e.MetaOld.GetLabels()["notebook-name"]
			return labelled && e.ObjectOld != e.ObjectNew
		},
		CreateFunc: func(e event.CreateEvent) bool {
			_, labelled := e.Meta.GetLabels()["notebook-name"]
			return labelled
		},
	}

	// Events are enqueued under their own key; Reconcile tells them apart
	// from Notebooks.
	eventToRequest := handler.ToRequestsFunc(
		func(obj handler.MapObject) []ctrl.Request {
			key := types.NamespacedName{
				Name:      obj.Meta.GetName(),
				Namespace: obj.Meta.GetNamespace(),
			}
			return []reconcile.Request{{NamespacedName: key}}
		})

	eventsPredicates := predicate.Funcs{
		UpdateFunc: func(e event.UpdateEvent) bool {
			ev := e.ObjectNew.(*corev1.Event)
			nbName, err := nbNameFromInvolvedObject(r.Client, &ev.InvolvedObject)
			if err != nil {
				return false
			}
			if e.ObjectOld == e.ObjectNew || !isStsOrPodEvent(ev) {
				return false
			}
			return nbNameExists(r.Client, nbName, e.MetaNew.GetNamespace())
		},
		CreateFunc: func(e event.CreateEvent) bool {
			ev := e.Object.(*corev1.Event)
			nbName, err := nbNameFromInvolvedObject(r.Client, &ev.InvolvedObject)
			if err != nil {
				return false
			}
			if !isStsOrPodEvent(ev) {
				return false
			}
			return nbNameExists(r.Client, nbName, e.Meta.GetNamespace())
		},
	}

	podWatchErr := c.Watch(
		&source.Kind{Type: &corev1.Pod{}},
		&handler.EnqueueRequestsFromMapFunc{ToRequests: podToRequest},
		podPredicates)
	if podWatchErr != nil {
		return podWatchErr
	}

	eventWatchErr := c.Watch(
		&source.Kind{Type: &corev1.Event{}},
		&handler.EnqueueRequestsFromMapFunc{ToRequests: eventToRequest},
		eventsPredicates)
	if eventWatchErr != nil {
		return eventWatchErr
	}
	return nil
}