kops/upup/pkg/fi/cloudup/scalewaytasks/instance.go

474 lines
14 KiB
Go

/*
Copyright 2022 The Kubernetes Authors.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package scalewaytasks
import (
"bytes"
"crypto/sha256"
"fmt"
"io"
"strconv"
"strings"
"github.com/scaleway/scaleway-sdk-go/api/instance/v1"
"github.com/scaleway/scaleway-sdk-go/api/marketplace/v2"
"github.com/scaleway/scaleway-sdk-go/scw"
"k8s.io/kops/upup/pkg/fi"
"k8s.io/kops/upup/pkg/fi/cloudup/scaleway"
"k8s.io/kops/upup/pkg/fi/cloudup/terraform"
"k8s.io/kops/upup/pkg/fi/cloudup/terraformWriter"
)
// +kops:fitask
type Instance struct {
Name *string
Lifecycle fi.Lifecycle
Zone *string
Role *string
CommercialType *string
Image *string
Tags []string
Count int
VolumeSize *int
NeedsUpdate []string
UserData *fi.Resource
LoadBalancer *LoadBalancer
}
var _ fi.CloudupTask = &Instance{}
var _ fi.CompareWithID = &Instance{}
func (s *Instance) CompareWithID() *string {
return s.Name
}
var _ fi.CloudupHasDependencies = &Instance{}
func (s *Instance) GetDependencies(tasks map[string]fi.CloudupTask) []fi.CloudupTask {
var deps []fi.CloudupTask
for _, task := range tasks {
if _, ok := task.(*Volume); ok {
deps = append(deps, task)
}
}
return deps
}
func (s *Instance) Find(c *fi.CloudupContext) (*Instance, error) {
cloud := c.T.Cloud.(scaleway.ScwCloud)
servers, err := cloud.GetClusterServers(cloud.ClusterName(s.Tags), s.Name)
if err != nil {
return nil, fmt.Errorf("error finding instances: %w", err)
}
if len(servers) == 0 {
return nil, nil
}
// Check if servers updates are needed
var needsUpdate []string
for _, server := range servers {
// Check if server is already marked as needing update
alreadyTagged := false
for _, tag := range server.Tags {
if tag == scaleway.TagNeedsUpdate {
alreadyTagged = true
}
}
if alreadyTagged {
continue
}
// Check commercial type differences
if server.CommercialType != *s.CommercialType {
needsUpdate = append(needsUpdate, server.ID)
continue
}
// Check image differences
diff, err := checkImageDifferences(c, cloud, server, fi.ValueOf(s.Image))
if err != nil {
return nil, fmt.Errorf("checking image differences in server %s (%s): %w", server.Name, server.ID, err)
}
if diff {
needsUpdate = append(needsUpdate, server.ID)
continue
}
// Check user-data differences
diff, err = checkUserDataDifferences(c, cloud, server, s.UserData)
if err != nil {
return nil, fmt.Errorf("checking user-data differences in server %s (%s): %w", server.Name, server.ID, err)
}
if diff {
needsUpdate = append(needsUpdate, server.ID)
}
}
server := servers[0]
igName := scaleway.InstanceGroupNameFromTags(server.Tags)
role := scaleway.InstanceRoleFromTags(server.Tags)
imageLabel, err := imageLabelFromID(c, cloud, server.Image.ID)
if err != nil {
return nil, err
}
return &Instance{
Name: fi.PtrTo(igName),
Lifecycle: s.Lifecycle,
Zone: fi.PtrTo(server.Zone.String()),
Role: fi.PtrTo(role),
CommercialType: fi.PtrTo(server.CommercialType),
Image: fi.PtrTo(imageLabel),
Tags: server.Tags,
Count: len(servers),
NeedsUpdate: needsUpdate,
UserData: s.UserData,
}, nil
}
func (s *Instance) Run(c *fi.CloudupContext) error {
return fi.CloudupDefaultDeltaRunMethod(s, c)
}
func (_ *Instance) CheckChanges(actual, expected, changes *Instance) error {
if actual != nil {
if changes.Name != nil {
return fi.CannotChangeField("Name")
}
if changes.Zone != nil {
return fi.CannotChangeField("Zone")
}
} else {
if expected.Name == nil {
return fi.RequiredField("Name")
}
if expected.Zone == nil {
return fi.RequiredField("Zone")
}
if expected.CommercialType == nil {
return fi.RequiredField("CommercialType")
}
if expected.Image == nil {
return fi.RequiredField("Image")
}
}
return nil
}
func (_ *Instance) RenderScw(t *scaleway.ScwAPITarget, actual, expected, changes *Instance) error {
instanceService := t.Cloud.InstanceService()
zone := scw.Zone(fi.ValueOf(expected.Zone))
userData, err := fi.ResourceAsBytes(*expected.UserData)
if err != nil {
return fmt.Errorf("error rendering instances: %w", err)
}
newInstanceCount := expected.Count
if actual != nil {
// Add "kops.k8s.io/needs-update" label to servers needing update
for _, serverID := range actual.NeedsUpdate {
server, err := instanceService.GetServer(&instance.GetServerRequest{
Zone: zone,
ServerID: serverID,
})
if err != nil {
return fmt.Errorf("rendering server group: listing existing servers: %w", err)
}
_, err = instanceService.UpdateServer(&instance.UpdateServerRequest{
Zone: zone,
ServerID: serverID,
Tags: scw.StringsPtr(append(server.Server.Tags, scaleway.TagNeedsUpdate)),
})
if err != nil {
return fmt.Errorf("rendering server group: adding update tag to server %q (%s): %w", server.Server.Name, serverID, err)
}
}
if expected.Count == actual.Count {
return nil
}
newInstanceCount = expected.Count - actual.Count
}
// If newInstanceCount > 0, we need to create new instances for this group
for i := 0; i < newInstanceCount; i++ {
// We create a unique name for each server
uniqueName, err := uniqueName(t.Cloud, scaleway.ClusterNameFromTags(expected.Tags), fi.ValueOf(expected.Name))
if err != nil {
return fmt.Errorf("error rendering server group %s: computing unique name for server: %w", fi.ValueOf(expected.Name), err)
}
createServerRequest := instance.CreateServerRequest{
Zone: zone,
Name: uniqueName,
CommercialType: fi.ValueOf(expected.CommercialType),
Image: expected.Image,
Tags: expected.Tags,
RoutedIPEnabled: fi.PtrTo(true),
}
// We resize the root volume if needed (for instance types with no local storage)
if expected.VolumeSize != nil {
createServerRequest.Volumes = map[string]*instance.VolumeServerTemplate{
"0": {
Boot: fi.PtrTo(true),
Size: fi.PtrTo(scw.Size(fi.ValueOf(expected.VolumeSize)) * scw.GB),
VolumeType: instance.VolumeVolumeTypeBSSD,
},
}
}
// We create the instance and wait for it to be ready
srv, err := instanceService.CreateServer(&createServerRequest)
if err != nil {
return fmt.Errorf("error creating instance of group %q: %w", fi.ValueOf(expected.Name), err)
}
_, err = instanceService.WaitForServer(&instance.WaitForServerRequest{
ServerID: srv.Server.ID,
Zone: zone,
})
if err != nil {
return fmt.Errorf("error waiting for instance %s of group %q: %w", srv.Server.ID, fi.ValueOf(expected.Name), err)
}
// We load the cloud-init script in the instance user data
err = instanceService.SetServerUserData(&instance.SetServerUserDataRequest{
ServerID: srv.Server.ID,
Zone: srv.Server.Zone,
Key: "cloud-init",
Content: bytes.NewBuffer(userData),
})
if err != nil {
return fmt.Errorf("error setting 'cloud-init' in user-data for instance %s of group %q: %w", srv.Server.ID, fi.ValueOf(expected.Name), err)
}
// We start the instance
_, err = instanceService.ServerAction(&instance.ServerActionRequest{
Zone: zone,
ServerID: srv.Server.ID,
Action: instance.ServerActionPoweron,
})
if err != nil {
return fmt.Errorf("error powering on instance %s of group %q: %w", srv.Server.ID, fi.ValueOf(expected.Name), err)
}
// We wait for the instance to be ready
_, err = instanceService.WaitForServer(&instance.WaitForServerRequest{
ServerID: srv.Server.ID,
Zone: zone,
})
if err != nil {
return fmt.Errorf("error waiting for instance %s of group %q: %w", srv.Server.ID, fi.ValueOf(expected.Name), err)
}
}
// If newInstanceCount < 0, we need to delete instances of this group
if newInstanceCount < 0 {
igInstances, err := t.Cloud.GetClusterServers(t.Cloud.ClusterName(actual.Tags), actual.Name)
if err != nil {
return fmt.Errorf("error deleting instance: %w", err)
}
for i := 0; i > newInstanceCount; i-- {
toDelete := igInstances[i*-1]
err = t.Cloud.DeleteServer(toDelete)
if err != nil {
return fmt.Errorf("error deleting instance of group %s: %w", toDelete.Name, err)
}
}
}
return nil
}
type terraformInstanceIP struct {
Tags []string `cty:"tags"`
}
type terraformInstance struct {
Name *string `cty:"name"`
IPID *terraformWriter.Literal `cty:"ip_id"`
Type *string `cty:"type"`
Tags []string `cty:"tags"`
Image *string `cty:"image"`
UserData map[string]*terraformWriter.Literal `cty:"user_data"`
RootVolume []terraformVolume `cty:"root_volume"`
EnableDynamicIP *bool `cty:"enable_dynamic_ip"`
ReplaceOnTypeChange *bool `cty:"replace_on_type_change"`
Lifecycle *terraform.Lifecycle `cty:"lifecycle"`
}
func (_ *Instance) RenderTerraform(t *terraform.TerraformTarget, actual, expected, changes *Instance) error {
for i := 0; i < expected.Count; i++ {
// We create a unique name for each server
uniqueName := fmt.Sprintf("%s-%d", fi.ValueOf(expected.Name), i)
tfName := strings.ReplaceAll(uniqueName, ".", "-")
tfInstance := terraformInstance{
Name: &uniqueName,
IPID: terraformWriter.LiteralProperty("scaleway_instance_ip", tfName, "id"),
Type: expected.CommercialType,
Tags: expected.Tags,
Image: expected.Image,
EnableDynamicIP: fi.PtrTo(true),
ReplaceOnTypeChange: fi.PtrTo(false),
Lifecycle: nil,
}
// We load the cloud-init script in the instance user data
if expected.UserData != nil {
userDataBytes, err := fi.ResourceAsBytes(fi.ValueOf(expected.UserData))
if err != nil {
return err
}
if userDataBytes != nil {
tfUserData, err := t.AddFileBytes("scaleway_instance_server", tfName, "user_data", userDataBytes, false)
if err != nil {
return err
}
tfInstance.UserData = map[string]*terraformWriter.Literal{
"cloud-init": tfUserData,
}
}
}
// We resize the root volume if needed (for instance types with no local storage)
if expected.VolumeSize != nil {
tfInstance.RootVolume = []terraformVolume{
{
SizeInGB: expected.VolumeSize,
Boot: fi.PtrTo(true),
},
}
}
// For control-plane instances, we want to ignore changes to additional volumes since the etcd-manager will
// attach etcd volumes outside of Terraform
if scaleway.InstanceRoleFromTags(expected.Tags) == scaleway.TagRoleControlPlane {
tfInstance.Lifecycle = &terraform.Lifecycle{
IgnoreChanges: []*terraformWriter.Literal{{String: "additional_volume_ids"}},
}
}
// We create an IP for the server (we only render it now to avoid duplicates if Instance task fails)
tfInstanceIP := terraformInstanceIP{}
for _, tag := range expected.Tags {
if strings.HasPrefix(tag, scaleway.TagClusterName) {
tfInstanceIP.Tags = []string{tag}
break
}
}
err := t.RenderResource("scaleway_instance_ip", tfName, tfInstanceIP)
if err != nil {
return err
}
err = t.RenderResource("scaleway_instance_server", tfName, tfInstance)
if err != nil {
return err
}
}
return nil
}
func checkImageDifferences(c *fi.CloudupContext, cloud scaleway.ScwCloud, actualServer *instance.Server, expectedImage string) (bool, error) {
localImage, err := cloud.MarketplaceService().GetLocalImageByLabel(&marketplace.GetLocalImageByLabelRequest{
ImageLabel: expectedImage,
Zone: actualServer.Zone,
CommercialType: actualServer.CommercialType,
}, scw.WithContext(c.Context()))
if err != nil {
return false, fmt.Errorf("getting image from the marketplace: %w", err)
}
if actualServer.Image.ID != localImage.ID {
return true, nil
}
return false, nil
}
func checkUserDataDifferences(c *fi.CloudupContext, cloud scaleway.ScwCloud, actualServer *instance.Server, expectedUserData *fi.Resource) (bool, error) {
actualUserData, err := cloud.InstanceService().GetServerUserData(&instance.GetServerUserDataRequest{
Zone: actualServer.Zone,
ServerID: actualServer.ID,
Key: "cloud-init",
}, scw.WithContext(c.Context()))
if err != nil {
return false, fmt.Errorf("getting actual user-data: %w", err)
}
actualUserDataBytes, err := io.ReadAll(actualUserData)
if err != nil {
return false, fmt.Errorf("reading actual user-data: %w", err)
}
expectedUserDataBytes, err := fi.ResourceAsBytes(*expectedUserData)
if err != nil {
return false, fmt.Errorf("reading expected user-data: %w", err)
}
if sha256.Sum256(actualUserDataBytes) != sha256.Sum256(expectedUserDataBytes) {
return true, nil
}
return false, nil
}
func imageLabelFromID(c *fi.CloudupContext, cloud scaleway.ScwCloud, id string) (string, error) {
localImage, err := cloud.MarketplaceService().GetLocalImage(&marketplace.GetLocalImageRequest{
LocalImageID: id,
}, scw.WithContext(c.Context()))
if err != nil {
return "", fmt.Errorf("getting image from the marketplace: %w", err)
}
return localImage.Label, nil
}
func findFirstFreeIndex(existing []*instance.Server) int {
index := 0
for {
found := false
for _, server := range existing {
if strings.HasSuffix(server.Name, strconv.Itoa(index)) {
found = true
index++
break
}
}
if !found {
return index
}
}
}
func uniqueName(cloud scaleway.ScwCloud, clusterName, igName string) (string, error) {
existing, err := cloud.GetClusterServers(clusterName, &igName)
if err != nil {
return "", err
}
index := findFirstFreeIndex(existing)
return fmt.Sprintf("%s-%d", igName, index), nil
}