package cluster

import (
	"crypto/tls"
	"errors"
	"fmt"
	"net"
	"strings"
	"sync"
	"time"

	log "github.com/Sirupsen/logrus"
	"github.com/samalba/dockerclient"
)

const (
	// Force-refresh the state of the node this often.
	stateRefreshPeriod = 30 * time.Second

	// Timeout for requests sent out to the node.
	requestTimeout = 10 * time.Second
)

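// NewNode creates a Node for the engine listening at addr. The returned node
// is not connected yet; call Connect to establish the client connection.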
func NewNode(addr string) *Node {
	e := &Node{
		Addr:       addr,
		Labels:     make(map[string]string),
		ch:         make(chan bool),
		containers: make(map[string]*Container),
		healthy:    true,
	}
	return e
}

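// Node represents a single Docker engine in the cluster, along with its
// resources (CPUs, memory), labels and the containers it is running.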
type Node struct {
	sync.RWMutex

	ID     string
	IP     string
	Addr   string
	Name   string
	Cpus   int64
	Memory int64
	Labels map[string]string

	ch           chan bool
	containers   map[string]*Container
	client       dockerclient.Client
	eventHandler EventHandler
	healthy      bool
}

// Connect initializes a connection to the Docker daemon running on the host,
// gathers machine specs (memory, CPUs, ...) and monitors state changes.
func (n *Node) Connect(config *tls.Config) error {
	c, err := dockerclient.NewDockerClientTimeout(n.Addr, config, time.Duration(requestTimeout))
	if err != nil {
		return err
	}

	addr, err := net.ResolveIPAddr("ip4", strings.Split(c.URL.Host, ":")[0])
	if err != nil {
		return err
	}
	n.IP = addr.IP.String()

	return n.connectClient(c)
}

func (n *Node) connectClient(client dockerclient.Client) error {
	n.client = client

	// Fetch the engine labels.
	if err := n.updateSpecs(); err != nil {
		n.client = nil
		return err
	}

	// Force a state update before returning.
	if err := n.refreshContainers(); err != nil {
		n.client = nil
		return err
	}

	// Start the update loop.
	go n.refreshLoop()

	// Start monitoring events from the Node.
	n.client.StartMonitorEvents(n.handler)

	return nil
}

// IsConnected returns true if the engine is connected to a remote Docker API.
func (n *Node) IsConnected() bool {
	return n.client != nil
}

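// IsHealthy returns true if the last state refresh against the engine
// succeeded.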
func (n *Node) IsHealthy() bool {
	return n.healthy
}

// Gather node specs (CPU, memory, constraints, ...).
func (n *Node) updateSpecs() error {
	info, err := n.client.Info()
	if err != nil {
		return err
	}
	// Older versions of Docker don't expose the ID field and are not supported
	// by Swarm. Catch the error ASAP and refuse to connect.
	if len(info.ID) == 0 {
		return fmt.Errorf("Node %s is running an unsupported version of Docker Engine. Please upgrade.", n.Addr)
	}
	n.ID = info.ID
	n.Name = info.Name
	n.Cpus = info.NCPU
	n.Memory = info.MemTotal
	n.Labels = map[string]string{
		"storagedriver":   info.Driver,
		"executiondriver": info.ExecutionDriver,
		"kernelversion":   info.KernelVersion,
		"operatingsystem": info.OperatingSystem,
	}
	for _, label := range info.Labels {
		kv := strings.SplitN(label, "=", 2)
		// Skip labels without a "=" separator instead of panicking on kv[1].
		if len(kv) != 2 {
			continue
		}
		n.Labels[kv[0]] = kv[1]
	}
	return nil
}

// Refresh the list and status of containers running on the node.
func (n *Node) refreshContainers() error {
	containers, err := n.client.ListContainers(true, false, "")
	if err != nil {
		return err
	}

	n.Lock()
	defer n.Unlock()

	merged := make(map[string]*Container)
	for _, c := range containers {
		merged, err = n.updateContainer(c, merged)
		if err != nil {
			log.Errorf("[%s/%s] Unable to update state of %s", n.ID, n.Name, c.Id)
		}
	}

	n.containers = merged

	log.Debugf("[%s/%s] Updated state", n.ID, n.Name)
	return nil
}

// Refresh the status of a container running on the node.
func (n *Node) refreshContainer(ID string) error {
	containers, err := n.client.ListContainers(true, false, fmt.Sprintf("{%q:[%q]}", "id", ID))
	if err != nil {
		return err
	}

	if len(containers) > 1 {
		// We expect a single container. If we get more than one, trigger a full refresh.
		return n.refreshContainers()
	}

	n.Lock()
	defer n.Unlock()

	if len(containers) == 0 {
		// The container doesn't exist on the node, remove it.
		delete(n.containers, ID)
		return nil
	}

	_, err = n.updateContainer(containers[0], n.containers)
	return err
}

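// ForceRefreshContainer re-inspects the given container on the engine and
// updates the node's internal state for it immediately.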
func (n *Node) ForceRefreshContainer(c dockerclient.Container) error {
	return n.inspectContainer(c, n.containers, true)
}

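// inspectContainer fetches the full details of c from the engine and stores
// the result in the given containers map. If lock is true, the node lock is
// held while the map is updated.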
func (n *Node) inspectContainer(c dockerclient.Container, containers map[string]*Container, lock bool) error {
	container := &Container{}
	container.Container = c
	container.Node = n

	info, err := n.client.InspectContainer(c.Id)
	if err != nil {
		return err
	}
	container.Info = *info

	// real CpuShares -> nb of CPUs
	container.Info.Config.CpuShares = container.Info.Config.CpuShares / 100.0 * n.Cpus

	if lock {
		n.Lock()
		defer n.Unlock()
	}
	containers[container.Id] = container

	return nil
}

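// updateContainer merges the latest engine view of c into the given map,
// reusing the existing entry when the container is already known and
// inspecting it from scratch otherwise.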
func (n *Node) updateContainer(c dockerclient.Container, containers map[string]*Container) (map[string]*Container, error) {
	if current, exists := n.containers[c.Id]; exists {
		// The container exists. Update its state.
		current.Container = c
		containers[current.Id] = current
	} else {
		// This is a brand new container.
		if err := n.inspectContainer(c, containers, false); err != nil {
			return nil, err
		}
	}
	return containers, nil
}

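// refreshContainersAsync signals the refresh loop to update the container
// state as soon as possible.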
func (n *Node) refreshContainersAsync() {
	n.ch <- true
}

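// refreshLoop refreshes the container state every stateRefreshPeriod, or
// sooner when refreshContainersAsync is called, and flips the node health
// flag depending on whether the refresh succeeded.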
func (n *Node) refreshLoop() {
	for {
		var err error
		select {
		case <-n.ch:
			err = n.refreshContainers()
		case <-time.After(stateRefreshPeriod):
			err = n.refreshContainers()
		}

		if err != nil {
			n.healthy = false
			log.Errorf("[%s/%s] Flagging node as dead. State update failed: %v", n.ID, n.Name, err)
		} else {
			if !n.healthy {
				log.Infof("[%s/%s] Node came back to life. Hooray!", n.ID, n.Name)
			}
			n.healthy = true
		}
	}
}

// ReservedMemory returns the total amount of memory (in bytes) reserved by
// the containers running on the node.
func (n *Node) ReservedMemory() int64 {
	var r int64
	n.RLock()
	for _, c := range n.containers {
		r += c.Info.Config.Memory
	}
	n.RUnlock()
	return r
}

// ReservedCpus returns the total number of CPUs reserved by the containers
// running on the node.
func (n *Node) ReservedCpus() int64 {
	var r int64
	n.RLock()
	for _, c := range n.containers {
		r += c.Info.Config.CpuShares
	}
	n.RUnlock()
	return r
}

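// Create starts a new container on the node. The CpuShares field of the
// config is expressed as a number of CPUs and translated into real CpuShares
// before the request is sent. If the image is missing and pullImage is true,
// the image is pulled and the creation retried once.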
func (n *Node) Create(config *dockerclient.ContainerConfig, name string, pullImage bool) (*Container, error) {
	var (
		err    error
		id     string
		client = n.client
	)

	newConfig := *config

	// nb of CPUs -> real CpuShares
	newConfig.CpuShares = config.CpuShares * 100 / n.Cpus

	if id, err = client.CreateContainer(&newConfig, name); err != nil {
		// If the error is other than not found, abort immediately.
		if err != dockerclient.ErrNotFound || !pullImage {
			return nil, err
		}
		// Otherwise, try to pull the image...
		if err = n.Pull(config.Image); err != nil {
			return nil, err
		}
		// ...And try again.
		if id, err = client.CreateContainer(&newConfig, name); err != nil {
			return nil, err
		}
	}

	// Force a state refresh to register the newly created container right
	// away, instead of waiting for the next refresh loop iteration.
	n.refreshContainer(id)

	n.RLock()
	defer n.RUnlock()

	return n.containers[id], nil
}

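// ListImages returns the repo:tag names of all the images available on the
// node.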
func (n *Node) ListImages() ([]string, error) {
	images, err := n.client.ListImages()
	if err != nil {
		return nil, err
	}

	out := []string{}

	for _, i := range images {
		for _, t := range i.RepoTags {
			out = append(out, t)
		}
	}

	return out, nil
}

// Destroy removes a container from the node (optionally forcing the removal)
// and drops it from the internal state.
func (n *Node) Destroy(container *Container, force bool) error {
	if err := n.client.RemoveContainer(container.Id, force); err != nil {
		return err
	}

	// Remove the container from the internal state right away; the refresh
	// loop would eventually catch up anyway.
	n.Lock()
	defer n.Unlock()
	delete(n.containers, container.Id)

	return nil
}

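// Pull downloads the given image onto the node.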
func (n *Node) Pull(image string) error {
	if err := n.client.PullImage(image, nil); err != nil {
		return err
	}
	return nil
}

// Events registers an event handler. A node supports a single handler;
// registering a second one returns an error.
func (n *Node) Events(h EventHandler) error {
	if n.eventHandler != nil {
		return errors.New("event handler already set")
	}
	n.eventHandler = h
	return nil
}

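// Containers returns a snapshot of the containers currently known to be
// running on the node.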
func (n *Node) Containers() []*Container {
	containers := []*Container{}
	n.RLock()
	for _, container := range n.containers {
		containers = append(containers, container)
	}
	n.RUnlock()
	return containers
}

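// String returns a human-readable representation of the node.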
func (n *Node) String() string {
	return fmt.Sprintf("node %s addr %s", n.ID, n.Addr)
}

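// handler is the callback registered with dockerclient for engine events. It
// refreshes the affected container and forwards the event to the registered
// EventHandler, if any.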
func (n *Node) handler(ev *dockerclient.Event, args ...interface{}) {
	// Something changed - refresh our internal state.
	n.refreshContainer(ev.Id)

	// If there is no event handler registered, abort right now.
	if n.eventHandler == nil {
		return
	}

	event := &Event{
		Node:  n,
		Event: *ev,
	}

	n.eventHandler.Handle(event)
}

// AddContainer injects a container into the internal state.
func (n *Node) AddContainer(container *Container) error {
	n.Lock()
	defer n.Unlock()

	if _, ok := n.containers[container.Id]; ok {
		return errors.New("container already exists")
	}
	n.containers[container.Id] = container
	return nil
}

// RemoveContainer removes a container from the internal state.
func (n *Node) RemoveContainer(container *Container) error {
	n.Lock()
	defer n.Unlock()

	if _, ok := n.containers[container.Id]; !ok {
		return errors.New("container not found")
	}
	delete(n.containers, container.Id)
	return nil
}

// CleanupContainers wipes the internal container state.
func (n *Node) CleanupContainers() {
	n.Lock()
	n.containers = make(map[string]*Container)
	n.Unlock()
}