package libimage import ( "context" "errors" "fmt" "io" "runtime" "strings" "time" "github.com/containers/common/pkg/config" registryTransport "github.com/containers/image/v5/docker" dockerArchiveTransport "github.com/containers/image/v5/docker/archive" dockerDaemonTransport "github.com/containers/image/v5/docker/daemon" "github.com/containers/image/v5/docker/reference" "github.com/containers/image/v5/manifest" ociArchiveTransport "github.com/containers/image/v5/oci/archive" ociTransport "github.com/containers/image/v5/oci/layout" "github.com/containers/image/v5/pkg/shortnames" storageTransport "github.com/containers/image/v5/storage" "github.com/containers/image/v5/transports/alltransports" "github.com/containers/image/v5/types" "github.com/containers/storage" digest "github.com/opencontainers/go-digest" ociSpec "github.com/opencontainers/image-spec/specs-go/v1" "github.com/sirupsen/logrus" ) // PullOptions allows for custommizing image pulls. type PullOptions struct { CopyOptions // If true, all tags of the image will be pulled from the container // registry. Only supported for the docker transport. AllTags bool } // Pull pulls the specified name. Name may refer to any of the supported // transports from github.com/containers/image. If no transport is encoded, // name will be treated as a reference to a registry (i.e., docker transport). // // Note that pullPolicy is only used when pulling from a container registry but // it *must* be different than the default value `config.PullPolicyUnsupported`. This // way, callers are forced to decide on the pull behaviour. The reasoning // behind is that some (commands of some) tools have different default pull // policies (e.g., buildah-bud versus podman-build). Making the pull-policy // choice explicit is an attempt to prevent silent regressions. // // The error is storage.ErrImageUnknown iff the pull policy is set to "never" // and no local image has been found. This allows for an easier integration // into some users of this package (e.g., Buildah). func (r *Runtime) Pull(ctx context.Context, name string, pullPolicy config.PullPolicy, options *PullOptions) ([]*Image, error) { logrus.Debugf("Pulling image %s (policy: %s)", name, pullPolicy) if options == nil { options = &PullOptions{} } var possiblyUnqualifiedName string // used for short-name resolution ref, err := alltransports.ParseImageName(name) if err != nil { // Check whether `name` points to a transport. If so, we // return the error. Otherwise we assume that `name` refers to // an image on a registry (e.g., "fedora"). // // NOTE: the `docker` transport is an exception to support a // `pull docker:latest` which would otherwise return an error. if t := alltransports.TransportFromImageName(name); t != nil && t.Name() != registryTransport.Transport.Name() { return nil, err } // If the image clearly refers to a local one, we can look it up directly. // In fact, we need to since they are not parseable. if strings.HasPrefix(name, "sha256:") || (len(name) == 64 && !strings.ContainsAny(name, "/.:@")) { if pullPolicy == config.PullPolicyAlways { return nil, fmt.Errorf("pull policy is always but image has been referred to by ID (%s)", name) } local, _, err := r.LookupImage(name, nil) if err != nil { return nil, err } return []*Image{local}, err } // Docker compat: strip off the tag iff name is tagged and digested // (e.g., fedora:latest@sha256...). In that case, the tag is stripped // off and entirely ignored. The digest is the sole source of truth. normalizedName, normalizeError := normalizeTaggedDigestedString(name) if normalizeError != nil { return nil, normalizeError } name = normalizedName // If the input does not include a transport assume it refers // to a registry. dockerRef, dockerErr := alltransports.ParseImageName("docker://" + name) if dockerErr != nil { return nil, err } ref = dockerRef possiblyUnqualifiedName = name } else if ref.Transport().Name() == registryTransport.Transport.Name() { // Normalize the input if we're referring to the docker // transport directly. That makes sure that a `docker://fedora` // will resolve directly to `docker.io/library/fedora:latest` // and not be subject to short-name resolution. named := ref.DockerReference() if named == nil { return nil, errors.New("internal error: unexpected nil reference") } possiblyUnqualifiedName = named.String() } if options.AllTags && ref.Transport().Name() != registryTransport.Transport.Name() { return nil, fmt.Errorf("pulling all tags is not supported for %s transport", ref.Transport().Name()) } if r.eventChannel != nil { defer r.writeEvent(&Event{ID: "", Name: name, Time: time.Now(), Type: EventTypeImagePull}) } // Some callers may set the platform via the system context at creation // time of the runtime. We need this information to decide whether we // need to enforce pulling from a registry (see // containers/podman/issues/10682). if options.Architecture == "" { options.Architecture = r.systemContext.ArchitectureChoice } if options.OS == "" { options.OS = r.systemContext.OSChoice } if options.Variant == "" { options.Variant = r.systemContext.VariantChoice } var ( pulledImages []string pullError error ) // Dispatch the copy operation. switch ref.Transport().Name() { // DOCKER REGISTRY case registryTransport.Transport.Name(): pulledImages, pullError = r.copyFromRegistry(ctx, ref, possiblyUnqualifiedName, pullPolicy, options) // DOCKER ARCHIVE case dockerArchiveTransport.Transport.Name(): pulledImages, pullError = r.copyFromDockerArchive(ctx, ref, &options.CopyOptions) // ALL OTHER TRANSPORTS default: pulledImages, pullError = r.copyFromDefault(ctx, ref, &options.CopyOptions) } if pullError != nil { return nil, pullError } localImages := []*Image{} for _, name := range pulledImages { image, _, err := r.LookupImage(name, nil) if err != nil { return nil, fmt.Errorf("locating pulled image %q name in containers storage: %w", name, err) } // Note that we can ignore the 2nd return value here. Some // images may ship with "wrong" platform, but we already warn // about it. Throwing an error is not (yet) the plan. matchError, _, err := image.matchesPlatform(ctx, options.OS, options.Architecture, options.Variant) if err != nil { return nil, fmt.Errorf("checking platform of image %s: %w", name, err) } // If the image does not match the expected/requested platform, // make sure to leave some breadcrumbs for the user. if matchError != nil { if options.Writer == nil { logrus.Warnf("%v", matchError) } else { fmt.Fprintf(options.Writer, "WARNING: %v\n", matchError) } } localImages = append(localImages, image) } return localImages, pullError } // nameFromAnnotations returns a reference string to be used as an image name, // or an empty string. The annotations map may be nil. func nameFromAnnotations(annotations map[string]string) string { if annotations == nil { return "" } // buildkit/containerd are using a custom annotation see // containers/podman/issues/12560. if annotations["io.containerd.image.name"] != "" { return annotations["io.containerd.image.name"] } return annotations[ociSpec.AnnotationRefName] } // copyFromDefault is the default copier for a number of transports. Other // transports require some specific dancing, sometimes Yoga. func (r *Runtime) copyFromDefault(ctx context.Context, ref types.ImageReference, options *CopyOptions) ([]string, error) { c, err := r.newCopier(options) if err != nil { return nil, err } defer c.close() // Figure out a name for the storage destination. var storageName, imageName string switch ref.Transport().Name() { case dockerDaemonTransport.Transport.Name(): // Normalize to docker.io if needed (see containers/podman/issues/10998). named, err := reference.ParseNormalizedNamed(ref.StringWithinTransport()) if err != nil { return nil, err } imageName = named.String() storageName = imageName case ociTransport.Transport.Name(): split := strings.SplitN(ref.StringWithinTransport(), ":", 2) storageName = toLocalImageName(split[0]) imageName = storageName case ociArchiveTransport.Transport.Name(): manifestDescriptor, err := ociArchiveTransport.LoadManifestDescriptorWithContext(r.SystemContext(), ref) if err != nil { return nil, err } storageName = nameFromAnnotations(manifestDescriptor.Annotations) switch len(storageName) { case 0: // If there's no reference name in the annotations, compute an ID. storageName, err = getImageID(ctx, ref, nil) if err != nil { return nil, err } imageName = "sha256:" + storageName[1:] default: named, err := NormalizeName(storageName) if err != nil { return nil, err } imageName = named.String() storageName = imageName } case storageTransport.Transport.Name(): storageName = ref.StringWithinTransport() named := ref.DockerReference() if named == nil { return nil, fmt.Errorf("could not get an image name for storage reference %q", ref) } imageName = named.String() default: // Path-based transports (e.g., dir) may include invalid // characters, so we should pessimistically generate an ID // instead of looking at the StringWithinTransport(). storageName, err = getImageID(ctx, ref, nil) if err != nil { return nil, err } imageName = "sha256:" + storageName[1:] } // Create a storage reference. destRef, err := storageTransport.Transport.ParseStoreReference(r.store, storageName) if err != nil { return nil, fmt.Errorf("parsing %q: %w", storageName, err) } _, err = c.copy(ctx, ref, destRef) return []string{imageName}, err } // storageReferencesFromArchiveReader returns a slice of image references inside the // archive reader. A docker archive may include more than one image and this // method allows for extracting them into containers storage references which // can later be used from copying. func (r *Runtime) storageReferencesReferencesFromArchiveReader(ctx context.Context, readerRef types.ImageReference, reader *dockerArchiveTransport.Reader) ([]types.ImageReference, []string, error) { destNames, err := reader.ManifestTagsForReference(readerRef) if err != nil { return nil, nil, err } var imageNames []string if len(destNames) == 0 { destName, err := getImageID(ctx, readerRef, &r.systemContext) if err != nil { return nil, nil, err } destNames = append(destNames, destName) // Make sure the image can be loaded after the pull by // replacing the @ with sha256:. imageNames = append(imageNames, "sha256:"+destName[1:]) } else { for i := range destNames { ref, err := NormalizeName(destNames[i]) if err != nil { return nil, nil, err } destNames[i] = ref.String() } imageNames = destNames } references := []types.ImageReference{} for _, destName := range destNames { destRef, err := storageTransport.Transport.ParseStoreReference(r.store, destName) if err != nil { return nil, nil, fmt.Errorf("parsing dest reference name %#v: %w", destName, err) } references = append(references, destRef) } return references, imageNames, nil } // copyFromDockerArchive copies one image from the specified reference. func (r *Runtime) copyFromDockerArchive(ctx context.Context, ref types.ImageReference, options *CopyOptions) ([]string, error) { // There may be more than one image inside the docker archive, so we // need a quick glimpse inside. reader, readerRef, err := dockerArchiveTransport.NewReaderForReference(&r.systemContext, ref) if err != nil { return nil, err } defer func() { if err := reader.Close(); err != nil { logrus.Errorf("Closing reader of docker archive: %v", err) } }() return r.copyFromDockerArchiveReaderReference(ctx, reader, readerRef, options) } // copyFromDockerArchiveReaderReference copies the specified readerRef from reader. func (r *Runtime) copyFromDockerArchiveReaderReference(ctx context.Context, reader *dockerArchiveTransport.Reader, readerRef types.ImageReference, options *CopyOptions) ([]string, error) { c, err := r.newCopier(options) if err != nil { return nil, err } defer c.close() // Get a slice of storage references we can copy. references, destNames, err := r.storageReferencesReferencesFromArchiveReader(ctx, readerRef, reader) if err != nil { return nil, err } // Now copy all of the images. Use readerRef for performance. for _, destRef := range references { if _, err := c.copy(ctx, readerRef, destRef); err != nil { return nil, err } } return destNames, nil } // copyFromRegistry pulls the specified, possibly unqualified, name from a // registry. On successful pull it returns the ID of the image in local // storage. // // If options.All is set, all tags from the specified registry will be pulled. func (r *Runtime) copyFromRegistry(ctx context.Context, ref types.ImageReference, inputName string, pullPolicy config.PullPolicy, options *PullOptions) ([]string, error) { // Sanity check. if err := pullPolicy.Validate(); err != nil { return nil, err } if !options.AllTags { return r.copySingleImageFromRegistry(ctx, inputName, pullPolicy, options) } // Copy all tags named := reference.TrimNamed(ref.DockerReference()) tags, err := registryTransport.GetRepositoryTags(ctx, &r.systemContext, ref) if err != nil { return nil, err } pulledIDs := []string{} for _, tag := range tags { select { // Let's be gentle with Podman remote. case <-ctx.Done(): return nil, fmt.Errorf("pulling cancelled") default: // We can continue. } tagged, err := reference.WithTag(named, tag) if err != nil { return nil, fmt.Errorf("creating tagged reference (name %s, tag %s): %w", named.String(), tag, err) } pulled, err := r.copySingleImageFromRegistry(ctx, tagged.String(), pullPolicy, options) if err != nil { return nil, err } pulledIDs = append(pulledIDs, pulled...) } return pulledIDs, nil } // imageIDsForManifest() parses the manifest of the copied image and then looks // up the IDs of the matching image. There's a small slice of time, between // when we copy the image into local storage and when we go to look for it // using the name that we gave it when we copied it, when the name we wanted to // assign to the image could have been moved, but the image's ID will remain // the same until it is deleted. func (r *Runtime) imagesIDsForManifest(manifestBytes []byte, sys *types.SystemContext) ([]string, error) { var imageDigest digest.Digest manifestType := manifest.GuessMIMEType(manifestBytes) if manifest.MIMETypeIsMultiImage(manifestType) { list, err := manifest.ListFromBlob(manifestBytes, manifestType) if err != nil { return nil, fmt.Errorf("parsing manifest list: %w", err) } d, err := list.ChooseInstance(sys) if err != nil { return nil, fmt.Errorf("choosing instance from manifest list: %w", err) } imageDigest = d } else { d, err := manifest.Digest(manifestBytes) if err != nil { return nil, fmt.Errorf("digesting manifest") } imageDigest = d } images, err := r.store.ImagesByDigest(imageDigest) if err != nil { return nil, fmt.Errorf("listing images by manifest digest: %w", err) } results := make([]string, 0, len(images)) for _, image := range images { results = append(results, image.ID) } if len(results) == 0 { return nil, fmt.Errorf("identifying new image by manifest digest: %w", storage.ErrImageUnknown) } return results, nil } // copySingleImageFromRegistry pulls the specified, possibly unqualified, name // from a registry. On successful pull it returns the ID of the image in local // storage. func (r *Runtime) copySingleImageFromRegistry(ctx context.Context, imageName string, pullPolicy config.PullPolicy, options *PullOptions) ([]string, error) { //nolint:gocyclo // Sanity check. if err := pullPolicy.Validate(); err != nil { return nil, err } var ( localImage *Image resolvedImageName string err error ) // Always check if there's a local image. If so, we should use its // resolved name for pulling. Assume we're doing a `pull foo`. // If there's already a local image "localhost/foo", then we should // attempt pulling that instead of doing the full short-name dance. // // NOTE that we only do platform checks if the specified values differ // from the local platform. Unfortunately, there are many images used // in the wild which don't set the correct value(s) in the config // causing various issues such as containers/podman/issues/10682. lookupImageOptions := &LookupImageOptions{Variant: options.Variant} if options.Architecture != runtime.GOARCH { lookupImageOptions.Architecture = options.Architecture } if options.OS != runtime.GOOS { lookupImageOptions.OS = options.OS } localImage, resolvedImageName, err = r.LookupImage(imageName, lookupImageOptions) if err != nil && !errors.Is(err, storage.ErrImageUnknown) { logrus.Errorf("Looking up %s in local storage: %v", imageName, err) } // If the local image is corrupted, we need to repull it. if localImage != nil { if err := localImage.isCorrupted(imageName); err != nil { logrus.Error(err) localImage = nil } } customPlatform := len(options.Architecture)+len(options.OS)+len(options.Variant) > 0 if customPlatform && pullPolicy != config.PullPolicyAlways && pullPolicy != config.PullPolicyNever { // Unless the pull policy is always/never, we must // pessimistically assume that the local image has an invalid // architecture (see containers/podman/issues/10682). Hence, // whenever the user requests a custom platform, set the pull // policy to "newer" to make sure we're pulling down the // correct image. // // NOTE that this is will even override --pull={false,never}. pullPolicy = config.PullPolicyNewer logrus.Debugf("Enforcing pull policy to %q to pull custom platform (arch: %q, os: %q, variant: %q) - local image may mistakenly specify wrong platform", pullPolicy, options.Architecture, options.OS, options.Variant) } if pullPolicy == config.PullPolicyNever { if localImage != nil { logrus.Debugf("Pull policy %q and %s resolved to local image %s", pullPolicy, imageName, resolvedImageName) return []string{resolvedImageName}, nil } logrus.Debugf("Pull policy %q but no local image has been found for %s", pullPolicy, imageName) return nil, fmt.Errorf("%s: %w", imageName, storage.ErrImageUnknown) } if pullPolicy == config.PullPolicyMissing && localImage != nil { return []string{resolvedImageName}, nil } // If we looked up the image by ID, we cannot really pull from anywhere. if localImage != nil && strings.HasPrefix(localImage.ID(), imageName) { switch pullPolicy { case config.PullPolicyAlways: return nil, fmt.Errorf("pull policy is always but image has been referred to by ID (%s)", imageName) default: return []string{resolvedImageName}, nil } } // If we found a local image, we should use its locally resolved name // (see containers/buildah/issues/2904). An exception is if a custom // platform is specified (e.g., `--arch=arm64`). In that case, we need // to pessimistically pull the image since some images declare wrong // platforms making platform checks absolutely unreliable (see // containers/podman/issues/10682). // // In other words: multi-arch support can only be as good as the images // in the wild, so we shouldn't break things for our users by trying to // insist that they make sense. if localImage != nil && !customPlatform { if imageName != resolvedImageName { logrus.Debugf("Image %s resolved to local image %s which will be used for pulling", imageName, resolvedImageName) } imageName = resolvedImageName } sys := r.systemContextCopy() resolved, err := shortnames.Resolve(sys, imageName) if err != nil { if localImage != nil && pullPolicy == config.PullPolicyNewer { return []string{resolvedImageName}, nil } return nil, err } // NOTE: Below we print the description from the short-name resolution. // In theory we could print it here. In practice, however, this is // causing a hard time for Buildah uses who are doing a `buildah from // image` and expect just the container name to be printed if the image // is present locally. // The pragmatic solution is to only print the description when we found // a _newer_ image that we're about to pull. wroteDesc := false writeDesc := func() error { if wroteDesc { return nil } wroteDesc = true if desc := resolved.Description(); len(desc) > 0 { logrus.Debug(desc) if options.Writer != nil { if _, err := options.Writer.Write([]byte(desc + "\n")); err != nil { return err } } } return nil } c, err := r.newCopier(&options.CopyOptions) if err != nil { return nil, err } defer c.close() var pullErrors []error for _, candidate := range resolved.PullCandidates { candidateString := candidate.Value.String() logrus.Debugf("Attempting to pull candidate %s for %s", candidateString, imageName) srcRef, err := registryTransport.NewReference(candidate.Value) if err != nil { return nil, err } if pullPolicy == config.PullPolicyNewer && localImage != nil { isNewer, err := localImage.hasDifferentDigestWithSystemContext(ctx, srcRef, c.systemContext) if err != nil { pullErrors = append(pullErrors, err) continue } if !isNewer { logrus.Debugf("Skipping pull candidate %s as the image is not newer (pull policy %s)", candidateString, pullPolicy) continue } } destRef, err := storageTransport.Transport.ParseStoreReference(r.store, candidate.Value.String()) if err != nil { return nil, err } if err := writeDesc(); err != nil { return nil, err } if options.Writer != nil { if _, err := io.WriteString(options.Writer, fmt.Sprintf("Trying to pull %s...\n", candidateString)); err != nil { return nil, err } } var manifestBytes []byte if manifestBytes, err = c.copy(ctx, srcRef, destRef); err != nil { logrus.Debugf("Error pulling candidate %s: %v", candidateString, err) pullErrors = append(pullErrors, err) continue } if err := candidate.Record(); err != nil { // Only log the recording errors. Podman has seen // reports where users set most of the system to // read-only which can cause issues. logrus.Errorf("Error recording short-name alias %q: %v", candidateString, err) } logrus.Debugf("Pulled candidate %s successfully", candidateString) if ids, err := r.imagesIDsForManifest(manifestBytes, sys); err == nil { return ids, nil } return []string{candidate.Value.String()}, nil } if localImage != nil && pullPolicy == config.PullPolicyNewer { return []string{resolvedImageName}, nil } if len(pullErrors) == 0 { return nil, fmt.Errorf("internal error: no image pulled (pull policy %s)", pullPolicy) } return nil, resolved.FormatPullErrors(pullErrors) }