2016-04-27 18:49:01 +00:00
|
|
|
package storage
|
2016-01-19 22:26:15 +00:00
|
|
|
|
|
|
|
import (
|
2017-08-11 22:31:16 +00:00
|
|
|
"context"
|
2016-01-19 22:26:15 +00:00
|
|
|
"fmt"
|
|
|
|
|
2020-08-24 11:18:39 +00:00
|
|
|
"github.com/distribution/distribution/v3"
|
|
|
|
"github.com/distribution/distribution/v3/registry/storage/driver"
|
2023-08-30 15:50:56 +00:00
|
|
|
"github.com/distribution/reference"
|
2016-12-17 00:28:34 +00:00
|
|
|
"github.com/opencontainers/go-digest"
|
2016-01-19 22:26:15 +00:00
|
|
|
)
|
|
|
|
|
2016-03-24 23:03:25 +00:00
|
|
|
// emit prints a formatted progress line to standard output, appending a
// trailing newline to the supplied format string.
func emit(format string, a ...interface{}) {
	line := format + "\n"
	fmt.Printf(line, a...)
}
|
|
|
|
|
2017-06-06 08:02:47 +00:00
|
|
|
// GCOpts contains the options that control a garbage collection run
// performed by MarkAndSweep.
type GCOpts struct {
	// DryRun, when true, makes MarkAndSweep report what is eligible for
	// deletion without removing any manifest or blob.
	DryRun bool

	// RemoveUntagged, when true, makes MarkAndSweep treat manifests for
	// which no tag is found as deletion candidates instead of marking them.
	RemoveUntagged bool
}
|
|
|
|
|
|
|
|
// ManifestDel contains manifest structure which will be deleted
|
|
|
|
type ManifestDel struct {
|
|
|
|
Name string
|
|
|
|
Digest digest.Digest
|
|
|
|
Tags []string
|
|
|
|
}
|
|
|
|
|
2016-04-27 18:49:01 +00:00
|
|
|
// MarkAndSweep performs a mark and sweep of registry data
|
2017-06-06 08:02:47 +00:00
|
|
|
func MarkAndSweep(ctx context.Context, storageDriver driver.StorageDriver, registry distribution.Namespace, opts GCOpts) error {
|
2016-01-19 22:26:15 +00:00
|
|
|
repositoryEnumerator, ok := registry.(distribution.RepositoryEnumerator)
|
|
|
|
if !ok {
|
2016-03-30 18:35:24 +00:00
|
|
|
return fmt.Errorf("unable to convert Namespace to RepositoryEnumerator")
|
2016-01-19 22:26:15 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// mark
|
|
|
|
markSet := make(map[digest.Digest]struct{})
|
2017-06-06 08:02:47 +00:00
|
|
|
manifestArr := make([]ManifestDel, 0)
|
2016-03-24 23:03:25 +00:00
|
|
|
err := repositoryEnumerator.Enumerate(ctx, func(repoName string) error {
|
2016-10-13 15:04:19 +00:00
|
|
|
emit(repoName)
|
2016-03-23 23:42:50 +00:00
|
|
|
|
2016-01-19 22:26:15 +00:00
|
|
|
var err error
|
2017-01-14 01:06:03 +00:00
|
|
|
named, err := reference.WithName(repoName)
|
2016-01-19 22:26:15 +00:00
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to parse repo name %s: %v", repoName, err)
|
|
|
|
}
|
|
|
|
repository, err := registry.Repository(ctx, named)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to construct repository: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
manifestService, err := repository.Manifests(ctx)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to construct manifest service: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
manifestEnumerator, ok := manifestService.(distribution.ManifestEnumerator)
|
|
|
|
if !ok {
|
2016-03-30 18:35:24 +00:00
|
|
|
return fmt.Errorf("unable to convert ManifestService into ManifestEnumerator")
|
2016-01-19 22:26:15 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
err = manifestEnumerator.Enumerate(ctx, func(dgst digest.Digest) error {
|
2017-06-06 08:02:47 +00:00
|
|
|
if opts.RemoveUntagged {
|
|
|
|
// fetch all tags where this manifest is the latest one
|
|
|
|
tags, err := repository.Tags(ctx).Lookup(ctx, distribution.Descriptor{Digest: dgst})
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to retrieve tags for digest %v: %v", dgst, err)
|
|
|
|
}
|
|
|
|
if len(tags) == 0 {
|
|
|
|
// fetch all tags from repository
|
|
|
|
// all of these tags could contain manifest in history
|
|
|
|
// which means that we need check (and delete) those references when deleting manifest
|
|
|
|
allTags, err := repository.Tags(ctx).All(ctx)
|
|
|
|
if err != nil {
|
2024-02-24 17:08:17 +00:00
|
|
|
if _, ok := err.(distribution.ErrManifestUnknownRevision); !ok {
|
|
|
|
return nil
|
|
|
|
}
|
2017-06-06 08:02:47 +00:00
|
|
|
return fmt.Errorf("failed to retrieve tags %v", err)
|
|
|
|
}
|
|
|
|
manifestArr = append(manifestArr, ManifestDel{Name: repoName, Digest: dgst, Tags: allTags})
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
2016-03-24 23:03:25 +00:00
|
|
|
// Mark the manifest's blob
|
2016-10-13 15:04:19 +00:00
|
|
|
emit("%s: marking manifest %s ", repoName, dgst)
|
2016-01-19 22:26:15 +00:00
|
|
|
markSet[dgst] = struct{}{}
|
|
|
|
|
2024-02-24 17:08:17 +00:00
|
|
|
return markManifestReferences(dgst, manifestService, ctx, func(d digest.Digest) bool {
|
|
|
|
_, marked := markSet[d]
|
|
|
|
if !marked {
|
|
|
|
markSet[d] = struct{}{}
|
|
|
|
emit("%s: marking blob %s", repoName, d)
|
|
|
|
}
|
|
|
|
return marked
|
|
|
|
})
|
2016-01-19 22:26:15 +00:00
|
|
|
})
|
|
|
|
|
2019-02-05 00:42:44 +00:00
|
|
|
// In certain situations such as unfinished uploads, deleting all
|
|
|
|
// tags in S3 or removing the _manifests folder manually, this
|
|
|
|
// error may be of type PathNotFound.
|
|
|
|
//
|
|
|
|
// In these cases we can continue marking other manifests safely.
|
|
|
|
if _, ok := err.(driver.PathNotFoundError); ok {
|
|
|
|
return nil
|
2016-04-26 04:14:00 +00:00
|
|
|
}
|
|
|
|
|
2016-01-19 22:26:15 +00:00
|
|
|
return err
|
|
|
|
})
|
|
|
|
if err != nil {
|
2016-11-14 22:03:01 +00:00
|
|
|
return fmt.Errorf("failed to mark: %v", err)
|
2016-01-19 22:26:15 +00:00
|
|
|
}
|
|
|
|
|
2024-02-24 17:08:17 +00:00
|
|
|
manifestArr = unmarkReferencedManifest(manifestArr, markSet)
|
|
|
|
|
2016-01-19 22:26:15 +00:00
|
|
|
// sweep
|
2017-06-06 08:02:47 +00:00
|
|
|
vacuum := NewVacuum(ctx, storageDriver)
|
|
|
|
if !opts.DryRun {
|
|
|
|
for _, obj := range manifestArr {
|
|
|
|
err = vacuum.RemoveManifest(obj.Name, obj.Digest, obj.Tags)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to delete manifest %s: %v", obj.Digest, err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2016-01-19 22:26:15 +00:00
|
|
|
blobService := registry.Blobs()
|
|
|
|
deleteSet := make(map[digest.Digest]struct{})
|
|
|
|
err = blobService.Enumerate(ctx, func(dgst digest.Digest) error {
|
|
|
|
// check if digest is in markSet. If not, delete it!
|
|
|
|
if _, ok := markSet[dgst]; !ok {
|
|
|
|
deleteSet[dgst] = struct{}{}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
2016-03-30 18:35:24 +00:00
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("error enumerating blobs: %v", err)
|
|
|
|
}
|
2017-06-06 08:02:47 +00:00
|
|
|
emit("\n%d blobs marked, %d blobs and %d manifests eligible for deletion", len(markSet), len(deleteSet), len(manifestArr))
|
2016-01-19 22:26:15 +00:00
|
|
|
for dgst := range deleteSet {
|
2016-10-13 15:04:19 +00:00
|
|
|
emit("blob eligible for deletion: %s", dgst)
|
2017-06-06 08:02:47 +00:00
|
|
|
if opts.DryRun {
|
2016-03-23 23:42:50 +00:00
|
|
|
continue
|
|
|
|
}
|
2016-01-19 22:26:15 +00:00
|
|
|
err = vacuum.RemoveBlob(string(dgst))
|
|
|
|
if err != nil {
|
2016-11-14 22:03:01 +00:00
|
|
|
return fmt.Errorf("failed to delete blob %s: %v", dgst, err)
|
2016-01-19 22:26:15 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
2024-02-24 17:08:17 +00:00
|
|
|
|
|
|
|
// unmarkReferencedManifest filters out manifest present in markSet
|
|
|
|
func unmarkReferencedManifest(manifestArr []ManifestDel, markSet map[digest.Digest]struct{}) []ManifestDel {
|
|
|
|
filtered := make([]ManifestDel, 0)
|
|
|
|
for _, obj := range manifestArr {
|
|
|
|
if _, ok := markSet[obj.Digest]; !ok {
|
|
|
|
emit("manifest eligible for deletion: %s", obj)
|
|
|
|
filtered = append(filtered, obj)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return filtered
|
|
|
|
}
|
|
|
|
|
|
|
|
// markManifestReferences marks the manifest references
|
|
|
|
func markManifestReferences(dgst digest.Digest, manifestService distribution.ManifestService, ctx context.Context, ingester func(digest.Digest) bool) error {
|
|
|
|
manifest, err := manifestService.Get(ctx, dgst)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to retrieve manifest for digest %v: %v", dgst, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
descriptors := manifest.References()
|
|
|
|
for _, descriptor := range descriptors {
|
|
|
|
|
|
|
|
// do not visit references if already marked
|
|
|
|
if ingester(descriptor.Digest) {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
if ok, _ := manifestService.Exists(ctx, descriptor.Digest); ok {
|
|
|
|
err := markManifestReferences(descriptor.Digest, manifestService, ctx, ingester)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|