2022-09-30 12:35:16 -05:00
|
|
|
package storage
|
|
|
|
|
|
|
|
import (
|
2023-07-13 11:31:39 -05:00
|
|
|
"bytes"
|
2023-09-05 11:48:56 -05:00
|
|
|
"context"
|
2022-09-30 12:35:16 -05:00
|
|
|
"encoding/json"
|
2022-11-15 01:21:49 -05:00
|
|
|
"errors"
|
2023-08-23 12:59:52 -05:00
|
|
|
"fmt"
|
2023-11-01 11:09:21 -05:00
|
|
|
"math/rand"
|
2022-09-30 12:35:16 -05:00
|
|
|
"path"
|
|
|
|
"strings"
|
2023-11-01 11:09:21 -05:00
|
|
|
"time"
|
2022-09-30 12:35:16 -05:00
|
|
|
|
2023-09-01 12:54:39 -05:00
|
|
|
"github.com/docker/distribution/registry/storage/driver"
|
2022-09-30 12:35:16 -05:00
|
|
|
godigest "github.com/opencontainers/go-digest"
|
2023-07-13 11:31:39 -05:00
|
|
|
"github.com/opencontainers/image-spec/schema"
|
2022-11-15 01:21:49 -05:00
|
|
|
imeta "github.com/opencontainers/image-spec/specs-go"
|
2022-09-30 12:35:16 -05:00
|
|
|
ispec "github.com/opencontainers/image-spec/specs-go/v1"
|
2022-10-20 11:39:20 -05:00
|
|
|
|
2024-01-31 23:34:07 -05:00
|
|
|
zerr "zotregistry.dev/zot/errors"
|
|
|
|
zcommon "zotregistry.dev/zot/pkg/common"
|
|
|
|
"zotregistry.dev/zot/pkg/extensions/monitoring"
|
|
|
|
zlog "zotregistry.dev/zot/pkg/log"
|
|
|
|
"zotregistry.dev/zot/pkg/scheduler"
|
|
|
|
storageConstants "zotregistry.dev/zot/pkg/storage/constants"
|
|
|
|
storageTypes "zotregistry.dev/zot/pkg/storage/types"
|
2023-05-10 12:15:33 -05:00
|
|
|
)
|
|
|
|
|
2023-08-19 00:52:03 -05:00
|
|
|
// manifestWithEmptyLayersErrMsg is the schema-validation message fragment that
// IsEmptyLayersError searches for to recognise a manifest with no layers.
const manifestWithEmptyLayersErrMsg = "layers: Array must have at least 1 items"

// cosignSignatureTagSuffix is the tag suffix IsSignature looks for, together
// with the "sha256-" prefix, to recognise a cosign signature tag.
const cosignSignatureTagSuffix = "sig"
|
2023-07-13 11:31:39 -05:00
|
|
|
|
2022-09-30 12:35:16 -05:00
|
|
|
func GetTagsByIndex(index ispec.Index) []string {
|
|
|
|
tags := make([]string, 0)
|
|
|
|
|
|
|
|
for _, manifest := range index.Manifests {
|
|
|
|
v, ok := manifest.Annotations[ispec.AnnotationRefName]
|
|
|
|
if ok {
|
|
|
|
tags = append(tags, v)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return tags
|
|
|
|
}
|
|
|
|
|
|
|
|
func GetManifestDescByReference(index ispec.Index, reference string) (ispec.Descriptor, bool) {
|
|
|
|
var manifestDesc ispec.Descriptor
|
|
|
|
|
|
|
|
for _, manifest := range index.Manifests {
|
|
|
|
if reference == manifest.Digest.String() {
|
|
|
|
return manifest, true
|
|
|
|
}
|
|
|
|
|
|
|
|
v, ok := manifest.Annotations[ispec.AnnotationRefName]
|
|
|
|
if ok && v == reference {
|
|
|
|
return manifest, true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return manifestDesc, false
|
|
|
|
}
|
|
|
|
|
2023-05-26 13:08:19 -05:00
|
|
|
func ValidateManifest(imgStore storageTypes.ImageStore, repo, reference, mediaType string, body []byte,
|
2023-09-01 12:54:39 -05:00
|
|
|
log zlog.Logger,
|
2024-07-19 11:56:31 -05:00
|
|
|
) error {
|
2022-09-30 12:35:16 -05:00
|
|
|
// validate the manifest
|
|
|
|
if !IsSupportedMediaType(mediaType) {
|
|
|
|
log.Debug().Interface("actual", mediaType).
|
|
|
|
Msg("bad manifest media type")
|
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return zerr.ErrBadManifest
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
if len(body) == 0 {
|
|
|
|
log.Debug().Int("len", len(body)).Msg("invalid body length")
|
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return zerr.ErrBadManifest
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
|
2022-11-08 03:38:16 -05:00
|
|
|
switch mediaType {
|
|
|
|
case ispec.MediaTypeImageManifest:
|
2022-09-30 12:35:16 -05:00
|
|
|
var manifest ispec.Manifest
|
2023-07-13 11:31:39 -05:00
|
|
|
|
|
|
|
// validate manifest
|
|
|
|
if err := ValidateManifestSchema(body); err != nil {
|
2023-12-08 03:05:02 -05:00
|
|
|
log.Error().Err(err).Msg("failed to validate OCIv1 image manifest schema")
|
2023-07-13 11:31:39 -05:00
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return zerr.NewError(zerr.ErrBadManifest).AddDetail("jsonSchemaValidation", err.Error())
|
2023-07-13 11:31:39 -05:00
|
|
|
}
|
|
|
|
|
2022-09-30 12:35:16 -05:00
|
|
|
if err := json.Unmarshal(body, &manifest); err != nil {
|
2023-12-08 03:05:02 -05:00
|
|
|
log.Error().Err(err).Msg("failed to unmarshal JSON")
|
2022-09-30 12:35:16 -05:00
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return zerr.ErrBadManifest
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
|
2023-09-02 03:28:31 -05:00
|
|
|
// validate blobs only for known media types
|
|
|
|
if manifest.Config.MediaType == ispec.MediaTypeImageConfig ||
|
|
|
|
manifest.Config.MediaType == ispec.MediaTypeEmptyJSON {
|
|
|
|
// validate config blob - a lightweight check if the blob is present
|
|
|
|
ok, _, _, err := imgStore.StatBlob(repo, manifest.Config.Digest)
|
|
|
|
if !ok || err != nil {
|
2023-12-08 03:05:02 -05:00
|
|
|
log.Error().Err(err).Str("digest", manifest.Config.Digest.String()).
|
|
|
|
Msg("failed to stat blob due to missing config blob")
|
2023-09-02 03:28:31 -05:00
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return zerr.ErrBadManifest
|
2023-09-02 03:28:31 -05:00
|
|
|
}
|
|
|
|
|
2023-07-13 11:31:39 -05:00
|
|
|
// validate layers - a lightweight check if the blob is present
|
|
|
|
for _, layer := range manifest.Layers {
|
|
|
|
if IsNonDistributable(layer.MediaType) {
|
|
|
|
log.Debug().Str("digest", layer.Digest.String()).Str("mediaType", layer.MediaType).
|
|
|
|
Msg("skip checking non-distributable layer exists")
|
2022-09-30 12:35:16 -05:00
|
|
|
|
2023-07-13 11:31:39 -05:00
|
|
|
continue
|
|
|
|
}
|
2022-11-08 03:38:16 -05:00
|
|
|
|
2023-09-01 12:54:39 -05:00
|
|
|
ok, _, _, err := imgStore.StatBlob(repo, layer.Digest)
|
2023-07-13 11:31:39 -05:00
|
|
|
if !ok || err != nil {
|
2023-12-08 03:05:02 -05:00
|
|
|
log.Error().Err(err).Str("digest", layer.Digest.String()).
|
|
|
|
Msg("failed to validate manifest due to missing layer blob")
|
2022-11-08 03:38:16 -05:00
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return zerr.ErrBadManifest
|
2023-07-13 11:31:39 -05:00
|
|
|
}
|
2022-11-08 03:38:16 -05:00
|
|
|
}
|
|
|
|
}
|
2023-07-13 11:31:39 -05:00
|
|
|
case ispec.MediaTypeImageIndex:
|
|
|
|
// validate manifest
|
|
|
|
if err := ValidateImageIndexSchema(body); err != nil {
|
2023-12-08 03:05:02 -05:00
|
|
|
log.Error().Err(err).Msg("failed to validate OCIv1 image index manifest schema")
|
2022-09-30 12:35:16 -05:00
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return zerr.NewError(zerr.ErrBadManifest).AddDetail("jsonSchemaValidation", err.Error())
|
2023-07-13 11:31:39 -05:00
|
|
|
}
|
2022-09-30 12:35:16 -05:00
|
|
|
|
2023-07-13 11:31:39 -05:00
|
|
|
var indexManifest ispec.Index
|
|
|
|
if err := json.Unmarshal(body, &indexManifest); err != nil {
|
2023-12-08 03:05:02 -05:00
|
|
|
log.Error().Err(err).Msg("failed to unmarshal JSON")
|
2023-05-01 14:49:41 -05:00
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return zerr.ErrBadManifest
|
2023-05-01 14:49:41 -05:00
|
|
|
}
|
|
|
|
|
2023-07-13 11:31:39 -05:00
|
|
|
for _, manifest := range indexManifest.Manifests {
|
2023-09-01 12:54:39 -05:00
|
|
|
if ok, _, _, err := imgStore.StatBlob(repo, manifest.Digest); !ok || err != nil {
|
2023-12-08 03:05:02 -05:00
|
|
|
log.Error().Err(err).Str("digest", manifest.Digest.String()).
|
|
|
|
Msg("failed to stat manifest due to missing manifest blob")
|
2023-07-13 11:31:39 -05:00
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return zerr.ErrBadManifest
|
2023-07-13 11:31:39 -05:00
|
|
|
}
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return nil
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
// Returns the canonical digest or the digest provided by the reference if any
|
|
|
|
// Per spec, the canonical digest would always be returned to the client in
|
|
|
|
// request headers, but that does not make sense if the client requested a different digest algorithm
|
|
|
|
// See https://github.com/opencontainers/distribution-spec/issues/494
|
|
|
|
func GetAndValidateRequestDigest(body []byte, reference string, log zlog.Logger) (
|
|
|
|
godigest.Digest, error,
|
|
|
|
) {
|
|
|
|
expectedDigest, err := godigest.Parse(reference)
|
|
|
|
if err != nil {
|
|
|
|
// This is a non-digest reference
|
|
|
|
return godigest.Canonical.FromBytes(body), err
|
|
|
|
}
|
2022-09-30 12:35:16 -05:00
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
actualDigest := expectedDigest.Algorithm().FromBytes(body)
|
2022-09-30 12:35:16 -05:00
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
if expectedDigest.String() != actualDigest.String() {
|
|
|
|
log.Error().Str("actual", actualDigest.String()).Str("expected", expectedDigest.String()).
|
|
|
|
Msg("failed to validate manifest digest")
|
|
|
|
|
|
|
|
return actualDigest, zerr.ErrBadManifest
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
|
2024-07-19 11:56:31 -05:00
|
|
|
return actualDigest, nil
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
|
2022-10-05 05:21:14 -05:00
|
|
|
/*
|
2022-11-18 12:35:28 -05:00
|
|
|
CheckIfIndexNeedsUpdate verifies if an index needs to be updated given a new manifest descriptor.
|
2022-10-05 05:21:14 -05:00
|
|
|
|
|
|
|
Returns whether or not index needs update, in the latter case it will also return the previous digest.
|
|
|
|
*/
|
2022-09-30 12:35:16 -05:00
|
|
|
func CheckIfIndexNeedsUpdate(index *ispec.Index, desc *ispec.Descriptor,
|
2023-09-01 12:54:39 -05:00
|
|
|
log zlog.Logger,
|
2022-09-30 12:35:16 -05:00
|
|
|
) (bool, godigest.Digest, error) {
|
|
|
|
var oldDgst godigest.Digest
|
|
|
|
|
|
|
|
var reference string
|
|
|
|
|
|
|
|
tag, ok := desc.Annotations[ispec.AnnotationRefName]
|
|
|
|
if ok {
|
|
|
|
reference = tag
|
|
|
|
} else {
|
|
|
|
reference = desc.Digest.String()
|
|
|
|
}
|
|
|
|
|
|
|
|
updateIndex := true
|
|
|
|
|
|
|
|
for midx, manifest := range index.Manifests {
|
|
|
|
manifest := manifest
|
|
|
|
if reference == manifest.Digest.String() {
|
|
|
|
// nothing changed, so don't update
|
|
|
|
updateIndex = false
|
|
|
|
|
|
|
|
break
|
|
|
|
}
|
|
|
|
|
|
|
|
v, ok := manifest.Annotations[ispec.AnnotationRefName]
|
|
|
|
if ok && v == reference {
|
|
|
|
if manifest.Digest.String() == desc.Digest.String() {
|
|
|
|
// nothing changed, so don't update
|
|
|
|
updateIndex = false
|
|
|
|
|
|
|
|
break
|
|
|
|
}
|
|
|
|
|
|
|
|
// manifest contents have changed for the same tag,
|
|
|
|
// so update index.json descriptor
|
|
|
|
log.Info().
|
|
|
|
Int64("old size", manifest.Size).
|
|
|
|
Int64("new size", desc.Size).
|
|
|
|
Str("old digest", manifest.Digest.String()).
|
|
|
|
Str("new digest", desc.Digest.String()).
|
|
|
|
Str("old mediaType", manifest.MediaType).
|
|
|
|
Str("new mediaType", desc.MediaType).
|
|
|
|
Msg("updating existing tag with new manifest contents")
|
|
|
|
|
|
|
|
// changing media-type is disallowed!
|
|
|
|
if manifest.MediaType != desc.MediaType {
|
|
|
|
err := zerr.ErrBadManifest
|
|
|
|
log.Error().Err(err).
|
|
|
|
Str("old mediaType", manifest.MediaType).
|
|
|
|
Str("new mediaType", desc.MediaType).Msg("cannot change media-type")
|
2024-07-29 12:32:51 -05:00
|
|
|
|
2023-08-23 12:59:52 -05:00
|
|
|
reason := fmt.Sprintf("changing manifest media-type from \"%s\" to \"%s\" is disallowed",
|
|
|
|
manifest.MediaType, desc.MediaType)
|
2022-09-30 12:35:16 -05:00
|
|
|
|
2023-08-23 12:59:52 -05:00
|
|
|
return false, "", zerr.NewError(err).AddDetail("reason", reason)
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
oldDesc := *desc
|
|
|
|
|
|
|
|
desc = &manifest
|
|
|
|
oldDgst = manifest.Digest
|
|
|
|
desc.Size = oldDesc.Size
|
|
|
|
desc.Digest = oldDesc.Digest
|
|
|
|
|
|
|
|
index.Manifests = append(index.Manifests[:midx], index.Manifests[midx+1:]...)
|
|
|
|
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return updateIndex, oldDgst, nil
|
|
|
|
}
|
|
|
|
|
2022-11-24 14:00:22 -05:00
|
|
|
// GetIndex returns the contents of index.json.
|
2023-09-01 12:54:39 -05:00
|
|
|
func GetIndex(imgStore storageTypes.ImageStore, repo string, log zlog.Logger) (ispec.Index, error) {
|
2022-09-30 12:35:16 -05:00
|
|
|
var index ispec.Index
|
|
|
|
|
|
|
|
buf, err := imgStore.GetIndexContent(repo)
|
|
|
|
if err != nil {
|
2023-09-01 12:54:39 -05:00
|
|
|
if errors.As(err, &driver.PathNotFoundError{}) {
|
|
|
|
return index, zerr.ErrRepoNotFound
|
|
|
|
}
|
|
|
|
|
2022-09-30 12:35:16 -05:00
|
|
|
return index, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := json.Unmarshal(buf, &index); err != nil {
|
|
|
|
log.Error().Err(err).Str("dir", path.Join(imgStore.RootDir(), repo)).Msg("invalid JSON")
|
|
|
|
|
|
|
|
return index, zerr.ErrRepoBadVersion
|
|
|
|
}
|
|
|
|
|
|
|
|
return index, nil
|
|
|
|
}
|
|
|
|
|
2022-11-24 14:00:22 -05:00
|
|
|
// GetImageIndex returns a multiarch type image.
|
2023-09-01 12:54:39 -05:00
|
|
|
func GetImageIndex(imgStore storageTypes.ImageStore, repo string, digest godigest.Digest, log zlog.Logger,
|
2023-05-26 13:08:19 -05:00
|
|
|
) (ispec.Index, error) {
|
2022-11-24 14:00:22 -05:00
|
|
|
var imageIndex ispec.Index
|
|
|
|
|
|
|
|
if err := digest.Validate(); err != nil {
|
|
|
|
return imageIndex, err
|
|
|
|
}
|
|
|
|
|
|
|
|
buf, err := imgStore.GetBlobContent(repo, digest)
|
|
|
|
if err != nil {
|
|
|
|
return imageIndex, err
|
|
|
|
}
|
|
|
|
|
|
|
|
indexPath := path.Join(imgStore.RootDir(), repo, "blobs",
|
|
|
|
digest.Algorithm().String(), digest.Encoded())
|
|
|
|
|
|
|
|
if err := json.Unmarshal(buf, &imageIndex); err != nil {
|
|
|
|
log.Error().Err(err).Str("path", indexPath).Msg("invalid JSON")
|
|
|
|
|
|
|
|
return imageIndex, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return imageIndex, nil
|
|
|
|
}
|
|
|
|
|
2023-09-01 12:54:39 -05:00
|
|
|
func GetImageManifest(imgStore storageTypes.ImageStore, repo string, digest godigest.Digest, log zlog.Logger,
|
2023-05-10 12:15:33 -05:00
|
|
|
) (ispec.Manifest, error) {
|
|
|
|
var manifestContent ispec.Manifest
|
|
|
|
|
|
|
|
manifestBlob, err := imgStore.GetBlobContent(repo, digest)
|
|
|
|
if err != nil {
|
|
|
|
return manifestContent, err
|
|
|
|
}
|
|
|
|
|
|
|
|
manifestPath := path.Join(imgStore.RootDir(), repo, "blobs",
|
|
|
|
digest.Algorithm().String(), digest.Encoded())
|
|
|
|
|
|
|
|
if err := json.Unmarshal(manifestBlob, &manifestContent); err != nil {
|
|
|
|
log.Error().Err(err).Str("path", manifestPath).Msg("invalid JSON")
|
|
|
|
|
|
|
|
return manifestContent, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return manifestContent, nil
|
|
|
|
}
|
|
|
|
|
2022-11-18 12:35:28 -05:00
|
|
|
func RemoveManifestDescByReference(index *ispec.Index, reference string, detectCollisions bool,
|
2022-11-24 14:00:22 -05:00
|
|
|
) (ispec.Descriptor, error) {
|
2022-09-30 12:35:16 -05:00
|
|
|
var removedManifest ispec.Descriptor
|
|
|
|
|
|
|
|
var found bool
|
|
|
|
|
2022-11-18 12:35:28 -05:00
|
|
|
foundCount := 0
|
|
|
|
|
2022-09-30 12:35:16 -05:00
|
|
|
var outIndex ispec.Index
|
|
|
|
|
|
|
|
for _, manifest := range index.Manifests {
|
|
|
|
tag, ok := manifest.Annotations[ispec.AnnotationRefName]
|
|
|
|
if ok && tag == reference {
|
|
|
|
removedManifest = manifest
|
|
|
|
found = true
|
2022-11-18 12:35:28 -05:00
|
|
|
foundCount++
|
2022-09-30 12:35:16 -05:00
|
|
|
|
|
|
|
continue
|
|
|
|
} else if reference == manifest.Digest.String() {
|
|
|
|
removedManifest = manifest
|
|
|
|
found = true
|
2022-11-18 12:35:28 -05:00
|
|
|
foundCount++
|
2022-09-30 12:35:16 -05:00
|
|
|
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
outIndex.Manifests = append(outIndex.Manifests, manifest)
|
|
|
|
}
|
|
|
|
|
2022-11-18 12:35:28 -05:00
|
|
|
if foundCount > 1 && detectCollisions {
|
2022-11-24 14:00:22 -05:00
|
|
|
return ispec.Descriptor{}, zerr.ErrManifestConflict
|
|
|
|
} else if !found {
|
|
|
|
return ispec.Descriptor{}, zerr.ErrManifestNotFound
|
2022-11-18 12:35:28 -05:00
|
|
|
}
|
|
|
|
|
2022-09-30 12:35:16 -05:00
|
|
|
index.Manifests = outIndex.Manifests
|
|
|
|
|
2022-11-24 14:00:22 -05:00
|
|
|
return removedManifest, nil
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
|
2022-10-05 05:21:14 -05:00
|
|
|
/*
|
2022-11-18 12:35:28 -05:00
|
|
|
Unmarshal an image index and for all manifests in that
|
2022-09-30 12:35:16 -05:00
|
|
|
index, ensure that they do not have a name or they are not in other
|
2022-10-05 05:21:14 -05:00
|
|
|
manifest indexes else GC can never clean them.
|
|
|
|
*/
|
2023-05-26 13:08:19 -05:00
|
|
|
func UpdateIndexWithPrunedImageManifests(imgStore storageTypes.ImageStore, index *ispec.Index, repo string,
|
2023-09-01 12:54:39 -05:00
|
|
|
desc ispec.Descriptor, oldDgst godigest.Digest, log zlog.Logger,
|
2022-09-30 12:35:16 -05:00
|
|
|
) error {
|
|
|
|
if (desc.MediaType == ispec.MediaTypeImageIndex) && (oldDgst != "") {
|
|
|
|
otherImgIndexes := []ispec.Descriptor{}
|
|
|
|
|
|
|
|
for _, manifest := range index.Manifests {
|
|
|
|
if manifest.MediaType == ispec.MediaTypeImageIndex {
|
|
|
|
otherImgIndexes = append(otherImgIndexes, manifest)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
otherImgIndexes = append(otherImgIndexes, desc)
|
|
|
|
|
|
|
|
prunedManifests, err := PruneImageManifestsFromIndex(imgStore, repo, oldDgst, *index, otherImgIndexes, log)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
index.Manifests = prunedManifests
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2022-11-18 12:35:28 -05:00
|
|
|
Before an image index manifest is pushed to a repo, its constituent manifests
|
2022-09-30 12:35:16 -05:00
|
|
|
are pushed first, so when updating/removing this image index manifest, we also
|
|
|
|
need to determine if there are other image index manifests which refer to the
|
|
|
|
same constitutent manifests so that they can be garbage-collected correctly
|
|
|
|
|
2022-11-18 12:35:28 -05:00
|
|
|
PruneImageManifestsFromIndex is a helper routine to achieve this.
|
2022-09-30 12:35:16 -05:00
|
|
|
*/
|
2023-05-26 13:08:19 -05:00
|
|
|
func PruneImageManifestsFromIndex(imgStore storageTypes.ImageStore, repo string, digest godigest.Digest, //nolint:gocyclo,lll
|
2023-09-01 12:54:39 -05:00
|
|
|
outIndex ispec.Index, otherImgIndexes []ispec.Descriptor, log zlog.Logger,
|
2022-09-30 12:35:16 -05:00
|
|
|
) ([]ispec.Descriptor, error) {
|
|
|
|
dir := path.Join(imgStore.RootDir(), repo)
|
|
|
|
|
|
|
|
indexPath := path.Join(dir, "blobs", digest.Algorithm().String(), digest.Encoded())
|
|
|
|
|
2022-10-22 15:46:13 -05:00
|
|
|
buf, err := imgStore.GetBlobContent(repo, digest)
|
2022-09-30 12:35:16 -05:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
var imgIndex ispec.Index
|
|
|
|
if err := json.Unmarshal(buf, &imgIndex); err != nil {
|
|
|
|
log.Error().Err(err).Str("path", indexPath).Msg("invalid JSON")
|
|
|
|
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
inUse := map[string]uint{}
|
|
|
|
|
|
|
|
for _, manifest := range imgIndex.Manifests {
|
|
|
|
inUse[manifest.Digest.Encoded()]++
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, otherIndex := range otherImgIndexes {
|
2022-11-24 14:00:22 -05:00
|
|
|
oindex, err := GetImageIndex(imgStore, repo, otherIndex.Digest, log)
|
2022-09-30 12:35:16 -05:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, omanifest := range oindex.Manifests {
|
|
|
|
_, ok := inUse[omanifest.Digest.Encoded()]
|
|
|
|
if ok {
|
|
|
|
inUse[omanifest.Digest.Encoded()]++
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
prunedManifests := []ispec.Descriptor{}
|
|
|
|
|
|
|
|
// for all manifests in the index, skip those that either have a tag or
|
|
|
|
// are used in other imgIndexes
|
|
|
|
for _, outManifest := range outIndex.Manifests {
|
|
|
|
if outManifest.MediaType != ispec.MediaTypeImageManifest {
|
|
|
|
prunedManifests = append(prunedManifests, outManifest)
|
|
|
|
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
_, ok := outManifest.Annotations[ispec.AnnotationRefName]
|
|
|
|
if ok {
|
|
|
|
prunedManifests = append(prunedManifests, outManifest)
|
|
|
|
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
count, ok := inUse[outManifest.Digest.Encoded()]
|
|
|
|
if !ok {
|
|
|
|
prunedManifests = append(prunedManifests, outManifest)
|
|
|
|
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
if count != 1 {
|
|
|
|
// this manifest is in use in other image indexes
|
|
|
|
prunedManifests = append(prunedManifests, outManifest)
|
|
|
|
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return prunedManifests, nil
|
|
|
|
}
|
|
|
|
|
2023-09-01 12:54:39 -05:00
|
|
|
func isBlobReferencedInImageManifest(imgStore storageTypes.ImageStore, repo string,
|
|
|
|
bdigest, mdigest godigest.Digest, log zlog.Logger,
|
2023-07-10 04:24:45 -05:00
|
|
|
) (bool, error) {
|
|
|
|
if bdigest == mdigest {
|
|
|
|
return true, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
manifestContent, err := GetImageManifest(imgStore, repo, mdigest, log)
|
|
|
|
if err != nil {
|
2023-12-08 03:05:02 -05:00
|
|
|
log.Error().Err(err).Str("repo", repo).Str("digest", mdigest.String()).Str("component", "gc").
|
|
|
|
Msg("failed to read manifest image")
|
2023-07-10 04:24:45 -05:00
|
|
|
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if bdigest == manifestContent.Config.Digest {
|
|
|
|
return true, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, layer := range manifestContent.Layers {
|
|
|
|
if bdigest == layer.Digest {
|
|
|
|
return true, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return false, nil
|
|
|
|
}
|
|
|
|
|
2023-09-01 12:54:39 -05:00
|
|
|
func IsBlobReferencedInImageIndex(imgStore storageTypes.ImageStore, repo string,
|
|
|
|
digest godigest.Digest, index ispec.Index, log zlog.Logger,
|
2023-07-10 04:24:45 -05:00
|
|
|
) (bool, error) {
|
|
|
|
for _, desc := range index.Manifests {
|
|
|
|
var found bool
|
|
|
|
|
|
|
|
switch desc.MediaType {
|
|
|
|
case ispec.MediaTypeImageIndex:
|
|
|
|
indexImage, err := GetImageIndex(imgStore, repo, desc.Digest, log)
|
|
|
|
if err != nil {
|
|
|
|
log.Error().Err(err).Str("repository", repo).Str("digest", desc.Digest.String()).
|
|
|
|
Msg("failed to read multiarch(index) image")
|
|
|
|
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
2023-09-01 12:54:39 -05:00
|
|
|
found, _ = IsBlobReferencedInImageIndex(imgStore, repo, digest, indexImage, log)
|
2023-07-10 04:24:45 -05:00
|
|
|
case ispec.MediaTypeImageManifest:
|
2023-09-01 12:54:39 -05:00
|
|
|
found, _ = isBlobReferencedInImageManifest(imgStore, repo, digest, desc.Digest, log)
|
2023-09-05 11:42:12 -05:00
|
|
|
default:
|
|
|
|
log.Warn().Str("mediatype", desc.MediaType).Msg("unknown media-type")
|
|
|
|
// should return true for digests found in index.json even if we don't know it's mediatype
|
|
|
|
if digest == desc.Digest {
|
|
|
|
found = true
|
|
|
|
}
|
2023-07-10 04:24:45 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
if found {
|
|
|
|
return true, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return false, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func IsBlobReferenced(imgStore storageTypes.ImageStore, repo string,
|
2023-09-01 12:54:39 -05:00
|
|
|
digest godigest.Digest, log zlog.Logger,
|
2023-07-10 04:24:45 -05:00
|
|
|
) (bool, error) {
|
|
|
|
dir := path.Join(imgStore.RootDir(), repo)
|
|
|
|
if !imgStore.DirExists(dir) {
|
|
|
|
return false, zerr.ErrRepoNotFound
|
|
|
|
}
|
|
|
|
|
|
|
|
index, err := GetIndex(imgStore, repo, log)
|
|
|
|
if err != nil {
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
2023-09-01 12:54:39 -05:00
|
|
|
return IsBlobReferencedInImageIndex(imgStore, repo, digest, index, log)
|
|
|
|
}
|
|
|
|
|
2023-05-26 13:08:19 -05:00
|
|
|
func ApplyLinter(imgStore storageTypes.ImageStore, linter Lint, repo string, descriptor ispec.Descriptor,
|
|
|
|
) (bool, error) {
|
2022-09-30 12:35:16 -05:00
|
|
|
pass := true
|
|
|
|
|
2023-05-10 12:15:33 -05:00
|
|
|
// we'll skip anything that's not a image manifest
|
|
|
|
if descriptor.MediaType != ispec.MediaTypeImageManifest {
|
|
|
|
return pass, nil
|
|
|
|
}
|
2022-09-30 12:35:16 -05:00
|
|
|
|
2023-05-10 12:15:33 -05:00
|
|
|
if linter != nil && !IsSignature(descriptor) {
|
|
|
|
// lint new index with new manifest before writing to disk
|
|
|
|
pass, err := linter.Lint(repo, descriptor.Digest, imgStore)
|
|
|
|
if err != nil {
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if !pass {
|
|
|
|
return false, zerr.ErrImageLintAnnotations
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return pass, nil
|
|
|
|
}
|
|
|
|
|
2023-05-10 12:15:33 -05:00
|
|
|
func IsSignature(descriptor ispec.Descriptor) bool {
|
|
|
|
tag := descriptor.Annotations[ispec.AnnotationRefName]
|
|
|
|
|
|
|
|
switch descriptor.MediaType {
|
|
|
|
case ispec.MediaTypeImageManifest:
|
|
|
|
// is cosgin signature
|
2023-08-19 00:52:03 -05:00
|
|
|
if strings.HasPrefix(tag, "sha256-") && strings.HasSuffix(tag, cosignSignatureTagSuffix) {
|
2023-05-10 12:15:33 -05:00
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
2023-11-06 17:09:39 -05:00
|
|
|
// is cosign signature (OCI 1.1 support)
|
|
|
|
if descriptor.ArtifactType == zcommon.ArtifactTypeCosign {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
2023-05-10 12:15:33 -05:00
|
|
|
// is notation signature
|
2023-09-06 11:58:00 -05:00
|
|
|
if descriptor.ArtifactType == zcommon.ArtifactTypeNotation {
|
2023-05-10 12:15:33 -05:00
|
|
|
return true
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
2023-05-26 13:08:19 -05:00
|
|
|
func GetReferrers(imgStore storageTypes.ImageStore, repo string, gdigest godigest.Digest, artifactTypes []string,
|
2023-09-01 12:54:39 -05:00
|
|
|
log zlog.Logger,
|
2022-11-15 01:21:49 -05:00
|
|
|
) (ispec.Index, error) {
|
|
|
|
nilIndex := ispec.Index{}
|
|
|
|
|
|
|
|
if err := gdigest.Validate(); err != nil {
|
|
|
|
return nilIndex, err
|
|
|
|
}
|
|
|
|
|
|
|
|
dir := path.Join(imgStore.RootDir(), repo)
|
|
|
|
if !imgStore.DirExists(dir) {
|
|
|
|
return nilIndex, zerr.ErrRepoNotFound
|
|
|
|
}
|
|
|
|
|
|
|
|
index, err := GetIndex(imgStore, repo, log)
|
|
|
|
if err != nil {
|
|
|
|
return nilIndex, err
|
|
|
|
}
|
|
|
|
|
|
|
|
result := []ispec.Descriptor{}
|
|
|
|
|
2023-07-05 11:42:16 -05:00
|
|
|
for _, descriptor := range index.Manifests {
|
|
|
|
if descriptor.Digest == gdigest {
|
2022-11-15 01:21:49 -05:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2023-07-05 11:42:16 -05:00
|
|
|
buf, err := imgStore.GetBlobContent(repo, descriptor.Digest)
|
2022-11-15 01:21:49 -05:00
|
|
|
if err != nil {
|
2023-07-05 11:42:16 -05:00
|
|
|
log.Error().Err(err).Str("blob", imgStore.BlobPath(repo, descriptor.Digest)).Msg("failed to read manifest")
|
2022-11-15 01:21:49 -05:00
|
|
|
|
2023-02-13 13:43:52 -05:00
|
|
|
if errors.Is(err, zerr.ErrBlobNotFound) {
|
2022-11-15 01:21:49 -05:00
|
|
|
return nilIndex, zerr.ErrManifestNotFound
|
|
|
|
}
|
|
|
|
|
|
|
|
return nilIndex, err
|
|
|
|
}
|
|
|
|
|
2023-07-05 11:42:16 -05:00
|
|
|
switch descriptor.MediaType {
|
|
|
|
case ispec.MediaTypeImageManifest:
|
|
|
|
var manifestContent ispec.Manifest
|
|
|
|
|
|
|
|
if err := json.Unmarshal(buf, &manifestContent); err != nil {
|
|
|
|
log.Error().Err(err).Str("manifest digest", descriptor.Digest.String()).Msg("invalid JSON")
|
2022-11-15 01:21:49 -05:00
|
|
|
|
|
|
|
return nilIndex, err
|
|
|
|
}
|
|
|
|
|
2023-07-05 11:42:16 -05:00
|
|
|
if manifestContent.Subject == nil || manifestContent.Subject.Digest != gdigest {
|
2022-11-15 01:21:49 -05:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
// filter by artifact type
|
2023-07-05 11:42:16 -05:00
|
|
|
manifestArtifactType := zcommon.GetManifestArtifactType(manifestContent)
|
2023-01-26 13:13:12 -05:00
|
|
|
|
2023-05-10 12:15:33 -05:00
|
|
|
if len(artifactTypes) > 0 && !zcommon.Contains(artifactTypes, manifestArtifactType) {
|
2022-11-15 01:21:49 -05:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
result = append(result, ispec.Descriptor{
|
2023-07-05 11:42:16 -05:00
|
|
|
MediaType: descriptor.MediaType,
|
2023-05-10 12:15:33 -05:00
|
|
|
ArtifactType: manifestArtifactType,
|
2023-07-05 11:42:16 -05:00
|
|
|
Size: descriptor.Size,
|
|
|
|
Digest: descriptor.Digest,
|
|
|
|
Annotations: manifestContent.Annotations,
|
|
|
|
})
|
|
|
|
case ispec.MediaTypeImageIndex:
|
|
|
|
var indexContent ispec.Index
|
|
|
|
|
|
|
|
if err := json.Unmarshal(buf, &indexContent); err != nil {
|
|
|
|
log.Error().Err(err).Str("manifest digest", descriptor.Digest.String()).Msg("invalid JSON")
|
|
|
|
|
|
|
|
return nilIndex, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if indexContent.Subject == nil || indexContent.Subject.Digest != gdigest {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
indexArtifactType := zcommon.GetIndexArtifactType(indexContent)
|
|
|
|
|
|
|
|
if len(artifactTypes) > 0 && !zcommon.Contains(artifactTypes, indexArtifactType) {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
result = append(result, ispec.Descriptor{
|
|
|
|
MediaType: descriptor.MediaType,
|
|
|
|
ArtifactType: indexArtifactType,
|
|
|
|
Size: descriptor.Size,
|
|
|
|
Digest: descriptor.Digest,
|
|
|
|
Annotations: indexContent.Annotations,
|
2022-11-15 01:21:49 -05:00
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
index = ispec.Index{
|
|
|
|
Versioned: imeta.Versioned{SchemaVersion: storageConstants.SchemaVersion},
|
|
|
|
MediaType: ispec.MediaTypeImageIndex,
|
|
|
|
Manifests: result,
|
|
|
|
Annotations: map[string]string{},
|
|
|
|
}
|
|
|
|
|
|
|
|
return index, nil
|
|
|
|
}
|
|
|
|
|
2023-10-20 15:02:31 -05:00
|
|
|
// Get blob descriptor from it's manifest contents, if blob can not be found it will return error.
|
|
|
|
func GetBlobDescriptorFromRepo(imgStore storageTypes.ImageStore, repo string, blobDigest godigest.Digest,
|
|
|
|
log zlog.Logger,
|
|
|
|
) (ispec.Descriptor, error) {
|
|
|
|
index, err := GetIndex(imgStore, repo, log)
|
|
|
|
if err != nil {
|
|
|
|
return ispec.Descriptor{}, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return GetBlobDescriptorFromIndex(imgStore, index, repo, blobDigest, log)
|
|
|
|
}
|
|
|
|
|
|
|
|
func GetBlobDescriptorFromIndex(imgStore storageTypes.ImageStore, index ispec.Index, repo string,
|
|
|
|
blobDigest godigest.Digest, log zlog.Logger,
|
|
|
|
) (ispec.Descriptor, error) {
|
|
|
|
for _, desc := range index.Manifests {
|
|
|
|
if desc.Digest == blobDigest {
|
|
|
|
return desc, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
switch desc.MediaType {
|
|
|
|
case ispec.MediaTypeImageManifest:
|
|
|
|
if foundDescriptor, err := getBlobDescriptorFromManifest(imgStore, repo, blobDigest, desc, log); err == nil {
|
|
|
|
return foundDescriptor, nil
|
|
|
|
}
|
|
|
|
case ispec.MediaTypeImageIndex:
|
|
|
|
indexImage, err := GetImageIndex(imgStore, repo, desc.Digest, log)
|
|
|
|
if err != nil {
|
|
|
|
return ispec.Descriptor{}, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if foundDescriptor, err := GetBlobDescriptorFromIndex(imgStore, indexImage, repo, blobDigest, log); err == nil {
|
|
|
|
return foundDescriptor, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return ispec.Descriptor{}, zerr.ErrBlobNotFound
|
|
|
|
}
|
|
|
|
|
|
|
|
func getBlobDescriptorFromManifest(imgStore storageTypes.ImageStore, repo string, blobDigest godigest.Digest,
|
|
|
|
desc ispec.Descriptor, log zlog.Logger,
|
|
|
|
) (ispec.Descriptor, error) {
|
|
|
|
manifest, err := GetImageManifest(imgStore, repo, desc.Digest, log)
|
|
|
|
if err != nil {
|
|
|
|
return ispec.Descriptor{}, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if manifest.Config.Digest == blobDigest {
|
|
|
|
return manifest.Config, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, layer := range manifest.Layers {
|
|
|
|
if layer.Digest == blobDigest {
|
|
|
|
return layer, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return ispec.Descriptor{}, zerr.ErrBlobNotFound
|
|
|
|
}
|
|
|
|
|
2022-09-30 12:35:16 -05:00
|
|
|
func IsSupportedMediaType(mediaType string) bool {
|
|
|
|
return mediaType == ispec.MediaTypeImageIndex ||
|
2024-03-06 15:16:42 -05:00
|
|
|
mediaType == ispec.MediaTypeImageManifest
|
2022-09-30 12:35:16 -05:00
|
|
|
}
|
2023-01-09 15:37:44 -05:00
|
|
|
|
2023-05-01 14:49:41 -05:00
|
|
|
func IsNonDistributable(mediaType string) bool {
|
2023-05-10 12:15:33 -05:00
|
|
|
return mediaType == ispec.MediaTypeImageLayerNonDistributable || //nolint:staticcheck
|
|
|
|
mediaType == ispec.MediaTypeImageLayerNonDistributableGzip || //nolint:staticcheck
|
|
|
|
mediaType == ispec.MediaTypeImageLayerNonDistributableZstd //nolint:staticcheck
|
2023-05-01 14:49:41 -05:00
|
|
|
}
|
|
|
|
|
2023-07-13 11:31:39 -05:00
|
|
|
func ValidateManifestSchema(buf []byte) error {
|
|
|
|
if err := schema.ValidatorMediaTypeManifest.Validate(bytes.NewBuffer(buf)); err != nil {
|
|
|
|
if !IsEmptyLayersError(err) {
|
2023-08-23 12:59:52 -05:00
|
|
|
return err
|
2023-07-13 11:31:39 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func ValidateImageIndexSchema(buf []byte) error {
|
|
|
|
if err := schema.ValidatorMediaTypeImageIndex.Validate(bytes.NewBuffer(buf)); err != nil {
|
2023-08-23 12:59:52 -05:00
|
|
|
return err
|
2023-07-13 11:31:39 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func IsEmptyLayersError(err error) bool {
|
|
|
|
var validationErr schema.ValidationError
|
|
|
|
if errors.As(err, &validationErr) {
|
|
|
|
if len(validationErr.Errs) == 1 && strings.Contains(err.Error(), manifestWithEmptyLayersErrMsg) {
|
|
|
|
return true
|
|
|
|
} else {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
2023-04-07 11:49:24 -05:00
|
|
|
/*
|
2023-05-26 13:08:19 -05:00
|
|
|
DedupeTaskGenerator takes all blobs paths found in the storage.imagestore and groups them by digest
|
2023-04-07 11:49:24 -05:00
|
|
|
|
|
|
|
for each digest and based on the dedupe value it will dedupe or restore deduped blobs to the original state(undeduped)\
|
|
|
|
by creating a task for each digest and pushing it to the task scheduler.
|
|
|
|
*/
|
|
|
|
type DedupeTaskGenerator struct {
|
2023-05-26 13:08:19 -05:00
|
|
|
ImgStore storageTypes.ImageStore
|
2023-04-07 11:49:24 -05:00
|
|
|
// storage dedupe value
|
|
|
|
Dedupe bool
|
|
|
|
// store blobs paths grouped by digest
|
|
|
|
digest godigest.Digest
|
|
|
|
duplicateBlobs []string
|
|
|
|
/* store processed digest, used for iterating duplicateBlobs one by one
|
|
|
|
and generating a task for each unprocessed one*/
|
|
|
|
lastDigests []godigest.Digest
|
|
|
|
done bool
|
2023-09-27 13:15:08 -05:00
|
|
|
repos []string // list of repos on which we run dedupe
|
2023-09-01 12:54:39 -05:00
|
|
|
Log zlog.Logger
|
2023-04-07 11:49:24 -05:00
|
|
|
}
|
|
|
|
|
2024-02-01 12:15:53 -05:00
|
|
|
func (gen *DedupeTaskGenerator) Name() string {
|
|
|
|
return "DedupeTaskGenerator"
|
|
|
|
}
|
|
|
|
|
2023-07-04 03:03:29 -05:00
|
|
|
func (gen *DedupeTaskGenerator) Next() (scheduler.Task, error) {
|
2023-04-07 11:49:24 -05:00
|
|
|
var err error
|
|
|
|
|
2023-09-27 13:15:08 -05:00
|
|
|
/* at first run get from storage currently found repositories so that we skip the ones that gets synced/uploaded
|
|
|
|
while this generator runs, there are deduped/restored inline, no need to run dedupe/restore again */
|
|
|
|
if len(gen.repos) == 0 {
|
|
|
|
gen.repos, err = gen.ImgStore.GetRepositories()
|
|
|
|
if err != nil {
|
|
|
|
//nolint: dupword
|
2023-12-08 03:05:02 -05:00
|
|
|
gen.Log.Error().Err(err).Str("component", "dedupe").Msg("failed to get list of repositories")
|
2023-09-27 13:15:08 -05:00
|
|
|
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// if still no repos
|
|
|
|
if len(gen.repos) == 0 {
|
2023-12-08 03:05:02 -05:00
|
|
|
gen.Log.Info().Str("component", "dedupe").Msg("no repositories found in storage, finished.")
|
2023-09-27 13:15:08 -05:00
|
|
|
|
|
|
|
// no repositories in storage, no need to continue
|
|
|
|
gen.done = true
|
|
|
|
|
2024-07-29 12:32:51 -05:00
|
|
|
return nil, nil //nolint:nilnil
|
2023-09-27 13:15:08 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-05-26 13:08:19 -05:00
|
|
|
// get all blobs from storage.imageStore and group them by digest
|
2023-09-27 13:15:08 -05:00
|
|
|
gen.digest, gen.duplicateBlobs, err = gen.ImgStore.GetNextDigestWithBlobPaths(gen.repos, gen.lastDigests)
|
2023-04-07 11:49:24 -05:00
|
|
|
if err != nil {
|
2023-12-08 03:05:02 -05:00
|
|
|
gen.Log.Error().Err(err).Str("component", "dedupe").Msg("failed to get next digest")
|
2023-04-07 11:49:24 -05:00
|
|
|
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// if no digests left, then mark the task generator as done
|
|
|
|
if gen.digest == "" {
|
2023-12-11 08:39:32 -05:00
|
|
|
gen.Log.Info().Str("component", "dedupe").Msg("no digests left, finished")
|
2023-04-07 11:49:24 -05:00
|
|
|
|
|
|
|
gen.done = true
|
|
|
|
|
2024-07-29 12:32:51 -05:00
|
|
|
return nil, nil //nolint:nilnil
|
2023-04-07 11:49:24 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
// mark digest as processed before running its task
|
|
|
|
gen.lastDigests = append(gen.lastDigests, gen.digest)
|
|
|
|
|
|
|
|
// generate rebuild dedupe task for this digest
|
|
|
|
return newDedupeTask(gen.ImgStore, gen.digest, gen.Dedupe, gen.duplicateBlobs, gen.Log), nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (gen *DedupeTaskGenerator) IsDone() bool {
|
|
|
|
return gen.done
|
|
|
|
}
|
|
|
|
|
2023-08-07 14:55:19 -05:00
|
|
|
func (gen *DedupeTaskGenerator) IsReady() bool {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
2023-04-07 11:49:24 -05:00
|
|
|
func (gen *DedupeTaskGenerator) Reset() {
|
|
|
|
gen.lastDigests = []godigest.Digest{}
|
|
|
|
gen.duplicateBlobs = []string{}
|
2023-09-27 13:15:08 -05:00
|
|
|
gen.repos = []string{}
|
2023-04-07 11:49:24 -05:00
|
|
|
gen.digest = ""
|
|
|
|
gen.done = false
|
|
|
|
}
|
|
|
|
|
|
|
|
type dedupeTask struct {
|
2023-05-26 13:08:19 -05:00
|
|
|
imgStore storageTypes.ImageStore
|
2023-04-07 11:49:24 -05:00
|
|
|
// digest of duplicateBLobs
|
|
|
|
digest godigest.Digest
|
|
|
|
// blobs paths with the same digest ^
|
|
|
|
duplicateBlobs []string
|
|
|
|
dedupe bool
|
2023-09-01 12:54:39 -05:00
|
|
|
log zlog.Logger
|
2023-04-07 11:49:24 -05:00
|
|
|
}
|
|
|
|
|
2023-05-26 13:08:19 -05:00
|
|
|
func newDedupeTask(imgStore storageTypes.ImageStore, digest godigest.Digest, dedupe bool,
|
2023-09-01 12:54:39 -05:00
|
|
|
duplicateBlobs []string, log zlog.Logger,
|
2023-04-07 11:49:24 -05:00
|
|
|
) *dedupeTask {
|
|
|
|
return &dedupeTask{imgStore, digest, duplicateBlobs, dedupe, log}
|
|
|
|
}
|
|
|
|
|
2023-09-05 11:48:56 -05:00
|
|
|
func (dt *dedupeTask) DoWork(ctx context.Context) error {
|
2023-04-07 11:49:24 -05:00
|
|
|
// run task
|
2023-11-24 03:40:10 -05:00
|
|
|
err := dt.imgStore.RunDedupeForDigest(ctx, dt.digest, dt.dedupe, dt.duplicateBlobs) //nolint: contextcheck
|
2023-04-07 11:49:24 -05:00
|
|
|
if err != nil {
|
|
|
|
// log it
|
2023-12-08 03:05:02 -05:00
|
|
|
dt.log.Error().Err(err).Str("digest", dt.digest.String()).Str("component", "dedupe").
|
|
|
|
Msg("failed to rebuild digest")
|
2023-04-07 11:49:24 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
2023-11-01 11:09:21 -05:00
|
|
|
|
2023-12-04 17:13:50 -05:00
|
|
|
func (dt *dedupeTask) String() string {
|
|
|
|
return fmt.Sprintf("{Name: %s, digest: %s, dedupe: %t}",
|
|
|
|
dt.Name(), dt.digest, dt.dedupe)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (dt *dedupeTask) Name() string {
|
|
|
|
return "DedupeTask"
|
|
|
|
}
|
|
|
|
|
2023-11-01 11:09:21 -05:00
|
|
|
type StorageMetricsInitGenerator struct {
|
|
|
|
ImgStore storageTypes.ImageStore
|
|
|
|
done bool
|
|
|
|
Metrics monitoring.MetricServer
|
|
|
|
lastRepo string
|
|
|
|
nextRun time.Time
|
|
|
|
rand *rand.Rand
|
|
|
|
Log zlog.Logger
|
|
|
|
MaxDelay int
|
|
|
|
}
|
|
|
|
|
2024-02-01 12:15:53 -05:00
|
|
|
func (gen *StorageMetricsInitGenerator) Name() string {
|
|
|
|
return "StorageMetricsInitGenerator"
|
|
|
|
}
|
|
|
|
|
2023-11-01 11:09:21 -05:00
|
|
|
func (gen *StorageMetricsInitGenerator) Next() (scheduler.Task, error) {
|
|
|
|
if gen.lastRepo == "" && gen.nextRun.IsZero() {
|
|
|
|
gen.rand = rand.New(rand.NewSource(time.Now().UTC().UnixNano())) //nolint: gosec
|
|
|
|
}
|
|
|
|
|
|
|
|
delay := gen.rand.Intn(gen.MaxDelay)
|
|
|
|
|
|
|
|
gen.nextRun = time.Now().Add(time.Duration(delay) * time.Second)
|
|
|
|
|
|
|
|
repo, err := gen.ImgStore.GetNextRepository(gen.lastRepo)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2023-12-08 03:05:02 -05:00
|
|
|
gen.Log.Debug().Str("repo", repo).Int("randomDelay", delay).Msg("generate task for storage metrics")
|
2023-11-01 11:09:21 -05:00
|
|
|
|
|
|
|
if repo == "" {
|
|
|
|
gen.done = true
|
|
|
|
|
2024-07-29 12:32:51 -05:00
|
|
|
return nil, nil //nolint:nilnil
|
2023-11-01 11:09:21 -05:00
|
|
|
}
|
2024-07-29 12:32:51 -05:00
|
|
|
|
2023-11-01 11:09:21 -05:00
|
|
|
gen.lastRepo = repo
|
|
|
|
|
2023-11-14 19:22:24 -05:00
|
|
|
return NewStorageMetricsTask(gen.ImgStore, gen.Metrics, repo, gen.Log), nil
|
2023-11-01 11:09:21 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
func (gen *StorageMetricsInitGenerator) IsDone() bool {
|
|
|
|
return gen.done
|
|
|
|
}
|
|
|
|
|
|
|
|
func (gen *StorageMetricsInitGenerator) IsReady() bool {
|
|
|
|
return time.Now().After(gen.nextRun)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (gen *StorageMetricsInitGenerator) Reset() {
|
|
|
|
gen.lastRepo = ""
|
|
|
|
gen.done = false
|
|
|
|
gen.nextRun = time.Time{}
|
|
|
|
}
|
|
|
|
|
|
|
|
type smTask struct {
|
|
|
|
imgStore storageTypes.ImageStore
|
|
|
|
metrics monitoring.MetricServer
|
|
|
|
repo string
|
2023-11-14 19:22:24 -05:00
|
|
|
log zlog.Logger
|
2023-11-01 11:09:21 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
func NewStorageMetricsTask(imgStore storageTypes.ImageStore, metrics monitoring.MetricServer, repo string,
|
2023-11-14 19:22:24 -05:00
|
|
|
log zlog.Logger,
|
2023-11-01 11:09:21 -05:00
|
|
|
) *smTask {
|
2023-11-14 19:22:24 -05:00
|
|
|
return &smTask{imgStore, metrics, repo, log}
|
2023-11-01 11:09:21 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
func (smt *smTask) DoWork(ctx context.Context) error {
|
|
|
|
// run task
|
|
|
|
monitoring.SetStorageUsage(smt.metrics, smt.imgStore.RootDir(), smt.repo)
|
2023-12-08 03:05:02 -05:00
|
|
|
smt.log.Debug().Str("component", "monitoring").Msg("computed storage usage for repo " + smt.repo)
|
2023-11-01 11:09:21 -05:00
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
2023-12-04 17:13:50 -05:00
|
|
|
|
|
|
|
func (smt *smTask) String() string {
|
|
|
|
return fmt.Sprintf("{Name: \"%s\", repo: \"%s\"}",
|
|
|
|
smt.Name(), smt.repo)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (smt *smTask) Name() string {
|
|
|
|
return "StorageMetricsTask"
|
|
|
|
}
|