2023-05-31 20:26:23 +03:00
|
|
|
//go:build sync
|
|
|
|
// +build sync
|
|
|
|
|
2021-06-08 23:11:18 +03:00
|
|
|
package sync
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
2023-12-05 00:13:50 +02:00
|
|
|
"fmt"
|
2024-03-04 19:44:11 +02:00
|
|
|
"sync"
|
|
|
|
"time"
|
2021-06-08 23:11:18 +03:00
|
|
|
|
|
|
|
"github.com/containers/common/pkg/retry"
|
|
|
|
"github.com/containers/image/v5/types"
|
2023-05-31 20:26:23 +03:00
|
|
|
"github.com/opencontainers/go-digest"
|
2022-10-20 19:39:20 +03:00
|
|
|
|
2024-02-01 06:34:07 +02:00
|
|
|
"zotregistry.dev/zot/pkg/log"
|
|
|
|
"zotregistry.dev/zot/pkg/scheduler"
|
2021-06-08 23:11:18 +03:00
|
|
|
)
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
// below types are used by containers/image to copy images
|
|
|
|
// types.ImageReference - describes a registry/repo:tag
|
|
|
|
// types.SystemContext - describes a registry/oci layout config
|
|
|
|
|
|
|
|
// Sync general functionalities, one service per registry config.
|
|
|
|
type Service interface {
|
|
|
|
// Get next repo from remote /v2/_catalog, will return empty string when there is no repo left.
|
|
|
|
GetNextRepo(lastRepo string) (string, error) // used by task scheduler
|
|
|
|
// Sync a repo with all of its tags and references (signatures, artifacts, sboms) into ImageStore.
|
2023-09-05 19:48:56 +03:00
|
|
|
SyncRepo(ctx context.Context, repo string) error // used by periodically sync
|
2023-05-31 20:26:23 +03:00
|
|
|
// Sync an image (repo:tag || repo:digest) into ImageStore.
|
2023-09-05 19:48:56 +03:00
|
|
|
SyncImage(ctx context.Context, repo, reference string) error // used by sync on demand
|
2023-05-31 20:26:23 +03:00
|
|
|
// Sync a single reference for an image.
|
2023-09-05 19:48:56 +03:00
|
|
|
SyncReference(ctx context.Context, repo string, subjectDigestStr string,
|
|
|
|
referenceType string) error // used by sync on demand
|
2023-05-31 20:26:23 +03:00
|
|
|
// Remove all internal catalog entries.
|
|
|
|
ResetCatalog() // used by scheduler to empty out the catalog after a sync periodically roundtrip finishes
|
|
|
|
// Sync supports multiple urls per registry, before a sync repo/image/ref 'ping' each url.
|
|
|
|
SetNextAvailableURL() error // used by all sync methods
|
|
|
|
// Returns retry options from registry config.
|
|
|
|
GetRetryOptions() *retry.Options // used by sync on demand to retry in background
|
2021-06-08 23:11:18 +03:00
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
// Local and remote registries must implement this interface.
|
|
|
|
type Registry interface {
|
|
|
|
// Get temporary ImageReference, is used by functions in containers/image package
|
|
|
|
GetImageReference(repo string, tag string) (types.ImageReference, error)
|
|
|
|
// Get local oci layout context, is used by functions in containers/image package
|
|
|
|
GetContext() *types.SystemContext
|
2022-10-22 10:26:14 +03:00
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
/*
|
|
|
|
Temporary oci layout, sync first pulls an image to this oci layout (using oci:// transport)
|
|
|
|
then moves them into ImageStore.
|
|
|
|
*/
|
|
|
|
type OciLayoutStorage interface {
|
|
|
|
Registry
|
2021-06-08 23:11:18 +03:00
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
// Remote registry.
|
|
|
|
type Remote interface {
|
|
|
|
Registry
|
|
|
|
// Get a list of repos (catalog)
|
|
|
|
GetRepositories(ctx context.Context) ([]string, error)
|
|
|
|
// Get a list of tags given a repo
|
|
|
|
GetRepoTags(repo string) ([]string, error)
|
|
|
|
// Get manifest content, mediaType, digest given an ImageReference
|
|
|
|
GetManifestContent(imageReference types.ImageReference) ([]byte, string, digest.Digest, error)
|
2024-02-14 19:18:10 +02:00
|
|
|
// In the case of public dockerhub images 'library' namespace is added to the repo names of images
|
|
|
|
// eg: alpine -> library/alpine
|
|
|
|
GetDockerRemoteRepo(repo string) string
|
2021-06-08 23:11:18 +03:00
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
// Local registry.
|
2023-11-28 22:08:15 +02:00
|
|
|
type Destination interface {
|
2023-05-31 20:26:23 +03:00
|
|
|
Registry
|
|
|
|
// Check if an image is already synced
|
|
|
|
CanSkipImage(repo, tag string, imageDigest digest.Digest) (bool, error)
|
|
|
|
// CommitImage moves a synced repo/ref from temporary oci layout to ImageStore
|
|
|
|
CommitImage(imageReference types.ImageReference, repo, tag string) error
|
2024-02-29 19:09:21 +02:00
|
|
|
// Removes image reference, used when copy.Image() errors out
|
|
|
|
CleanupImage(imageReference types.ImageReference, repo, reference string) error
|
2021-06-08 23:11:18 +03:00
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
type TaskGenerator struct {
|
2024-03-04 19:44:11 +02:00
|
|
|
Service Service
|
|
|
|
lastRepo string
|
|
|
|
done bool
|
|
|
|
waitTime time.Duration
|
|
|
|
lastTaskTime time.Time
|
|
|
|
maxWaitTime time.Duration
|
|
|
|
lock *sync.Mutex
|
|
|
|
log log.Logger
|
2021-06-08 23:11:18 +03:00
|
|
|
}
|
|
|
|
|
2024-03-04 19:44:11 +02:00
|
|
|
func NewTaskGenerator(service Service, maxWaitTime time.Duration, log log.Logger) *TaskGenerator {
|
2023-05-31 20:26:23 +03:00
|
|
|
return &TaskGenerator{
|
2024-03-04 19:44:11 +02:00
|
|
|
Service: service,
|
|
|
|
done: false,
|
|
|
|
waitTime: 0,
|
|
|
|
lastTaskTime: time.Now(),
|
|
|
|
lock: &sync.Mutex{},
|
|
|
|
lastRepo: "",
|
|
|
|
maxWaitTime: maxWaitTime,
|
|
|
|
log: log,
|
2022-12-22 20:19:42 +02:00
|
|
|
}
|
2023-05-31 20:26:23 +03:00
|
|
|
}
|
2022-12-22 20:19:42 +02:00
|
|
|
|
2024-02-01 19:15:53 +02:00
|
|
|
func (gen *TaskGenerator) Name() string {
|
|
|
|
return "SyncGenerator"
|
|
|
|
}
|
|
|
|
|
2023-07-04 11:03:29 +03:00
|
|
|
func (gen *TaskGenerator) Next() (scheduler.Task, error) {
|
2024-03-04 19:44:11 +02:00
|
|
|
gen.lock.Lock()
|
|
|
|
defer gen.lock.Unlock()
|
|
|
|
|
|
|
|
if time.Since(gen.lastTaskTime) <= gen.waitTime {
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
if err := gen.Service.SetNextAvailableURL(); err != nil {
|
2024-03-04 19:44:11 +02:00
|
|
|
gen.increaseWaitTime()
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
return nil, err
|
2022-12-22 20:19:42 +02:00
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
repo, err := gen.Service.GetNextRepo(gen.lastRepo)
|
2021-12-07 20:26:26 +02:00
|
|
|
if err != nil {
|
2024-03-04 19:44:11 +02:00
|
|
|
gen.increaseWaitTime()
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
return nil, err
|
2021-12-07 20:26:26 +02:00
|
|
|
}
|
|
|
|
|
2024-03-04 19:44:11 +02:00
|
|
|
gen.resetWaitTime()
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
if repo == "" {
|
2024-03-04 19:44:11 +02:00
|
|
|
gen.log.Info().Str("component", "sync").Msg("finished syncing all repositories")
|
2023-05-31 20:26:23 +03:00
|
|
|
gen.done = true
|
2021-12-13 19:23:31 +00:00
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
return nil, nil
|
2021-06-08 23:11:18 +03:00
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
gen.lastRepo = repo
|
2022-04-05 18:18:31 +03:00
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
return newSyncRepoTask(gen.lastRepo, gen.Service), nil
|
2021-06-08 23:11:18 +03:00
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
func (gen *TaskGenerator) IsDone() bool {
|
|
|
|
return gen.done
|
2021-06-08 23:11:18 +03:00
|
|
|
}
|
|
|
|
|
2023-08-07 22:55:19 +03:00
|
|
|
func (gen *TaskGenerator) IsReady() bool {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
func (gen *TaskGenerator) Reset() {
|
2024-03-04 19:44:11 +02:00
|
|
|
gen.lock.Lock()
|
|
|
|
defer gen.lock.Unlock()
|
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
gen.lastRepo = ""
|
|
|
|
gen.Service.ResetCatalog()
|
|
|
|
gen.done = false
|
2024-03-04 19:44:11 +02:00
|
|
|
gen.waitTime = 0
|
|
|
|
}
|
|
|
|
|
|
|
|
func (gen *TaskGenerator) increaseWaitTime() {
|
|
|
|
if gen.waitTime == 0 {
|
|
|
|
gen.waitTime = time.Second
|
|
|
|
}
|
|
|
|
|
|
|
|
gen.waitTime *= 2
|
|
|
|
|
|
|
|
// max wait time should not exceed generator interval.
|
|
|
|
if gen.waitTime > gen.maxWaitTime {
|
|
|
|
gen.waitTime = gen.maxWaitTime
|
|
|
|
}
|
|
|
|
|
|
|
|
gen.lastTaskTime = time.Now()
|
|
|
|
}
|
|
|
|
|
|
|
|
// resets wait time.
|
|
|
|
func (gen *TaskGenerator) resetWaitTime() {
|
|
|
|
gen.lastTaskTime = time.Now()
|
|
|
|
gen.waitTime = 0
|
2023-05-31 20:26:23 +03:00
|
|
|
}
|
2022-02-10 16:17:49 +02:00
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
type syncRepoTask struct {
|
|
|
|
repo string
|
|
|
|
service Service
|
|
|
|
}
|
2021-06-08 23:11:18 +03:00
|
|
|
|
2023-05-31 20:26:23 +03:00
|
|
|
func newSyncRepoTask(repo string, service Service) *syncRepoTask {
|
|
|
|
return &syncRepoTask{repo, service}
|
|
|
|
}
|
2021-06-08 23:11:18 +03:00
|
|
|
|
2023-09-05 19:48:56 +03:00
|
|
|
func (srt *syncRepoTask) DoWork(ctx context.Context) error {
|
|
|
|
return srt.service.SyncRepo(ctx, srt.repo)
|
2021-06-08 23:11:18 +03:00
|
|
|
}
|
2023-12-05 00:13:50 +02:00
|
|
|
|
|
|
|
func (srt *syncRepoTask) String() string {
|
2024-03-04 19:44:11 +02:00
|
|
|
return fmt.Sprintf("{Name: \"%s\", repository: \"%s\"}",
|
2023-12-05 00:13:50 +02:00
|
|
|
srt.Name(), srt.repo)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (srt *syncRepoTask) Name() string {
|
|
|
|
return "SyncTask"
|
|
|
|
}
|