2020-02-17 16:57:15 -05:00
|
|
|
package storage
|
|
|
|
|
|
|
|
import (
|
|
|
|
"path"
|
2020-05-27 16:27:35 -05:00
|
|
|
"path/filepath"
|
2020-02-17 16:57:15 -05:00
|
|
|
"strings"
|
2021-10-21 08:05:50 -05:00
|
|
|
"time"
|
2020-02-17 16:57:15 -05:00
|
|
|
|
|
|
|
"go.etcd.io/bbolt"
|
2021-12-03 22:50:58 -05:00
|
|
|
"zotregistry.io/zot/errors"
|
|
|
|
zlog "zotregistry.io/zot/pkg/log"
|
2020-02-17 16:57:15 -05:00
|
|
|
)
|
|
|
|
|
|
|
|
const (
	// BlobsCache is the name of the global (root) bucket.
	BlobsCache = "blobs"

	// DuplicatesBucket is the bucket where we store all blobs from storage
	// (deduped blobs + original blob).
	DuplicatesBucket = "duplicates"

	// OriginalBucket is the bucket where we store only the original/source
	// blob (used by s3 to know which is the blob with content).
	// It should contain only one blob; this is the only place from which
	// we'll get blobs.
	OriginalBucket = "original"

	// DBExtensionName is the suffix NewCache appends to the cache name to
	// build the database file name.
	DBExtensionName = ".db"

	// dbCacheLockCheckTimeout is the value NewCache passes to bbolt as
	// Options.Timeout when opening the database.
	dbCacheLockCheckTimeout = 10 * time.Second
)
|
|
|
|
|
|
|
|
type Cache struct {
|
2022-04-12 05:01:04 -05:00
|
|
|
rootDir string
|
|
|
|
db *bbolt.DB
|
|
|
|
log zlog.Logger
|
|
|
|
useRelPaths bool // weather or not to use relative paths, should be true for filesystem and false for s3
|
2020-02-17 16:57:15 -05:00
|
|
|
}
|
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
// Blob is a single blob record.
type Blob struct {
	// Path is the path recorded for the blob.
	Path string
}
|
|
|
|
|
2022-04-12 05:01:04 -05:00
|
|
|
func NewCache(rootDir string, name string, useRelPaths bool, log zlog.Logger) *Cache {
|
|
|
|
dbPath := path.Join(rootDir, name+DBExtensionName)
|
2021-10-21 08:05:50 -05:00
|
|
|
dbOpts := &bbolt.Options{
|
|
|
|
Timeout: dbCacheLockCheckTimeout,
|
|
|
|
FreelistType: bbolt.FreelistArrayType,
|
|
|
|
}
|
2020-02-17 16:57:15 -05:00
|
|
|
|
2021-12-13 14:23:31 -05:00
|
|
|
cacheDB, err := bbolt.Open(dbPath, 0o600, dbOpts) //nolint:gomnd
|
2020-02-17 16:57:15 -05:00
|
|
|
if err != nil {
|
|
|
|
log.Error().Err(err).Str("dbPath", dbPath).Msg("unable to create cache db")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-12-13 14:23:31 -05:00
|
|
|
if err := cacheDB.Update(func(tx *bbolt.Tx) error {
|
2020-02-17 16:57:15 -05:00
|
|
|
if _, err := tx.CreateBucketIfNotExists([]byte(BlobsCache)); err != nil {
|
|
|
|
// this is a serious failure
|
|
|
|
log.Error().Err(err).Str("dbPath", dbPath).Msg("unable to create a root bucket")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return err
|
|
|
|
}
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return nil
|
|
|
|
}); err != nil {
|
|
|
|
// something went wrong
|
|
|
|
log.Error().Err(err).Msg("unable to create a cache")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2022-04-12 05:01:04 -05:00
|
|
|
return &Cache{rootDir: rootDir, db: cacheDB, useRelPaths: useRelPaths, log: log}
|
2020-02-17 16:57:15 -05:00
|
|
|
}
|
|
|
|
|
2022-03-21 12:37:23 -05:00
|
|
|
func (c *Cache) PutBlob(digest, path string) error {
|
2021-07-20 16:04:10 -05:00
|
|
|
if path == "" {
|
|
|
|
c.log.Error().Err(errors.ErrEmptyValue).Str("digest", digest).Msg("empty path provided")
|
|
|
|
|
|
|
|
return errors.ErrEmptyValue
|
|
|
|
}
|
|
|
|
|
2020-05-27 16:27:35 -05:00
|
|
|
// use only relative (to rootDir) paths on blobs
|
2022-04-12 05:01:04 -05:00
|
|
|
var err error
|
|
|
|
if c.useRelPaths {
|
|
|
|
path, err = filepath.Rel(c.rootDir, path)
|
|
|
|
if err != nil {
|
|
|
|
c.log.Error().Err(err).Str("path", path).Msg("unable to get relative path")
|
|
|
|
}
|
2020-05-27 16:27:35 -05:00
|
|
|
}
|
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
if err := c.db.Update(func(tx *bbolt.Tx) error {
|
|
|
|
root := tx.Bucket([]byte(BlobsCache))
|
|
|
|
if root == nil {
|
|
|
|
// this is a serious failure
|
|
|
|
err := errors.ErrCacheRootBucket
|
|
|
|
c.log.Error().Err(err).Msg("unable to access root bucket")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return err
|
|
|
|
}
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
bucket, err := root.CreateBucketIfNotExists([]byte(digest))
|
|
|
|
if err != nil {
|
|
|
|
// this is a serious failure
|
|
|
|
c.log.Error().Err(err).Str("bucket", digest).Msg("unable to create a bucket")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// create nested deduped bucket where we store all the deduped blobs + original blob
|
2022-08-30 17:12:10 -05:00
|
|
|
deduped, err := bucket.CreateBucketIfNotExists([]byte(DuplicatesBucket))
|
2022-09-08 10:07:00 -05:00
|
|
|
if err != nil {
|
|
|
|
// this is a serious failure
|
2022-08-30 17:12:10 -05:00
|
|
|
c.log.Error().Err(err).Str("bucket", DuplicatesBucket).Msg("unable to create a bucket")
|
2022-09-08 10:07:00 -05:00
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := deduped.Put([]byte(path), nil); err != nil {
|
2022-08-30 17:12:10 -05:00
|
|
|
c.log.Error().Err(err).Str("bucket", DuplicatesBucket).Str("value", path).Msg("unable to put record")
|
2022-09-08 10:07:00 -05:00
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// create origin bucket and insert only the original blob
|
2022-08-30 17:12:10 -05:00
|
|
|
origin := bucket.Bucket([]byte(OriginalBucket))
|
2022-09-08 10:07:00 -05:00
|
|
|
if origin == nil {
|
|
|
|
// if the bucket doesn't exist yet then 'path' is the original blob
|
2022-08-30 17:12:10 -05:00
|
|
|
origin, err := bucket.CreateBucket([]byte(OriginalBucket))
|
2022-09-07 17:12:14 -05:00
|
|
|
if err != nil {
|
|
|
|
// this is a serious failure
|
2022-08-30 17:12:10 -05:00
|
|
|
c.log.Error().Err(err).Str("bucket", OriginalBucket).Msg("unable to create a bucket")
|
2022-09-07 17:12:14 -05:00
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
if err := origin.Put([]byte(path), nil); err != nil {
|
2022-08-30 17:12:10 -05:00
|
|
|
c.log.Error().Err(err).Str("bucket", OriginalBucket).Str("value", path).Msg("unable to put record")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
return err
|
|
|
|
}
|
2020-02-17 16:57:15 -05:00
|
|
|
}
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return nil
|
|
|
|
}); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *Cache) GetBlob(digest string) (string, error) {
|
|
|
|
var blobPath strings.Builder
|
|
|
|
|
|
|
|
if err := c.db.View(func(tx *bbolt.Tx) error {
|
|
|
|
root := tx.Bucket([]byte(BlobsCache))
|
|
|
|
if root == nil {
|
|
|
|
// this is a serious failure
|
|
|
|
err := errors.ErrCacheRootBucket
|
|
|
|
c.log.Error().Err(err).Msg("unable to access root bucket")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
bucket := root.Bucket([]byte(digest))
|
|
|
|
if bucket != nil {
|
2022-08-30 17:12:10 -05:00
|
|
|
origin := bucket.Bucket([]byte(OriginalBucket))
|
2022-09-08 10:07:00 -05:00
|
|
|
blobPath.WriteString(string(c.getOne(origin)))
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
return errors.ErrCacheMiss
|
|
|
|
}); err != nil {
|
|
|
|
return "", err
|
|
|
|
}
|
|
|
|
|
|
|
|
return blobPath.String(), nil
|
|
|
|
}
|
|
|
|
|
2022-03-21 12:37:23 -05:00
|
|
|
func (c *Cache) HasBlob(digest, blob string) bool {
|
2020-02-17 16:57:15 -05:00
|
|
|
if err := c.db.View(func(tx *bbolt.Tx) error {
|
|
|
|
root := tx.Bucket([]byte(BlobsCache))
|
|
|
|
if root == nil {
|
|
|
|
// this is a serious failure
|
|
|
|
err := errors.ErrCacheRootBucket
|
|
|
|
c.log.Error().Err(err).Msg("unable to access root bucket")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
bucket := root.Bucket([]byte(digest))
|
|
|
|
if bucket == nil {
|
2020-02-17 16:57:15 -05:00
|
|
|
return errors.ErrCacheMiss
|
|
|
|
}
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2022-08-30 17:12:10 -05:00
|
|
|
origin := bucket.Bucket([]byte(OriginalBucket))
|
2022-09-08 10:07:00 -05:00
|
|
|
if origin == nil {
|
|
|
|
return errors.ErrCacheMiss
|
|
|
|
}
|
|
|
|
|
|
|
|
if origin.Get([]byte(blob)) == nil {
|
2020-02-17 16:57:15 -05:00
|
|
|
return errors.ErrCacheMiss
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}); err != nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
func (c *Cache) getOne(bucket *bbolt.Bucket) []byte {
|
|
|
|
if bucket != nil {
|
|
|
|
cursor := bucket.Cursor()
|
|
|
|
k, _ := cursor.First()
|
|
|
|
|
|
|
|
return k
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2022-03-21 12:37:23 -05:00
|
|
|
func (c *Cache) DeleteBlob(digest, path string) error {
|
2020-05-27 16:27:35 -05:00
|
|
|
// use only relative (to rootDir) paths on blobs
|
2022-04-12 05:01:04 -05:00
|
|
|
var err error
|
|
|
|
if c.useRelPaths {
|
|
|
|
path, err = filepath.Rel(c.rootDir, path)
|
|
|
|
if err != nil {
|
|
|
|
c.log.Error().Err(err).Str("path", path).Msg("unable to get relative path")
|
|
|
|
}
|
2020-05-27 16:27:35 -05:00
|
|
|
}
|
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
if err := c.db.Update(func(tx *bbolt.Tx) error {
|
|
|
|
root := tx.Bucket([]byte(BlobsCache))
|
|
|
|
if root == nil {
|
|
|
|
// this is a serious failure
|
|
|
|
err := errors.ErrCacheRootBucket
|
|
|
|
c.log.Error().Err(err).Msg("unable to access root bucket")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2021-12-13 14:23:31 -05:00
|
|
|
bucket := root.Bucket([]byte(digest))
|
|
|
|
if bucket == nil {
|
2020-02-17 16:57:15 -05:00
|
|
|
return errors.ErrCacheMiss
|
|
|
|
}
|
|
|
|
|
2022-08-30 17:12:10 -05:00
|
|
|
deduped := bucket.Bucket([]byte(DuplicatesBucket))
|
2022-09-08 10:07:00 -05:00
|
|
|
if deduped == nil {
|
|
|
|
return errors.ErrCacheMiss
|
|
|
|
}
|
2022-09-07 17:12:14 -05:00
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
if err := deduped.Delete([]byte(path)); err != nil {
|
2022-08-30 17:12:10 -05:00
|
|
|
c.log.Error().Err(err).Str("digest", digest).Str("bucket", DuplicatesBucket).
|
|
|
|
Str("path", path).Msg("unable to delete")
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2022-08-30 17:12:10 -05:00
|
|
|
origin := bucket.Bucket([]byte(OriginalBucket))
|
2022-09-08 10:07:00 -05:00
|
|
|
if origin != nil {
|
|
|
|
originBlob := c.getOne(origin)
|
|
|
|
if originBlob != nil {
|
|
|
|
if err := origin.Delete([]byte(path)); err != nil {
|
2022-08-30 17:12:10 -05:00
|
|
|
c.log.Error().Err(err).Str("digest", digest).Str("bucket", OriginalBucket).
|
|
|
|
Str("path", path).Msg("unable to delete")
|
2020-04-06 20:17:24 -05:00
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
return err
|
|
|
|
}
|
2021-12-13 14:23:31 -05:00
|
|
|
|
2022-09-08 10:07:00 -05:00
|
|
|
// move next candidate to origin bucket, next GetKey will return this one and storage will move the content here
|
|
|
|
dedupedBlob := c.getOne(deduped)
|
|
|
|
if dedupedBlob != nil {
|
|
|
|
if err := origin.Put(dedupedBlob, nil); err != nil {
|
2022-08-30 17:12:10 -05:00
|
|
|
c.log.Error().Err(err).Str("digest", digest).Str("bucket", OriginalBucket).Str("path", path).Msg("unable to put")
|
2022-09-08 10:07:00 -05:00
|
|
|
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
2022-09-07 17:12:14 -05:00
|
|
|
}
|
2022-09-08 10:07:00 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
// if no key in origin bucket then digest bucket is empty, remove it
|
|
|
|
k := c.getOne(origin)
|
|
|
|
if k == nil {
|
|
|
|
c.log.Debug().Str("digest", digest).Str("path", path).Msg("deleting empty bucket")
|
|
|
|
if err := root.DeleteBucket([]byte(digest)); err != nil {
|
|
|
|
c.log.Error().Err(err).Str("digest", digest).Str("bucket", digest).Str("path", path).Msg("unable to delete")
|
2022-09-07 17:12:14 -05:00
|
|
|
|
2020-04-06 20:17:24 -05:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-02-17 16:57:15 -05:00
|
|
|
return nil
|
|
|
|
}); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|