406 lines
11 KiB
Go
406 lines
11 KiB
Go
package meta
|
|
|
|
import (
|
|
"bytes"
|
|
"context"
|
|
"fmt"
|
|
"time"
|
|
|
|
"git.frostfs.info/TrueCloudLab/frostfs-node/pkg/local_object_storage/internal/metaerr"
|
|
"git.frostfs.info/TrueCloudLab/frostfs-node/pkg/local_object_storage/util/logicerr"
|
|
"git.frostfs.info/TrueCloudLab/frostfs-observability/tracing"
|
|
apistatus "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/client/status"
|
|
cid "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/container/id"
|
|
objectSDK "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/object"
|
|
oid "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/object/id"
|
|
"go.etcd.io/bbolt"
|
|
"go.opentelemetry.io/otel/attribute"
|
|
"go.opentelemetry.io/otel/trace"
|
|
)
|
|
|
|
// bucketNameLocked is the name of the top-level bucket that keeps, in one
// nested bucket per container, the records of locked objects together with
// the lists of their lockers.
var bucketNameLocked = []byte{lockedPrefix}
|
|
|
|
// keyValue is a pending change to a bucket record: Key identifies the record
// and Value is its new content. A nil Value marks the record for deletion
// (see applyBucketUpdates).
type keyValue struct {
	Key, Value []byte
}
|
|
|
|
// returns name of the bucket with objects of type LOCK for specified container.
|
|
func bucketNameLockers(idCnr cid.ID, key []byte) []byte {
|
|
return bucketName(idCnr, lockersPrefix, key)
|
|
}
|
|
|
|
// Lock marks objects as locked with another object. All objects are from the
|
|
// specified container.
|
|
//
|
|
// Allows locking regular objects only (otherwise returns apistatus.LockNonRegularObject).
|
|
//
|
|
// Locked list should be unique. Panics if it is empty.
|
|
func (db *DB) Lock(ctx context.Context, cnr cid.ID, locker oid.ID, locked []oid.ID, expEpoch uint64) error {
|
|
var (
|
|
startedAt = time.Now()
|
|
success = false
|
|
)
|
|
defer func() {
|
|
db.metrics.AddMethodDuration("Lock", time.Since(startedAt), success)
|
|
}()
|
|
|
|
_, span := tracing.StartSpanFromContext(ctx, "metabase.Lock",
|
|
trace.WithAttributes(
|
|
attribute.String("container_id", cnr.EncodeToString()),
|
|
attribute.String("locker", locker.EncodeToString()),
|
|
attribute.Int("locked_count", len(locked)),
|
|
))
|
|
defer span.End()
|
|
|
|
db.modeMtx.RLock()
|
|
defer db.modeMtx.RUnlock()
|
|
|
|
if db.mode.NoMetabase() {
|
|
return ErrDegradedMode
|
|
} else if db.mode.ReadOnly() {
|
|
return ErrReadOnlyMode
|
|
}
|
|
|
|
if len(locked) == 0 {
|
|
panic("empty locked list")
|
|
}
|
|
|
|
err := db.lockInternal(locked, cnr, locker, expEpoch)
|
|
success = err == nil
|
|
return err
|
|
}
|
|
|
|
func (db *DB) lockInternal(locked []oid.ID, cnr cid.ID, locker oid.ID, expEpoch uint64) error {
|
|
bucketKeysLocked := make([][]byte, len(locked))
|
|
for i := range locked {
|
|
bucketKeysLocked[i] = objectKey(locked[i], make([]byte, objectKeySize))
|
|
}
|
|
key := make([]byte, cidSize)
|
|
|
|
return metaerr.Wrap(db.boltDB.Batch(func(tx *bbolt.Tx) error {
|
|
if firstIrregularObjectType(tx, cnr, bucketKeysLocked...) != objectSDK.TypeRegular {
|
|
return logicerr.Wrap(new(apistatus.LockNonRegularObject))
|
|
}
|
|
|
|
bucketLocked := tx.Bucket(bucketNameLocked)
|
|
|
|
cnr.Encode(key)
|
|
bucketLockedContainer, err := bucketLocked.CreateBucketIfNotExists(key)
|
|
if err != nil {
|
|
return fmt.Errorf("create container bucket for locked objects %v: %w", cnr, err)
|
|
}
|
|
|
|
var newLock lockWithExpEpoch
|
|
newLock.encode(locker, expEpoch)
|
|
|
|
loop:
|
|
for i := range bucketKeysLocked {
|
|
locks, err := decodeLockWithExpEpochList(bucketLockedContainer.Get(bucketKeysLocked[i]))
|
|
if err != nil {
|
|
return fmt.Errorf("decode list of object lockers: %w", err)
|
|
}
|
|
|
|
var lockID oid.ID
|
|
var lockExpEpoch uint64
|
|
var foundLock bool
|
|
for j := range locks {
|
|
if locks[j].id == newLock.id {
|
|
if err := locks[j].decode(&lockID, &lockExpEpoch); err != nil {
|
|
return fmt.Errorf("decode lock: %w", err)
|
|
}
|
|
if lockExpEpoch != NoExpirationEpoch {
|
|
continue loop
|
|
}
|
|
// Add expiration epoch to lock because it doesn't have it.
|
|
locks[j].encode(lockID, expEpoch)
|
|
foundLock = true
|
|
break
|
|
}
|
|
}
|
|
|
|
if !foundLock {
|
|
locks = append(locks, newLock)
|
|
}
|
|
|
|
data, err := encodeLockWithExpEpochList(locks)
|
|
if err != nil {
|
|
return fmt.Errorf("encode list of object lockers: %w", err)
|
|
}
|
|
|
|
err = bucketLockedContainer.Put(bucketKeysLocked[i], data)
|
|
if err != nil {
|
|
return fmt.Errorf("update list of object lockers: %w", err)
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}))
|
|
}
|
|
|
|
// FreeLockedBy unlocks all objects in DB which are locked by lockers.
|
|
// Returns slice of unlocked object ID's or an error.
|
|
func (db *DB) FreeLockedBy(lockers []oid.Address) ([]oid.Address, error) {
|
|
var (
|
|
startedAt = time.Now()
|
|
success = false
|
|
)
|
|
defer func() {
|
|
db.metrics.AddMethodDuration("FreeLockedBy", time.Since(startedAt), success)
|
|
}()
|
|
|
|
db.modeMtx.RLock()
|
|
defer db.modeMtx.RUnlock()
|
|
|
|
if db.mode.NoMetabase() {
|
|
return nil, ErrDegradedMode
|
|
}
|
|
|
|
var unlockedObjects []oid.Address
|
|
|
|
if err := db.boltDB.Batch(func(tx *bbolt.Tx) error {
|
|
for i := range lockers {
|
|
unlocked, err := freePotentialLocks(tx, lockers[i].Container(), lockers[i].Object())
|
|
if err != nil {
|
|
return err
|
|
}
|
|
unlockedObjects = append(unlockedObjects, unlocked...)
|
|
}
|
|
|
|
return nil
|
|
}); err != nil {
|
|
return nil, metaerr.Wrap(err)
|
|
}
|
|
success = true
|
|
return unlockedObjects, nil
|
|
}
|
|
|
|
// checks if specified object is locked in the specified container.
|
|
func objectLocked(tx *bbolt.Tx, idCnr cid.ID, idObj oid.ID) bool {
|
|
bucketLocked := tx.Bucket(bucketNameLocked)
|
|
if bucketLocked != nil {
|
|
key := make([]byte, cidSize)
|
|
idCnr.Encode(key)
|
|
bucketLockedContainer := bucketLocked.Bucket(key)
|
|
if bucketLockedContainer != nil {
|
|
return bucketLockedContainer.Get(objectKey(idObj, key)) != nil
|
|
}
|
|
}
|
|
|
|
return false
|
|
}
|
|
|
|
// return `LOCK` id's if specified object is locked in the specified container.
|
|
func getLocks(tx *bbolt.Tx, idCnr cid.ID, idObj oid.ID) ([]Lock, error) {
|
|
var lockers []Lock
|
|
bucketLocked := tx.Bucket(bucketNameLocked)
|
|
if bucketLocked != nil {
|
|
key := make([]byte, cidSize)
|
|
idCnr.Encode(key)
|
|
bucketLockedContainer := bucketLocked.Bucket(key)
|
|
if bucketLockedContainer != nil {
|
|
binObjIDs, err := decodeLockWithExpEpochList(bucketLockedContainer.Get(objectKey(idObj, key)))
|
|
if err != nil {
|
|
return nil, fmt.Errorf("decode list of object lockers: %w", err)
|
|
}
|
|
for _, binObjID := range binObjIDs {
|
|
var id oid.ID
|
|
var expEpoch uint64
|
|
|
|
if err = binObjID.decode(&id, &expEpoch); err != nil {
|
|
return nil, err
|
|
}
|
|
lockers = append(lockers, Lock{ID: id, ExpEpoch: expEpoch})
|
|
}
|
|
}
|
|
}
|
|
return lockers, nil
|
|
}
|
|
|
|
// releases all records about the objects locked by the locker.
|
|
// Returns slice of unlocked object ID's or an error.
|
|
//
|
|
// Operation is very resource-intensive, which is caused by the admissibility
|
|
// of multiple locks. Also, if we knew what objects are locked, it would be
|
|
// possible to speed up the execution.
|
|
func freePotentialLocks(tx *bbolt.Tx, idCnr cid.ID, locker oid.ID) ([]oid.Address, error) {
|
|
var unlockedObjects []oid.Address
|
|
bucketLocked := tx.Bucket(bucketNameLocked)
|
|
if bucketLocked == nil {
|
|
return unlockedObjects, nil
|
|
}
|
|
|
|
key := make([]byte, cidSize)
|
|
idCnr.Encode(key)
|
|
|
|
bucketLockedContainer := bucketLocked.Bucket(key)
|
|
if bucketLockedContainer == nil {
|
|
return unlockedObjects, nil
|
|
}
|
|
|
|
keyLocker := objectKey(locker, key)
|
|
updates := make([]keyValue, 0)
|
|
err := bucketLockedContainer.ForEach(func(k, v []byte) error {
|
|
keyLockers, err := decodeLockWithExpEpochList(v)
|
|
if err != nil {
|
|
return fmt.Errorf("decode list of lockers in locked bucket: %w", err)
|
|
}
|
|
|
|
for i := range keyLockers {
|
|
if bytes.Equal(keyLockers[i].id[:], keyLocker) {
|
|
if len(keyLockers) == 1 {
|
|
updates = append(updates, keyValue{
|
|
Key: k,
|
|
Value: nil,
|
|
})
|
|
|
|
var id oid.ID
|
|
if err := id.Decode(k); err != nil {
|
|
return fmt.Errorf("decode unlocked object id error: %w", err)
|
|
}
|
|
|
|
var addr oid.Address
|
|
addr.SetContainer(idCnr)
|
|
addr.SetObject(id)
|
|
|
|
unlockedObjects = append(unlockedObjects, addr)
|
|
} else {
|
|
// exclude locker
|
|
keyLockers = append(keyLockers[:i], keyLockers[i+1:]...)
|
|
|
|
v, err = encodeLockWithExpEpochList(keyLockers)
|
|
if err != nil {
|
|
return fmt.Errorf("encode updated list of lockers: %w", err)
|
|
}
|
|
|
|
updates = append(updates, keyValue{
|
|
Key: k,
|
|
Value: v,
|
|
})
|
|
}
|
|
|
|
return nil
|
|
}
|
|
}
|
|
|
|
return nil
|
|
})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
if err = applyBucketUpdates(bucketLockedContainer, updates); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return unlockedObjects, nil
|
|
}
|
|
|
|
func applyBucketUpdates(bucket *bbolt.Bucket, updates []keyValue) error {
|
|
for _, update := range updates {
|
|
if update.Value == nil {
|
|
err := bucket.Delete(update.Key)
|
|
if err != nil {
|
|
return fmt.Errorf("delete locked object record from locked bucket: %w", err)
|
|
}
|
|
} else {
|
|
err := bucket.Put(update.Key, update.Value)
|
|
if err != nil {
|
|
return fmt.Errorf("update list of lockers: %w", err)
|
|
}
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// IsLockedPrm groups the parameters of IsLocked operation.
|
|
type IsLockedPrm struct {
|
|
addr oid.Address
|
|
}
|
|
|
|
// SetAddress sets object address that will be checked for lock relations.
|
|
func (i *IsLockedPrm) SetAddress(addr oid.Address) {
|
|
i.addr = addr
|
|
}
|
|
|
|
// IsLockedRes is the result of the IsLocked operation.
type IsLockedRes struct {
	// locked is true if a lock record was found for the requested object.
	locked bool
}

// Locked reports whether the requested object is locked according to the
// state of the metabase at the time of the check.
func (i IsLockedRes) Locked() bool {
	isLocked := i.locked
	return isLocked
}
|
|
|
|
// IsLocked checks is the provided object is locked by any `LOCK`. Not found
|
|
// object is considered as non-locked.
|
|
//
|
|
// Returns only non-logical errors related to underlying database.
|
|
func (db *DB) IsLocked(ctx context.Context, prm IsLockedPrm) (res IsLockedRes, err error) {
|
|
var (
|
|
startedAt = time.Now()
|
|
success = false
|
|
)
|
|
defer func() {
|
|
db.metrics.AddMethodDuration("IsLocked", time.Since(startedAt), success)
|
|
}()
|
|
|
|
_, span := tracing.StartSpanFromContext(ctx, "metabase.IsLocked",
|
|
trace.WithAttributes(
|
|
attribute.String("address", prm.addr.EncodeToString()),
|
|
))
|
|
defer span.End()
|
|
|
|
db.modeMtx.RLock()
|
|
defer db.modeMtx.RUnlock()
|
|
|
|
if db.mode.NoMetabase() {
|
|
return res, ErrDegradedMode
|
|
}
|
|
err = metaerr.Wrap(db.boltDB.View(func(tx *bbolt.Tx) error {
|
|
res.locked = objectLocked(tx, prm.addr.Container(), prm.addr.Object())
|
|
return nil
|
|
}))
|
|
success = err == nil
|
|
return res, err
|
|
}
|
|
|
|
type Lock struct {
|
|
ID oid.ID
|
|
ExpEpoch uint64
|
|
}
|
|
|
|
// GetLocks return `LOCK` id's if provided object is locked by any `LOCK`. Not found
|
|
// object is considered as non-locked.
|
|
//
|
|
// Returns only non-logical errors related to underlying database.
|
|
func (db *DB) GetLocks(ctx context.Context, addr oid.Address) (res []Lock, err error) {
|
|
var (
|
|
startedAt = time.Now()
|
|
success = false
|
|
)
|
|
defer func() {
|
|
db.metrics.AddMethodDuration("GetLocks", time.Since(startedAt), success)
|
|
}()
|
|
|
|
_, span := tracing.StartSpanFromContext(ctx, "metabase.GetLocks",
|
|
trace.WithAttributes(
|
|
attribute.String("address", addr.EncodeToString()),
|
|
))
|
|
defer span.End()
|
|
|
|
db.modeMtx.RLock()
|
|
defer db.modeMtx.RUnlock()
|
|
|
|
if db.mode.NoMetabase() {
|
|
return res, ErrDegradedMode
|
|
}
|
|
err = metaerr.Wrap(db.boltDB.View(func(tx *bbolt.Tx) error {
|
|
res, err = getLocks(tx, addr.Container(), addr.Object())
|
|
return nil
|
|
}))
|
|
success = err == nil
|
|
return res, err
|
|
}
|