Evgenii Stratonikov
11ff1ae521
Under load changing shard mode can lead to it being removed from the list during some other PUT. ``` Dec 28 07:01:26 az neofs-node[364505]: panic: runtime error: invalid memory address or nil pointer dereference Dec 28 07:01:26 az neofs-node[364505]: [signal SIGSEGV: segmentation violation code=0x1 addr=0x20 pc=0xc9fbb1] Dec 28 07:01:26 az neofs-node[364505]: goroutine 11791912 [running]: Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine.(*StorageEngine).putToShard(0xc000435490, {0xc0003f7a28?, 0xc0001192c0?}, 0x2, {0x0, 0x> Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine/put.go:91 +0x1b1 Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine.(*StorageEngine).put.func1(0xc000435490?, {0xc0003f7a28?, 0xc0001192c0?}) Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine/put.go:71 +0x19c Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine.(*StorageEngine).iterateOverSortedShards(0x1?, {{0x62, 0x23, 0xfe, 0x60, 0x67, 0xd5, 0x> Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine/shards.go:225 +0xc8 Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine.(*StorageEngine).put(0xc000435490, {0x1?}) Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine/put.go:66 +0x2a9 Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine.(*StorageEngine).Put.func1() Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine/put.go:43 +0x2a Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine.(*StorageEngine).execIfNotBlocked(0x8?, 0x38?) 
Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine/control.go:147 +0xcf Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine.(*StorageEngine).Put(0xc4df775a80?, {0x0?}) Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine/put.go:42 +0x65 Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine.Put(0xc06d928b80?, 0xc06b1b8dc8?) Dec 28 07:01:26 az neofs-node[364505]: github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine/put.go:158 +0x19 Dec 28 07:01:26 az neofs-node[364505]: main.engineWithoutNotifications.Put({0x20301b?}, 0x20301b?) ``` Signed-off-by: Evgenii Stratonikov <e.stratonikov@yadro.com>
165 lines
4 KiB
Go
165 lines
4 KiB
Go
package engine
|
|
|
|
import (
|
|
"errors"
|
|
|
|
"github.com/TrueCloudLab/frostfs-node/pkg/core/object"
|
|
"github.com/TrueCloudLab/frostfs-node/pkg/local_object_storage/blobstor"
|
|
"github.com/TrueCloudLab/frostfs-node/pkg/local_object_storage/blobstor/common"
|
|
"github.com/TrueCloudLab/frostfs-node/pkg/local_object_storage/shard"
|
|
"github.com/TrueCloudLab/frostfs-node/pkg/util"
|
|
objectSDK "github.com/TrueCloudLab/frostfs-sdk-go/object"
|
|
oid "github.com/TrueCloudLab/frostfs-sdk-go/object/id"
|
|
"go.uber.org/zap"
|
|
)
|
|
|
|
// PutPrm groups the parameters of Put operation.
|
|
type PutPrm struct {
|
|
obj *objectSDK.Object
|
|
}
|
|
|
|
// PutRes holds the results of the Put operation.
//
// It currently carries no values.
type PutRes struct{}
|
|
|
|
// errPutShard is the error reported by put when the object was neither
// stored in nor found on any of the shards that were tried.
var errPutShard = errors.New("could not put object to any shard")
|
|
|
|
// WithObject is a Put option to set object to save.
|
|
//
|
|
// Option is required.
|
|
func (p *PutPrm) WithObject(obj *objectSDK.Object) {
|
|
p.obj = obj
|
|
}
|
|
|
|
// Put saves the object to local storage.
|
|
//
|
|
// Returns any error encountered that
|
|
// did not allow to completely save the object.
|
|
//
|
|
// Returns an error if executions are blocked (see BlockExecution).
|
|
//
|
|
// Returns an error of type apistatus.ObjectAlreadyRemoved if the object has been marked as removed.
|
|
func (e *StorageEngine) Put(prm PutPrm) (res PutRes, err error) {
|
|
err = e.execIfNotBlocked(func() error {
|
|
res, err = e.put(prm)
|
|
return err
|
|
})
|
|
|
|
return
|
|
}
|
|
|
|
func (e *StorageEngine) put(prm PutPrm) (PutRes, error) {
|
|
if e.metrics != nil {
|
|
defer elapsed(e.metrics.AddPutDuration)()
|
|
}
|
|
|
|
addr := object.AddressOf(prm.obj)
|
|
|
|
// In #1146 this check was parallelized, however, it became
|
|
// much slower on fast machines for 4 shards.
|
|
_, err := e.exists(addr)
|
|
if err != nil {
|
|
return PutRes{}, err
|
|
}
|
|
|
|
finished := false
|
|
|
|
e.iterateOverSortedShards(addr, func(ind int, sh hashedShard) (stop bool) {
|
|
e.mtx.RLock()
|
|
pool, ok := e.shardPools[sh.ID().String()]
|
|
e.mtx.RUnlock()
|
|
if !ok {
|
|
// Shard was concurrently removed, skip.
|
|
return false
|
|
}
|
|
|
|
putDone, exists := e.putToShard(sh, ind, pool, addr, prm.obj)
|
|
finished = putDone || exists
|
|
return finished
|
|
})
|
|
|
|
if !finished {
|
|
err = errPutShard
|
|
}
|
|
|
|
return PutRes{}, err
|
|
}
|
|
|
|
// putToShard puts object to sh.
|
|
// First return value is true iff put has been successfully done.
|
|
// Second return value is true iff object already exists.
|
|
func (e *StorageEngine) putToShard(sh hashedShard, ind int, pool util.WorkerPool, addr oid.Address, obj *objectSDK.Object) (bool, bool) {
|
|
var putSuccess, alreadyExists bool
|
|
|
|
exitCh := make(chan struct{})
|
|
|
|
if err := pool.Submit(func() {
|
|
defer close(exitCh)
|
|
|
|
var existPrm shard.ExistsPrm
|
|
existPrm.SetAddress(addr)
|
|
|
|
exists, err := sh.Exists(existPrm)
|
|
if err != nil {
|
|
if shard.IsErrObjectExpired(err) {
|
|
// object is already found but
|
|
// expired => do nothing with it
|
|
alreadyExists = true
|
|
}
|
|
|
|
return // this is not ErrAlreadyRemoved error so we can go to the next shard
|
|
}
|
|
|
|
alreadyExists = exists.Exists()
|
|
if alreadyExists {
|
|
if ind != 0 {
|
|
var toMoveItPrm shard.ToMoveItPrm
|
|
toMoveItPrm.SetAddress(addr)
|
|
|
|
_, err = sh.ToMoveIt(toMoveItPrm)
|
|
if err != nil {
|
|
e.log.Warn("could not mark object for shard relocation",
|
|
zap.Stringer("shard", sh.ID()),
|
|
zap.String("error", err.Error()),
|
|
)
|
|
}
|
|
}
|
|
|
|
return
|
|
}
|
|
|
|
var putPrm shard.PutPrm
|
|
putPrm.SetObject(obj)
|
|
|
|
_, err = sh.Put(putPrm)
|
|
if err != nil {
|
|
if errors.Is(err, shard.ErrReadOnlyMode) || errors.Is(err, blobstor.ErrNoPlaceFound) ||
|
|
errors.Is(err, common.ErrReadOnly) || errors.Is(err, common.ErrNoSpace) {
|
|
e.log.Warn("could not put object to shard",
|
|
zap.Stringer("shard_id", sh.ID()),
|
|
zap.String("error", err.Error()))
|
|
return
|
|
}
|
|
|
|
e.reportShardError(sh, "could not put object to shard", err)
|
|
return
|
|
}
|
|
|
|
putSuccess = true
|
|
}); err != nil {
|
|
close(exitCh)
|
|
}
|
|
|
|
<-exitCh
|
|
|
|
return putSuccess, alreadyExists
|
|
}
|
|
|
|
// Put writes provided object to local storage.
|
|
func Put(storage *StorageEngine, obj *objectSDK.Object) error {
|
|
var putPrm PutPrm
|
|
putPrm.WithObject(obj)
|
|
|
|
_, err := storage.Put(putPrm)
|
|
|
|
return err
|
|
}
|