forked from TrueCloudLab/frostfs-node
634792077e
Includes extending listing methods in the Storage Engine with object types. It allows tuning replication/policer algorithms: container nodes do not remove `LOCK` objects as redundant and try to fulfill `LOCK` placement on the other container nodes. Signed-off-by: Pavel Karpy <carpawell@nspcc.ru>
100 lines
2 KiB
Go
100 lines
2 KiB
Go
package policer
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"time"
|
|
|
|
objectcore "github.com/nspcc-dev/neofs-node/pkg/core/object"
|
|
"github.com/nspcc-dev/neofs-node/pkg/local_object_storage/engine"
|
|
"go.uber.org/zap"
|
|
)
|
|
|
|
func (p *Policer) Run(ctx context.Context) {
|
|
defer func() {
|
|
p.log.Info("routine stopped")
|
|
}()
|
|
|
|
go p.poolCapacityWorker(ctx)
|
|
p.shardPolicyWorker(ctx)
|
|
}
|
|
|
|
func (p *Policer) shardPolicyWorker(ctx context.Context) {
|
|
var (
|
|
addrs []objectcore.AddressWithType
|
|
cursor *engine.Cursor
|
|
err error
|
|
)
|
|
|
|
for {
|
|
select {
|
|
case <-ctx.Done():
|
|
return
|
|
default:
|
|
}
|
|
|
|
addrs, cursor, err = p.jobQueue.Select(cursor, p.batchSize)
|
|
if err != nil {
|
|
if errors.Is(err, engine.ErrEndOfListing) {
|
|
time.Sleep(time.Second) // finished whole cycle, sleep a bit
|
|
continue
|
|
}
|
|
p.log.Warn("failure at object select for replication", zap.Error(err))
|
|
}
|
|
|
|
for i := range addrs {
|
|
select {
|
|
case <-ctx.Done():
|
|
return
|
|
default:
|
|
addr := addrs[i].Address
|
|
if p.objsInWork.inWork(addr) {
|
|
// do not process an object
|
|
// that is in work
|
|
continue
|
|
}
|
|
|
|
err = p.taskPool.Submit(func() {
|
|
v, ok := p.cache.Get(addr)
|
|
if ok && time.Since(v.(time.Time)) < p.evictDuration {
|
|
return
|
|
}
|
|
|
|
p.objsInWork.add(addr)
|
|
|
|
p.processObject(ctx, addrs[i])
|
|
|
|
p.cache.Add(addr, time.Now())
|
|
p.objsInWork.remove(addr)
|
|
})
|
|
if err != nil {
|
|
p.log.Warn("pool submission", zap.Error(err))
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
func (p *Policer) poolCapacityWorker(ctx context.Context) {
|
|
ticker := time.NewTicker(p.rebalanceFreq)
|
|
for {
|
|
select {
|
|
case <-ctx.Done():
|
|
ticker.Stop()
|
|
return
|
|
case <-ticker.C:
|
|
neofsSysLoad := p.loader.ObjectServiceLoad()
|
|
newCapacity := int((1.0 - neofsSysLoad) * float64(p.maxCapacity))
|
|
if newCapacity == 0 {
|
|
newCapacity++
|
|
}
|
|
|
|
if p.taskPool.Cap() != newCapacity {
|
|
p.taskPool.Tune(newCapacity)
|
|
p.log.Debug("tune replication capacity",
|
|
zap.Float64("system_load", neofsSysLoad),
|
|
zap.Int("new_capacity", newCapacity))
|
|
}
|
|
}
|
|
}
|
|
}
|