Mirror of https://github.com/nspcc-dev/neo-go.git, synced 2024-12-23 13:41:37 +00:00

Commit 3010324c4f: Drain the channel only if it has pending events. This avoids trying to read from an already-empty channel. Close #3734
Signed-off-by: Ekaterina Pavlova <ekt@morphbits.io>
580 lines | 16 KiB | Go

package blockfetcher

import (
	"context"
	"crypto/sha256"
	"errors"
	"fmt"
	"io"
	"net/url"
	"strconv"
	"strings"
	"sync"
	"sync/atomic"
	"time"

	"github.com/nspcc-dev/neo-go/pkg/config"
	"github.com/nspcc-dev/neo-go/pkg/core/block"
	gio "github.com/nspcc-dev/neo-go/pkg/io"
	"github.com/nspcc-dev/neo-go/pkg/services/oracle/neofs"
	"github.com/nspcc-dev/neo-go/pkg/wallet"
	"github.com/nspcc-dev/neofs-sdk-go/client"
	"github.com/nspcc-dev/neofs-sdk-go/container"
	cid "github.com/nspcc-dev/neofs-sdk-go/container/id"
	"github.com/nspcc-dev/neofs-sdk-go/object"
	oid "github.com/nspcc-dev/neofs-sdk-go/object/id"
	"github.com/nspcc-dev/neofs-sdk-go/pool"
	"github.com/nspcc-dev/neofs-sdk-go/user"
	"go.uber.org/zap"
)

const (
	// oidSize is the size of the object ID in NeoFS.
	oidSize = sha256.Size
	// defaultTimeout is the default timeout for NeoFS requests.
	defaultTimeout = 5 * time.Minute
	// defaultOIDBatchSize is the default number of OIDs to search and fetch at once.
	defaultOIDBatchSize = 8000
	// defaultDownloaderWorkersCount is the default number of workers downloading blocks.
	defaultDownloaderWorkersCount = 100
)

// Constants related to NeoFS pool request timeouts.
const (
	// defaultDialTimeout is a default timeout used to establish connection with
	// NeoFS storage nodes.
	defaultDialTimeout = 30 * time.Second
	// defaultStreamTimeout is a default timeout used for NeoFS streams processing.
	// It has a significantly large value to reliably avoid timeout problems with
	// heavy SEARCH requests.
	defaultStreamTimeout = 10 * time.Minute
	// defaultHealthcheckTimeout is a timeout for a request to a NeoFS storage node
	// used to decide if it is alive.
	defaultHealthcheckTimeout = 10 * time.Second
)

// Constants related to the retry mechanism.
const (
	// maxRetries is the maximum number of retries for a single operation.
	maxRetries = 5
	// initialBackoff is the initial backoff duration.
	initialBackoff = 500 * time.Millisecond
	// backoffFactor is the factor by which the backoff duration is multiplied.
	backoffFactor = 2
	// maxBackoff is the maximum backoff duration.
	maxBackoff = 20 * time.Second
)
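
// An inferred note, not part of the upstream file: with the settings above,
// retry (see below) sleeps 500ms, 1s, 2s and 4s between its five attempts,
// i.e. four waits of 7.5s in total, each doubled by backoffFactor and all
// comfortably below the 20s maxBackoff cap. The cap only starts to matter if
// maxRetries is ever raised.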

// Ledger is an interface to Blockchain sufficient for Service.
type Ledger interface {
	GetConfig() config.Blockchain
	BlockHeight() uint32
}

// poolWrapper wraps a NeoFS pool to adapt its Close method to return an error.
type poolWrapper struct {
	*pool.Pool
}

// Close closes the pool and returns nil.
func (p poolWrapper) Close() error {
	p.Pool.Close()
	return nil
}
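
// An inferred note (not part of the upstream file): pool.Pool.Close returns
// nothing, so the wrapper above gives the pool an error-returning Close that
// matches io.Closer, which is how exiter treats it (`_ = bfs.pool.Close()`).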

// Service is a service that fetches blocks from NeoFS.
type Service struct {
	// isActive denotes whether the service is working or in the process of shutdown.
	isActive          atomic.Bool
	log               *zap.Logger
	cfg               config.NeoFSBlockFetcher
	stateRootInHeader bool

	chain        Ledger
	pool         poolWrapper
	enqueueBlock func(*block.Block) error
	account      *wallet.Account

	oidsCh chan oid.ID
	// wg is a wait group for block downloaders.
	wg sync.WaitGroup

	// Global context for cancelling download operations.
	ctx       context.Context
	ctxCancel context.CancelFunc

	// A set of channels managing graceful Service shutdown.
	quit                  chan bool
	quitOnce              sync.Once
	exiterToOIDDownloader chan struct{}
	exiterToShutdown      chan struct{}
	oidDownloaderToExiter chan struct{}

	shutdownCallback func()
}
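
// An inferred summary of the shutdown signal flow (not part of the upstream
// file): stopService sends the force flag over quit exactly once; exiter picks
// it up, optionally cancels ctx, closes exiterToOIDDownloader and waits on
// oidDownloaderToExiter; it then closes oidsCh, waits on the block downloader
// WaitGroup and finally closes exiterToShutdown to unblock Shutdown.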

// New creates a new BlockFetcher Service.
func New(chain Ledger, cfg config.NeoFSBlockFetcher, logger *zap.Logger, putBlock func(*block.Block) error, shutdownCallback func()) (*Service, error) {
	var (
		account *wallet.Account
		err     error
	)
	if !cfg.Enabled {
		return &Service{}, nil
	}
	if cfg.UnlockWallet.Path != "" {
		walletFromFile, err := wallet.NewWalletFromFile(cfg.UnlockWallet.Path)
		if err != nil {
			return nil, err
		}
		for _, acc := range walletFromFile.Accounts {
			if err := acc.Decrypt(cfg.UnlockWallet.Password, walletFromFile.Scrypt); err == nil {
				account = acc
				break
			}
		}
		if account == nil {
			return nil, errors.New("failed to decrypt any account in the wallet")
		}
	} else {
		account, err = wallet.NewAccount()
		if err != nil {
			return nil, err
		}
	}
	if cfg.Timeout <= 0 {
		cfg.Timeout = defaultTimeout
	}
	if cfg.OIDBatchSize <= 0 {
		cfg.OIDBatchSize = defaultOIDBatchSize
	}
	if cfg.DownloaderWorkersCount <= 0 {
		cfg.DownloaderWorkersCount = defaultDownloaderWorkersCount
	}
	if len(cfg.Addresses) == 0 {
		return nil, errors.New("no addresses provided")
	}

	params := pool.DefaultOptions()
	params.SetHealthcheckTimeout(defaultHealthcheckTimeout)
	params.SetNodeDialTimeout(defaultDialTimeout)
	params.SetNodeStreamTimeout(defaultStreamTimeout)
	p, err := pool.New(pool.NewFlatNodeParams(cfg.Addresses), user.NewAutoIDSignerRFC6979(account.PrivateKey().PrivateKey), params)
	if err != nil {
		return nil, err
	}
	return &Service{
		chain: chain,
		pool:  poolWrapper{Pool: p},
		log:   logger,
		cfg:   cfg,

		enqueueBlock:      putBlock,
		account:           account,
		stateRootInHeader: chain.GetConfig().StateRootInHeader,
		shutdownCallback:  shutdownCallback,

		quit:                  make(chan bool),
		exiterToOIDDownloader: make(chan struct{}),
		exiterToShutdown:      make(chan struct{}),
		oidDownloaderToExiter: make(chan struct{}),

		// Use a buffer of two batch sizes to load OIDs in advance:
		//  * the first full batch of OIDs is being processed by the Downloader;
		//  * the second full batch of OIDs is available for the Downloader to fetch immediately;
		//  * the third, half-filled batch of OIDs is being collected by the OIDs fetcher.
		oidsCh: make(chan oid.ID, 2*cfg.OIDBatchSize),
	}, nil
}
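
// A minimal usage sketch (illustrative only; chain, cfg and logger are assumed
// to be prepared by the caller, and the two callbacks are hypothetical
// stand-ins for whatever the node actually wires in):
//
//	svc, err := blockfetcher.New(chain, cfg, logger,
//		func(b *block.Block) error { return blockQueue.Put(b) }, // enqueue callback
//		func() { logger.Info("block fetcher finished") },        // shutdown callback
//	)
//	if err != nil {
//		return err
//	}
//	if err := svc.Start(); err != nil {
//		return err
//	}
//	defer svc.Shutdown()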

// Start runs the NeoFS BlockFetcher service.
func (bfs *Service) Start() error {
	if !bfs.isActive.CompareAndSwap(false, true) {
		return nil
	}
	bfs.log.Info("starting NeoFS BlockFetcher service")
	var (
		containerID  cid.ID
		containerObj container.Container
		err          error
	)
	bfs.ctx, bfs.ctxCancel = context.WithCancel(context.Background())
	if err = bfs.pool.Dial(context.Background()); err != nil {
		bfs.isActive.CompareAndSwap(true, false)
		return fmt.Errorf("failed to dial NeoFS pool: %w", err)
	}

	err = containerID.DecodeString(bfs.cfg.ContainerID)
	if err != nil {
		bfs.isActive.CompareAndSwap(true, false)
		return fmt.Errorf("failed to decode container ID: %w", err)
	}

	err = bfs.retry(func() error {
		containerObj, err = bfs.pool.ContainerGet(bfs.ctx, containerID, client.PrmContainerGet{})
		return err
	})
	if err != nil {
		bfs.isActive.CompareAndSwap(true, false)
		return fmt.Errorf("failed to get container: %w", err)
	}
	containerMagic := containerObj.Attribute("Magic")
	if containerMagic != strconv.Itoa(int(bfs.chain.GetConfig().Magic)) {
		bfs.isActive.CompareAndSwap(true, false)
		return fmt.Errorf("container magic mismatch: expected %d, got %s", bfs.chain.GetConfig().Magic, containerMagic)
	}
	// Start the routine that manages the Service shutdown process.
	go bfs.exiter()

	// Start the OIDs downloader routine.
	go bfs.oidDownloader()

	// Start the set of block downloading routines.
	for range bfs.cfg.DownloaderWorkersCount {
		bfs.wg.Add(1)
		go bfs.blockDownloader()
	}
	return nil
}

// oidDownloader runs the appropriate block OID fetching method based on the configuration.
func (bfs *Service) oidDownloader() {
	defer close(bfs.oidDownloaderToExiter)

	var err error
	if bfs.cfg.SkipIndexFilesSearch {
		err = bfs.fetchOIDsBySearch()
	} else {
		err = bfs.fetchOIDsFromIndexFiles()
	}
	var force bool
	if err != nil {
		if !isContextCanceledErr(err) {
			bfs.log.Error("NeoFS BlockFetcher service: OID downloading routine failed", zap.Error(err))
		}
		force = true
	}
	// Stop the service since there's nothing to do anymore.
	bfs.stopService(force)
}

// blockDownloader downloads blocks from NeoFS and hands them over to the
// enqueueBlock callback.
func (bfs *Service) blockDownloader() {
	defer bfs.wg.Done()

	for blkOid := range bfs.oidsCh {
		ctx, cancel := context.WithTimeout(bfs.ctx, bfs.cfg.Timeout)
		// Note: this defer fires when blockDownloader returns, not per
		// iteration, so cancellations accumulate until the routine exits.
		defer cancel()

		rc, err := bfs.objectGet(ctx, blkOid.String())
		if err != nil {
			if isContextCanceledErr(err) {
				return
			}
			bfs.log.Error("failed to objectGet block", zap.String("oid", blkOid.String()), zap.Error(err))
			bfs.stopService(true)
			return
		}

		b, err := bfs.readBlock(rc)
		if err != nil {
			if isContextCanceledErr(err) {
				return
			}
			bfs.log.Error("failed to decode block from stream", zap.String("oid", blkOid.String()), zap.Error(err))
			bfs.stopService(true)
			return
		}
		select {
		case <-bfs.ctx.Done():
			return
		default:
			err = bfs.enqueueBlock(b)
			if err != nil {
				bfs.log.Error("failed to enqueue block", zap.Uint32("index", b.Index), zap.Error(err))
				bfs.stopService(true)
				return
			}
		}
	}
}

// fetchOIDsFromIndexFiles fetches block OIDs from NeoFS by searching index files first.
func (bfs *Service) fetchOIDsFromIndexFiles() error {
	h := bfs.chain.BlockHeight()
	startIndex := h / bfs.cfg.IndexFileSize
	skip := h % bfs.cfg.IndexFileSize

	for {
		select {
		case <-bfs.exiterToOIDDownloader:
			return nil
		default:
			prm := client.PrmObjectSearch{}
			filters := object.NewSearchFilters()
			filters.AddFilter(bfs.cfg.IndexFileAttribute, fmt.Sprintf("%d", startIndex), object.MatchStringEqual)
			filters.AddFilter("IndexSize", fmt.Sprintf("%d", bfs.cfg.IndexFileSize), object.MatchStringEqual)
			prm.SetFilters(filters)

			ctx, cancel := context.WithTimeout(bfs.ctx, bfs.cfg.Timeout)
			blockOidsObject, err := bfs.objectSearch(ctx, prm)
			cancel()
			if err != nil {
				if isContextCanceledErr(err) {
					return nil
				}
				return fmt.Errorf("failed to find '%s' object with index %d: %w", bfs.cfg.IndexFileAttribute, startIndex, err)
			}
			if len(blockOidsObject) == 0 {
				bfs.log.Info(fmt.Sprintf("NeoFS BlockFetcher service: no '%s' object found with index %d, stopping", bfs.cfg.IndexFileAttribute, startIndex))
				return nil
			}

			blockCtx, blockCancel := context.WithTimeout(bfs.ctx, bfs.cfg.Timeout)
			defer blockCancel()
			oidsRC, err := bfs.objectGet(blockCtx, blockOidsObject[0].String())
			if err != nil {
				if isContextCanceledErr(err) {
					return nil
				}
				return fmt.Errorf("failed to fetch '%s' object with index %d: %w", bfs.cfg.IndexFileAttribute, startIndex, err)
			}

			err = bfs.streamBlockOIDs(oidsRC, int(skip))
			if err != nil {
				if isContextCanceledErr(err) {
					return nil
				}
				return fmt.Errorf("failed to stream block OIDs with index %d: %w", startIndex, err)
			}

			startIndex++
			skip = 0
		}
	}
}

// streamBlockOIDs reads block OIDs from the read closer and sends them to the OIDs channel.
func (bfs *Service) streamBlockOIDs(rc io.ReadCloser, skip int) error {
	defer rc.Close()
	oidBytes := make([]byte, oidSize)
	oidsProcessed := 0

	for {
		_, err := io.ReadFull(rc, oidBytes)
		if err == io.EOF {
			break
		}
		if err != nil {
			return fmt.Errorf("failed to read OID: %w", err)
		}

		if oidsProcessed < skip {
			oidsProcessed++
			continue
		}

		var oidBlock oid.ID
		if err := oidBlock.Decode(oidBytes); err != nil {
			return fmt.Errorf("failed to decode OID: %w", err)
		}

		select {
		case <-bfs.exiterToOIDDownloader:
			return nil
		case bfs.oidsCh <- oidBlock:
		}

		oidsProcessed++
	}
	if oidsProcessed != int(bfs.cfg.IndexFileSize) {
		return fmt.Errorf("block OIDs count mismatch: expected %d, processed %d", bfs.cfg.IndexFileSize, oidsProcessed)
	}
	return nil
}
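
// An inferred note on the index-file layout (derived from the code above, not
// from upstream documentation): an index file is a plain concatenation of
// 32-byte (oidSize) object IDs, IndexFileSize of them per object. For a chain
// at height h, the OID of block h therefore lives in index file h/IndexFileSize
// at entry h%IndexFileSize, which is exactly how fetchOIDsFromIndexFiles
// computes startIndex and skip.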

// fetchOIDsBySearch fetches block OIDs from NeoFS by searching through the Block objects.
func (bfs *Service) fetchOIDsBySearch() error {
	startIndex := bfs.chain.BlockHeight()
	// We need to search with an EQ filter to avoid partially-completed SEARCH responses.
	batchSize := uint32(1)

	for {
		select {
		case <-bfs.exiterToOIDDownloader:
			return nil
		default:
			prm := client.PrmObjectSearch{}
			filters := object.NewSearchFilters()
			if startIndex == startIndex+batchSize-1 {
				filters.AddFilter(bfs.cfg.BlockAttribute, fmt.Sprintf("%d", startIndex), object.MatchStringEqual)
			} else {
				filters.AddFilter(bfs.cfg.BlockAttribute, fmt.Sprintf("%d", startIndex), object.MatchNumGE)
				filters.AddFilter(bfs.cfg.BlockAttribute, fmt.Sprintf("%d", startIndex+batchSize-1), object.MatchNumLE)
			}
			prm.SetFilters(filters)
			ctx, cancel := context.WithTimeout(bfs.ctx, bfs.cfg.Timeout)
			blockOids, err := bfs.objectSearch(ctx, prm)
			cancel()
			if err != nil {
				if isContextCanceledErr(err) {
					return nil
				}
				return err
			}

			if len(blockOids) == 0 {
				bfs.log.Info(fmt.Sprintf("NeoFS BlockFetcher service: no block found with index %d, stopping", startIndex))
				return nil
			}
			for _, oid := range blockOids {
				select {
				case <-bfs.exiterToOIDDownloader:
					return nil
				case bfs.oidsCh <- oid:
				}
			}
			startIndex += batchSize
		}
	}
}
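
// An inferred note (not part of the upstream file): since batchSize is fixed
// at 1, the range check above always takes the MatchStringEqual branch; the
// MatchNumGE/MatchNumLE pair is only exercised if batchSize is ever raised to
// request several block indices per SEARCH.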

// readBlock decodes a block from the read closer and prepares it for adding to the blockchain.
func (bfs *Service) readBlock(rc io.ReadCloser) (*block.Block, error) {
	b := block.New(bfs.stateRootInHeader)
	r := gio.NewBinReaderFromIO(rc)
	b.DecodeBinary(r)
	rc.Close()
	return b, r.Err
}

// Shutdown stops the NeoFS BlockFetcher service. It prevents the service from
// searching for new block OIDs, cancels all in-progress downloading operations
// and waits until all service routines finish their work.
func (bfs *Service) Shutdown() {
	if !bfs.IsActive() {
		return
	}
	bfs.stopService(true)
	<-bfs.exiterToShutdown
}

// stopService signals the exiter routine exactly once. It's the only entry
// point to the shutdown procedure.
func (bfs *Service) stopService(force bool) {
	bfs.quitOnce.Do(func() {
		bfs.quit <- force
		close(bfs.quit)
	})
}

// exiter is a routine that listens for the quit signal and manages the
// graceful Service shutdown process.
func (bfs *Service) exiter() {
	// The closing signal may come from anyone, but only once.
	force := <-bfs.quit
	bfs.log.Info("shutting down NeoFS BlockFetcher service",
		zap.Bool("force", force),
	)

	bfs.isActive.CompareAndSwap(true, false)
	// Cancel all pending OID/block downloads if shutdown was requested by the
	// user or caused by a downloading error.
	if force {
		bfs.ctxCancel()
	}

	// Send the stop signal to the OID downloader and wait until it finishes
	// its work.
	close(bfs.exiterToOIDDownloader)
	<-bfs.oidDownloaderToExiter

	// Close the OIDs channel to let block downloaders know that no more OIDs
	// are expected, then wait until all downloaders finish their work.
	close(bfs.oidsCh)
	bfs.wg.Wait()

	// Everything is done: release resources and let the server know about it.
	_ = bfs.pool.Close()
	_ = bfs.log.Sync()
	bfs.shutdownCallback()

	// Notify the Shutdown routine in case it's a user-triggered shutdown.
	close(bfs.exiterToShutdown)
}

// IsActive returns true if the NeoFS BlockFetcher service is running.
func (bfs *Service) IsActive() bool {
	return bfs.isActive.Load()
}

// retry runs the given action with exponential backoff, returning the last
// error once maxRetries attempts have failed.
func (bfs *Service) retry(action func() error) error {
	var (
		err     error
		backoff = initialBackoff
		timer   = time.NewTimer(0)
	)
	// Stop the timer on exit and drain its channel if it has already fired,
	// so no stale value is left pending in timer.C.
	defer func() {
		if !timer.Stop() {
			select {
			case <-timer.C:
			default:
			}
		}
	}()

	for i := range maxRetries {
		if err = action(); err == nil {
			return nil
		}
		if i == maxRetries-1 {
			break
		}
		timer.Reset(backoff)

		select {
		case <-timer.C:
		case <-bfs.ctx.Done():
			return bfs.ctx.Err()
		}
		backoff *= time.Duration(backoffFactor)
		if backoff > maxBackoff {
			backoff = maxBackoff
		}
	}
	return err
}
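
// An illustrative use of retry (this simply mirrors objectGet below; the
// snippet is a sketch, not additional API):
//
//	var rc io.ReadCloser
//	err = bfs.retry(func() error {
//		rc, err = neofs.GetWithClient(ctx, bfs.pool, bfs.account.PrivateKey(), u, false)
//		return err
//	})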

// objectGet returns a reading stream for the object with the given OID,
// retrying the request on failure.
func (bfs *Service) objectGet(ctx context.Context, oid string) (io.ReadCloser, error) {
	u, err := url.Parse(fmt.Sprintf("neofs:%s/%s", bfs.cfg.ContainerID, oid))
	if err != nil {
		return nil, err
	}
	var rc io.ReadCloser
	err = bfs.retry(func() error {
		rc, err = neofs.GetWithClient(ctx, bfs.pool, bfs.account.PrivateKey(), u, false)
		return err
	})
	return rc, err
}

// objectSearch performs an object search in the configured container,
// retrying the request on failure.
func (bfs *Service) objectSearch(ctx context.Context, prm client.PrmObjectSearch) ([]oid.ID, error) {
	var (
		oids []oid.ID
		err  error
	)
	err = bfs.retry(func() error {
		oids, err = neofs.ObjectSearch(ctx, bfs.pool, bfs.account.PrivateKey(), bfs.cfg.ContainerID, prm)
		return err
	})
	return oids, err
}

// isContextCanceledErr returns whether the error is a wrapped [context.Canceled].
// Ref. https://github.com/nspcc-dev/neofs-sdk-go/issues/624.
func isContextCanceledErr(err error) bool {
	return errors.Is(err, context.Canceled) ||
		strings.Contains(err.Error(), "context canceled")
}