forked from TrueCloudLab/frostfs-node
383 lines
8.7 KiB
Go
383 lines
8.7 KiB
Go
package cache
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"fmt"
|
|
"sync"
|
|
"time"
|
|
|
|
clientcore "git.frostfs.info/TrueCloudLab/frostfs-node/pkg/core/client"
|
|
"git.frostfs.info/TrueCloudLab/frostfs-node/pkg/network"
|
|
metrics "git.frostfs.info/TrueCloudLab/frostfs-observability/metrics/grpc"
|
|
tracing "git.frostfs.info/TrueCloudLab/frostfs-observability/tracing/grpc"
|
|
rawclient "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/api/rpc/client"
|
|
"git.frostfs.info/TrueCloudLab/frostfs-sdk-go/client"
|
|
objectSDK "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/object"
|
|
"google.golang.org/grpc"
|
|
"google.golang.org/grpc/codes"
|
|
"google.golang.org/grpc/status"
|
|
)
|
|
|
|
type singleClient struct {
|
|
sync.RWMutex
|
|
client clientcore.Client
|
|
lastAttempt time.Time
|
|
}
|
|
|
|
type multiClient struct {
|
|
mtx sync.RWMutex
|
|
|
|
clients map[string]*singleClient
|
|
|
|
// addrMtx protects addr field. Should not be taken before the mtx.
|
|
addrMtx sync.RWMutex
|
|
addr network.AddressGroup
|
|
|
|
opts ClientCacheOpts
|
|
}
|
|
|
|
// defaultReconnectInterval is the reconnect timeout applied by newMultiClient
// when the provided options do not specify a positive one.
const defaultReconnectInterval = 30 * time.Second
|
|
|
|
func newMultiClient(addr network.AddressGroup, opts ClientCacheOpts) *multiClient {
|
|
if opts.ReconnectTimeout <= 0 {
|
|
opts.ReconnectTimeout = defaultReconnectInterval
|
|
}
|
|
return &multiClient{
|
|
clients: make(map[string]*singleClient),
|
|
addr: addr,
|
|
opts: opts,
|
|
}
|
|
}
|
|
|
|
func (x *multiClient) createForAddress(ctx context.Context, addr network.Address) (clientcore.Client, error) {
|
|
var c client.Client
|
|
|
|
prmInit := client.PrmInit{
|
|
DisableFrostFSErrorResolution: true,
|
|
}
|
|
if x.opts.Key != nil {
|
|
prmInit.Key = *x.opts.Key
|
|
}
|
|
|
|
grpcOpts := []grpc.DialOption{
|
|
grpc.WithChainUnaryInterceptor(
|
|
metrics.NewUnaryClientInterceptor(),
|
|
tracing.NewUnaryClientInteceptor(),
|
|
),
|
|
grpc.WithChainStreamInterceptor(
|
|
metrics.NewStreamClientInterceptor(),
|
|
tracing.NewStreamClientInterceptor(),
|
|
),
|
|
grpc.WithContextDialer(x.opts.DialerSource.GrpcContextDialer()),
|
|
grpc.WithDefaultCallOptions(grpc.WaitForReady(true)),
|
|
}
|
|
|
|
prmDial := client.PrmDial{
|
|
Endpoint: addr.URIAddr(),
|
|
GRPCDialOptions: grpcOpts,
|
|
}
|
|
if x.opts.DialTimeout > 0 {
|
|
prmDial.DialTimeout = x.opts.DialTimeout
|
|
}
|
|
|
|
if x.opts.StreamTimeout > 0 {
|
|
prmDial.StreamTimeout = x.opts.StreamTimeout
|
|
}
|
|
|
|
if x.opts.ResponseCallback != nil {
|
|
prmInit.ResponseInfoCallback = x.opts.ResponseCallback
|
|
}
|
|
|
|
c.Init(prmInit)
|
|
err := c.Dial(ctx, prmDial)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("can't init SDK client: %w", err)
|
|
}
|
|
|
|
return &c, nil
|
|
}
|
|
|
|
// updateGroup replaces current multiClient addresses with a new group.
|
|
// Old addresses not present in group are removed.
|
|
func (x *multiClient) updateGroup(group network.AddressGroup) {
|
|
// Firstly, remove old clients.
|
|
cache := make([]string, 0, group.Len())
|
|
group.IterateAddresses(func(a network.Address) bool {
|
|
cache = append(cache, a.String())
|
|
return false
|
|
})
|
|
|
|
x.addrMtx.RLock()
|
|
oldGroup := x.addr
|
|
x.addrMtx.RUnlock()
|
|
if len(oldGroup) == len(cache) {
|
|
needUpdate := false
|
|
for i := range oldGroup {
|
|
if cache[i] != oldGroup[i].String() {
|
|
needUpdate = true
|
|
break
|
|
}
|
|
}
|
|
if !needUpdate {
|
|
return
|
|
}
|
|
}
|
|
|
|
x.mtx.Lock()
|
|
defer x.mtx.Unlock()
|
|
loop:
|
|
for a := range x.clients {
|
|
for i := range cache {
|
|
if cache[i] == a {
|
|
continue loop
|
|
}
|
|
}
|
|
x.clients[a].invalidate()
|
|
delete(x.clients, a)
|
|
}
|
|
|
|
// Then add new clients.
|
|
x.addrMtx.Lock()
|
|
x.addr = group
|
|
x.addrMtx.Unlock()
|
|
}
|
|
|
|
// errRecentlyFailed is returned by client when the last dial to an address
// failed less than the reconnect timeout ago, so no new attempt is made.
var errRecentlyFailed = errors.New("client has recently failed, skipping")
|
|
|
|
func (x *multiClient) iterateClients(ctx context.Context, f func(clientcore.Client) error) error {
|
|
var firstErr error
|
|
|
|
x.addrMtx.RLock()
|
|
group := x.addr
|
|
x.addrMtx.RUnlock()
|
|
|
|
group.IterateAddresses(func(addr network.Address) bool {
|
|
select {
|
|
case <-ctx.Done():
|
|
firstErr = fmt.Errorf("try %v: %w", addr, context.Canceled)
|
|
return true
|
|
default:
|
|
}
|
|
|
|
var err error
|
|
|
|
c, err := x.client(ctx, addr)
|
|
if err == nil {
|
|
err = f(c)
|
|
}
|
|
|
|
// non-status logic error that could be returned
|
|
// from the SDK client; should not be considered
|
|
// as a connection error
|
|
var siErr *objectSDK.SplitInfoError
|
|
var eiErr *objectSDK.ECInfoError
|
|
|
|
if err != nil {
|
|
err = fmt.Errorf("client connection error at %v: %w", addr, err)
|
|
x.ReportError(err)
|
|
}
|
|
|
|
success := err == nil || errors.Is(err, context.Canceled) || errors.As(err, &siErr) || errors.As(err, &eiErr)
|
|
if success || firstErr == nil || errors.Is(firstErr, errRecentlyFailed) {
|
|
firstErr = err
|
|
}
|
|
|
|
return success
|
|
})
|
|
|
|
return firstErr
|
|
}
|
|
|
|
func (x *multiClient) ReportError(err error) {
|
|
if errors.Is(err, errRecentlyFailed) {
|
|
return
|
|
}
|
|
|
|
if status.Code(err) == codes.Canceled || errors.Is(err, context.Canceled) {
|
|
return
|
|
}
|
|
|
|
// non-status logic error that could be returned
|
|
// from the SDK client; should not be considered
|
|
// as a connection error
|
|
var siErr *objectSDK.SplitInfoError
|
|
var eiErr *objectSDK.ECInfoError
|
|
if errors.As(err, &siErr) || errors.As(err, &eiErr) {
|
|
return
|
|
}
|
|
|
|
// Dropping all clients here is not necessary, we do this
|
|
// because `multiClient` doesn't yet provide convenient interface
|
|
// for reporting individual errors for streaming operations.
|
|
x.mtx.RLock()
|
|
for _, sc := range x.clients {
|
|
sc.invalidate()
|
|
}
|
|
x.mtx.RUnlock()
|
|
}
|
|
|
|
func (s *singleClient) invalidate() {
|
|
s.Lock()
|
|
if s.client != nil {
|
|
_ = s.client.Close()
|
|
}
|
|
s.client = nil
|
|
s.Unlock()
|
|
}
|
|
|
|
func (x *multiClient) ObjectPutInit(ctx context.Context, p client.PrmObjectPutInit) (res client.ObjectWriter, err error) {
|
|
err = x.iterateClients(ctx, func(c clientcore.Client) error {
|
|
res, err = c.ObjectPutInit(ctx, p)
|
|
return err
|
|
})
|
|
|
|
return
|
|
}
|
|
|
|
func (x *multiClient) ObjectPutSingle(ctx context.Context, p client.PrmObjectPutSingle) (res *client.ResObjectPutSingle, err error) {
|
|
err = x.iterateClients(ctx, func(c clientcore.Client) error {
|
|
res, err = c.ObjectPutSingle(ctx, p)
|
|
return err
|
|
})
|
|
|
|
return
|
|
}
|
|
|
|
func (x *multiClient) ObjectDelete(ctx context.Context, p client.PrmObjectDelete) (res *client.ResObjectDelete, err error) {
|
|
err = x.iterateClients(ctx, func(c clientcore.Client) error {
|
|
res, err = c.ObjectDelete(ctx, p)
|
|
return err
|
|
})
|
|
|
|
return
|
|
}
|
|
|
|
func (x *multiClient) ObjectGetInit(ctx context.Context, p client.PrmObjectGet) (res *client.ObjectReader, err error) {
|
|
err = x.iterateClients(ctx, func(c clientcore.Client) error {
|
|
res, err = c.ObjectGetInit(ctx, p)
|
|
return err
|
|
})
|
|
|
|
return
|
|
}
|
|
|
|
func (x *multiClient) ObjectRangeInit(ctx context.Context, p client.PrmObjectRange) (res *client.ObjectRangeReader, err error) {
|
|
err = x.iterateClients(ctx, func(c clientcore.Client) error {
|
|
res, err = c.ObjectRangeInit(ctx, p)
|
|
return err
|
|
})
|
|
|
|
return
|
|
}
|
|
|
|
func (x *multiClient) ObjectHead(ctx context.Context, p client.PrmObjectHead) (res *client.ResObjectHead, err error) {
|
|
err = x.iterateClients(ctx, func(c clientcore.Client) error {
|
|
res, err = c.ObjectHead(ctx, p)
|
|
return err
|
|
})
|
|
|
|
return
|
|
}
|
|
|
|
func (x *multiClient) ObjectHash(ctx context.Context, p client.PrmObjectHash) (res *client.ResObjectHash, err error) {
|
|
err = x.iterateClients(ctx, func(c clientcore.Client) error {
|
|
res, err = c.ObjectHash(ctx, p)
|
|
return err
|
|
})
|
|
|
|
return
|
|
}
|
|
|
|
func (x *multiClient) ObjectSearchInit(ctx context.Context, p client.PrmObjectSearch) (res *client.ObjectListReader, err error) {
|
|
err = x.iterateClients(ctx, func(c clientcore.Client) error {
|
|
res, err = c.ObjectSearchInit(ctx, p)
|
|
return err
|
|
})
|
|
|
|
return
|
|
}
|
|
|
|
func (x *multiClient) ExecRaw(func(client *rawclient.Client) error) error {
|
|
panic("multiClient.ExecRaw() must not be called")
|
|
}
|
|
|
|
func (x *multiClient) Close() error {
|
|
x.mtx.RLock()
|
|
|
|
{
|
|
for _, c := range x.clients {
|
|
if c.client != nil {
|
|
_ = c.client.Close()
|
|
}
|
|
}
|
|
}
|
|
|
|
x.mtx.RUnlock()
|
|
|
|
return nil
|
|
}
|
|
|
|
func (x *multiClient) RawForAddress(ctx context.Context, addr network.Address, f func(client *rawclient.Client) error) error {
|
|
c, err := x.client(ctx, addr)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
err = c.ExecRaw(f)
|
|
if err != nil {
|
|
x.ReportError(err)
|
|
}
|
|
return err
|
|
}
|
|
|
|
func (x *multiClient) client(ctx context.Context, addr network.Address) (clientcore.Client, error) {
|
|
strAddr := addr.String()
|
|
|
|
x.mtx.RLock()
|
|
c, cached := x.clients[strAddr]
|
|
x.mtx.RUnlock()
|
|
|
|
if cached {
|
|
c.RLock()
|
|
if c.client != nil {
|
|
cl := c.client
|
|
c.RUnlock()
|
|
return cl, nil
|
|
}
|
|
if x.opts.ReconnectTimeout != 0 && time.Since(c.lastAttempt) < x.opts.ReconnectTimeout {
|
|
c.RUnlock()
|
|
return nil, errRecentlyFailed
|
|
}
|
|
c.RUnlock()
|
|
} else {
|
|
var ok bool
|
|
x.mtx.Lock()
|
|
c, ok = x.clients[strAddr]
|
|
if !ok {
|
|
c = new(singleClient)
|
|
x.clients[strAddr] = c
|
|
}
|
|
x.mtx.Unlock()
|
|
}
|
|
|
|
c.Lock()
|
|
defer c.Unlock()
|
|
|
|
if c.client != nil {
|
|
return c.client, nil
|
|
}
|
|
|
|
if x.opts.ReconnectTimeout != 0 && time.Since(c.lastAttempt) < x.opts.ReconnectTimeout {
|
|
return nil, errRecentlyFailed
|
|
}
|
|
|
|
cl, err := x.createForAddress(ctx, addr)
|
|
if err != nil {
|
|
c.lastAttempt = time.Now()
|
|
return nil, err
|
|
}
|
|
|
|
c.client = cl
|
|
return cl, nil
|
|
}
|