Evgenii Stratonikov
0e31c12e63
Drop duplicate entities. Format entities. Signed-off-by: Dmitrii Stepanov <d.stepanov@yadro.com> Signed-off-by: Evgenii Stratonikov <e.stratonikov@yadro.com>
168 lines
4.6 KiB
Go
168 lines
4.6 KiB
Go
package writecache
|
|
|
|
import (
|
|
"errors"
|
|
"fmt"
|
|
"os"
|
|
|
|
"git.frostfs.info/TrueCloudLab/frostfs-node/internal/logs"
|
|
"git.frostfs.info/TrueCloudLab/frostfs-node/pkg/local_object_storage/blobstor/common"
|
|
"git.frostfs.info/TrueCloudLab/frostfs-node/pkg/local_object_storage/blobstor/fstree"
|
|
storagelog "git.frostfs.info/TrueCloudLab/frostfs-node/pkg/local_object_storage/internal/log"
|
|
"git.frostfs.info/TrueCloudLab/frostfs-node/pkg/util"
|
|
apistatus "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/client/status"
|
|
oid "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/object/id"
|
|
lru "github.com/hashicorp/golang-lru/v2"
|
|
"github.com/hashicorp/golang-lru/v2/simplelru"
|
|
"go.etcd.io/bbolt"
|
|
"go.uber.org/zap"
|
|
)
|
|
|
|
// store represents persistent storage with in-memory LRU cache
|
|
// for flushed items on top of it.
|
|
type store struct {
|
|
maxFlushedMarksCount int
|
|
maxRemoveBatchSize int
|
|
|
|
// flushed contains addresses of objects that were already flushed to the main storage.
|
|
// We use LRU cache instead of map here to facilitate removing of unused object in favour of
|
|
// frequently read ones.
|
|
// MUST NOT be used inside bolt db transaction because it's eviction handler
|
|
// removes untracked items from the database.
|
|
flushed simplelru.LRUCache[string, bool]
|
|
db *bbolt.DB
|
|
|
|
dbKeysToRemove []string
|
|
fsKeysToRemove []string
|
|
}
|
|
|
|
// dbName is the file name of the bolt database.
// NOTE(review): presumably joined with the write-cache path when the
// database is opened; the usage is not visible here, confirm in OpenDB.
const dbName = "small.bolt"
|
|
|
|
func (c *cache) openStore(readOnly bool) error {
|
|
err := util.MkdirAllX(c.path, os.ModePerm)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
c.db, err = OpenDB(c.path, readOnly, c.openFile)
|
|
if err != nil {
|
|
return fmt.Errorf("could not open database: %w", err)
|
|
}
|
|
|
|
c.db.MaxBatchSize = c.maxBatchSize
|
|
c.db.MaxBatchDelay = c.maxBatchDelay
|
|
|
|
if !readOnly {
|
|
err = c.db.Update(func(tx *bbolt.Tx) error {
|
|
_, err := tx.CreateBucketIfNotExists(defaultBucket)
|
|
return err
|
|
})
|
|
if err != nil {
|
|
return fmt.Errorf("could not create default bucket: %w", err)
|
|
}
|
|
}
|
|
|
|
c.fsTree = fstree.New(
|
|
fstree.WithPath(c.path),
|
|
fstree.WithPerm(os.ModePerm),
|
|
fstree.WithDepth(1),
|
|
fstree.WithDirNameLen(1),
|
|
fstree.WithNoSync(c.noSync))
|
|
if err := c.fsTree.Open(readOnly); err != nil {
|
|
return fmt.Errorf("could not open FSTree: %w", err)
|
|
}
|
|
|
|
// Write-cache can be opened multiple times during `SetMode`.
|
|
// flushed map must not be re-created in this case.
|
|
if c.flushed == nil {
|
|
c.flushed, _ = lru.NewWithEvict[string, bool](c.maxFlushedMarksCount, c.removeFlushed)
|
|
}
|
|
|
|
c.initialized.Store(false)
|
|
|
|
return nil
|
|
}
|
|
|
|
// removeFlushed removes an object from the writecache.
|
|
// To minimize interference with the client operations, the actual removal
|
|
// is done in batches.
|
|
// It is not thread-safe and is used only as an evict callback to LRU cache.
|
|
func (c *cache) removeFlushed(key string, value bool) {
|
|
fromDatabase := value
|
|
if fromDatabase {
|
|
c.dbKeysToRemove = append(c.dbKeysToRemove, key)
|
|
} else {
|
|
c.fsKeysToRemove = append(c.fsKeysToRemove, key)
|
|
}
|
|
|
|
if len(c.dbKeysToRemove)+len(c.fsKeysToRemove) >= c.maxRemoveBatchSize {
|
|
c.dbKeysToRemove = c.deleteFromDB(c.dbKeysToRemove)
|
|
c.fsKeysToRemove = c.deleteFromDisk(c.fsKeysToRemove)
|
|
}
|
|
}
|
|
|
|
func (c *cache) deleteFromDB(keys []string) []string {
|
|
if len(keys) == 0 {
|
|
return keys
|
|
}
|
|
|
|
var errorIndex int
|
|
err := c.db.Batch(func(tx *bbolt.Tx) error {
|
|
b := tx.Bucket(defaultBucket)
|
|
for errorIndex = range keys {
|
|
if err := b.Delete([]byte(keys[errorIndex])); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
return nil
|
|
})
|
|
for i := 0; i < errorIndex; i++ {
|
|
c.objCounters.DecDB()
|
|
storagelog.Write(c.log,
|
|
storagelog.AddressField(keys[i]),
|
|
storagelog.StorageTypeField(wcStorageType),
|
|
storagelog.OpField("db DELETE"),
|
|
)
|
|
}
|
|
if err != nil {
|
|
c.log.Error(logs.WritecacheCantRemoveObjectsFromTheDatabase, zap.Error(err))
|
|
}
|
|
|
|
copy(keys, keys[errorIndex:])
|
|
return keys[:len(keys)-errorIndex]
|
|
}
|
|
|
|
func (c *cache) deleteFromDisk(keys []string) []string {
|
|
if len(keys) == 0 {
|
|
return keys
|
|
}
|
|
|
|
var copyIndex int
|
|
var addr oid.Address
|
|
|
|
for i := range keys {
|
|
if err := addr.DecodeString(keys[i]); err != nil {
|
|
c.log.Error(logs.WritecacheCantParseAddress, zap.String("address", keys[i]))
|
|
continue
|
|
}
|
|
|
|
_, err := c.fsTree.Delete(common.DeletePrm{Address: addr})
|
|
if err != nil && !errors.As(err, new(apistatus.ObjectNotFound)) {
|
|
c.log.Error(logs.WritecacheCantRemoveObjectFromWritecache, zap.Error(err))
|
|
|
|
// Save the key for the next iteration.
|
|
keys[copyIndex] = keys[i]
|
|
copyIndex++
|
|
continue
|
|
} else if err == nil {
|
|
storagelog.Write(c.log,
|
|
storagelog.AddressField(keys[i]),
|
|
storagelog.StorageTypeField(wcStorageType),
|
|
storagelog.OpField("fstree DELETE"),
|
|
)
|
|
c.objCounters.DecFS()
|
|
}
|
|
}
|
|
|
|
return keys[:copyIndex]
|
|
}
|