package writecache import ( "errors" "fmt" "os" "git.frostfs.info/TrueCloudLab/frostfs-node/internal/logs" "git.frostfs.info/TrueCloudLab/frostfs-node/pkg/local_object_storage/blobstor/common" "git.frostfs.info/TrueCloudLab/frostfs-node/pkg/local_object_storage/blobstor/fstree" storagelog "git.frostfs.info/TrueCloudLab/frostfs-node/pkg/local_object_storage/internal/log" "git.frostfs.info/TrueCloudLab/frostfs-node/pkg/util" apistatus "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/client/status" oid "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/object/id" lru "github.com/hashicorp/golang-lru/v2" "github.com/hashicorp/golang-lru/v2/simplelru" "go.etcd.io/bbolt" "go.uber.org/zap" ) // store represents persistent storage with in-memory LRU cache // for flushed items on top of it. type store struct { maxFlushedMarksCount int maxRemoveBatchSize int // flushed contains addresses of objects that were already flushed to the main storage. // We use LRU cache instead of map here to facilitate removing of unused object in favour of // frequently read ones. // MUST NOT be used inside bolt db transaction because it's eviction handler // removes untracked items from the database. flushed simplelru.LRUCache[string, bool] db *bbolt.DB dbKeysToRemove []string fsKeysToRemove []string } const dbName = "small.bolt" func (c *cache) openStore(readOnly bool) error { err := util.MkdirAllX(c.path, os.ModePerm) if err != nil { return err } c.db, err = OpenDB(c.path, readOnly, c.openFile) if err != nil { return fmt.Errorf("could not open database: %w", err) } c.db.MaxBatchSize = c.maxBatchSize c.db.MaxBatchDelay = c.maxBatchDelay if !readOnly { err = c.db.Update(func(tx *bbolt.Tx) error { _, err := tx.CreateBucketIfNotExists(defaultBucket) return err }) if err != nil { return fmt.Errorf("could not create default bucket: %w", err) } } c.fsTree = fstree.New( fstree.WithPath(c.path), fstree.WithPerm(os.ModePerm), fstree.WithDepth(1), fstree.WithDirNameLen(1), fstree.WithNoSync(c.noSync)) if err := c.fsTree.Open(readOnly); err != nil { return fmt.Errorf("could not open FSTree: %w", err) } // Write-cache can be opened multiple times during `SetMode`. // flushed map must not be re-created in this case. if c.flushed == nil { c.flushed, _ = lru.NewWithEvict[string, bool](c.maxFlushedMarksCount, c.removeFlushed) } c.initialized.Store(false) return nil } // removeFlushed removes an object from the writecache. // To minimize interference with the client operations, the actual removal // is done in batches. // It is not thread-safe and is used only as an evict callback to LRU cache. func (c *cache) removeFlushed(key string, value bool) { fromDatabase := value if fromDatabase { c.dbKeysToRemove = append(c.dbKeysToRemove, key) } else { c.fsKeysToRemove = append(c.fsKeysToRemove, key) } if len(c.dbKeysToRemove)+len(c.fsKeysToRemove) >= c.maxRemoveBatchSize { c.dbKeysToRemove = c.deleteFromDB(c.dbKeysToRemove) c.fsKeysToRemove = c.deleteFromDisk(c.fsKeysToRemove) } } func (c *cache) deleteFromDB(keys []string) []string { if len(keys) == 0 { return keys } var errorIndex int err := c.db.Batch(func(tx *bbolt.Tx) error { b := tx.Bucket(defaultBucket) for errorIndex = range keys { if err := b.Delete([]byte(keys[errorIndex])); err != nil { return err } } return nil }) for i := 0; i < errorIndex; i++ { c.objCounters.DecDB() storagelog.Write(c.log, storagelog.AddressField(keys[i]), storagelog.StorageTypeField(wcStorageType), storagelog.OpField("db DELETE"), ) } if err != nil { c.log.Error(logs.WritecacheCantRemoveObjectsFromTheDatabase, zap.Error(err)) } copy(keys, keys[errorIndex:]) return keys[:len(keys)-errorIndex] } func (c *cache) deleteFromDisk(keys []string) []string { if len(keys) == 0 { return keys } var copyIndex int var addr oid.Address for i := range keys { if err := addr.DecodeString(keys[i]); err != nil { c.log.Error(logs.WritecacheCantParseAddress, zap.String("address", keys[i])) continue } _, err := c.fsTree.Delete(common.DeletePrm{Address: addr}) if err != nil && !errors.As(err, new(apistatus.ObjectNotFound)) { c.log.Error(logs.WritecacheCantRemoveObjectFromWritecache, zap.Error(err)) // Save the key for the next iteration. keys[copyIndex] = keys[i] copyIndex++ continue } else if err == nil { storagelog.Write(c.log, storagelog.AddressField(keys[i]), storagelog.StorageTypeField(wcStorageType), storagelog.OpField("fstree DELETE"), ) c.objCounters.DecFS() } } return keys[:copyIndex] }