2014-09-23 20:39:12 +00:00
|
|
|
package khepri
|
|
|
|
|
|
|
|
import (
|
2014-11-17 22:28:51 +00:00
|
|
|
"io"
|
|
|
|
"io/ioutil"
|
2014-09-23 20:39:12 +00:00
|
|
|
"os"
|
|
|
|
"path/filepath"
|
2014-11-16 21:50:20 +00:00
|
|
|
"sync"
|
2014-09-23 20:39:12 +00:00
|
|
|
|
|
|
|
"github.com/fd0/khepri/backend"
|
2014-11-17 22:28:51 +00:00
|
|
|
"github.com/fd0/khepri/chunker"
|
2014-11-23 11:14:56 +00:00
|
|
|
"github.com/juju/arrar"
|
2014-09-23 20:39:12 +00:00
|
|
|
)
|
|
|
|
|
2014-11-16 21:50:20 +00:00
|
|
|
// Limits on the amount of work an Archiver performs concurrently.
const (
	// maxConcurrentFiles is the capacity of Archiver.fileToken, i.e. the
	// number of tokens available to goroutines saving files.
	maxConcurrentFiles = 32

	// maxConcurrentBlobs is the capacity of Archiver.blobToken, i.e. the
	// number of tokens available to goroutines saving chunks.
	maxConcurrentBlobs = 32
)
|
|
|
|
|
2014-09-23 20:39:12 +00:00
|
|
|
type Archiver struct {
|
2014-11-16 21:50:20 +00:00
|
|
|
be backend.Server
|
|
|
|
key *Key
|
|
|
|
ch *ContentHandler
|
|
|
|
|
2014-11-21 20:21:44 +00:00
|
|
|
bl *BlobList // blobs used for the current snapshot
|
2014-09-23 20:39:12 +00:00
|
|
|
|
2014-11-16 21:50:20 +00:00
|
|
|
fileToken chan struct{}
|
2014-11-22 21:05:39 +00:00
|
|
|
blobToken chan struct{}
|
2014-11-16 21:50:20 +00:00
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
Stats Stats
|
|
|
|
|
2014-09-23 20:39:12 +00:00
|
|
|
Error func(dir string, fi os.FileInfo, err error) error
|
|
|
|
Filter func(item string, fi os.FileInfo) bool
|
2014-11-16 20:29:11 +00:00
|
|
|
|
|
|
|
ScannerUpdate func(stats Stats)
|
|
|
|
SaveUpdate func(stats Stats)
|
2014-11-16 21:50:20 +00:00
|
|
|
|
|
|
|
sum sync.Mutex // for SaveUpdate
|
2014-11-16 20:29:11 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Stats holds counters for the items handled by an Archiver. While scanning,
// loadTree accumulates them in Archiver.Stats; while saving, small Stats
// values describing a single item are passed to Archiver.SaveUpdate.
type Stats struct {
	Files       int    // nodes of type "file"
	Directories int    // nodes of type "dir"
	Other       int    // nodes of any other type
	Bytes       uint64 // size in bytes (file sizes when scanning, blob sizes when saving)
}
|
|
|
|
|
|
|
|
func NewArchiver(be backend.Server, key *Key) (*Archiver, error) {
|
|
|
|
var err error
|
2014-11-16 21:50:20 +00:00
|
|
|
arch := &Archiver{
|
|
|
|
be: be,
|
|
|
|
key: key,
|
|
|
|
fileToken: make(chan struct{}, maxConcurrentFiles),
|
2014-11-22 21:05:39 +00:00
|
|
|
blobToken: make(chan struct{}, maxConcurrentBlobs),
|
2014-11-16 21:50:20 +00:00
|
|
|
}
|
|
|
|
|
2014-11-22 21:05:39 +00:00
|
|
|
// fill file and blob token
|
2014-11-16 21:50:20 +00:00
|
|
|
for i := 0; i < maxConcurrentFiles; i++ {
|
|
|
|
arch.fileToken <- struct{}{}
|
|
|
|
}
|
2014-09-23 20:39:12 +00:00
|
|
|
|
2014-11-22 21:05:39 +00:00
|
|
|
for i := 0; i < maxConcurrentBlobs; i++ {
|
|
|
|
arch.blobToken <- struct{}{}
|
|
|
|
}
|
|
|
|
|
2014-09-23 20:39:12 +00:00
|
|
|
// abort on all errors
|
|
|
|
arch.Error = func(string, os.FileInfo, error) error { return err }
|
|
|
|
// allow all files
|
|
|
|
arch.Filter = func(string, os.FileInfo) bool { return true }
|
2014-11-16 20:29:11 +00:00
|
|
|
// do nothing
|
|
|
|
arch.ScannerUpdate = func(Stats) {}
|
2014-09-23 20:39:12 +00:00
|
|
|
|
2014-11-21 20:21:44 +00:00
|
|
|
arch.bl = NewBlobList()
|
2014-09-23 20:39:12 +00:00
|
|
|
arch.ch, err = NewContentHandler(be, key)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// load all blobs from all snapshots
|
|
|
|
err = arch.ch.LoadAllSnapshots()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return arch, nil
|
|
|
|
}
|
|
|
|
|
2014-11-16 21:50:20 +00:00
|
|
|
func (arch *Archiver) saveUpdate(stats Stats) {
|
|
|
|
if arch.SaveUpdate != nil {
|
|
|
|
arch.sum.Lock()
|
|
|
|
defer arch.sum.Unlock()
|
|
|
|
arch.SaveUpdate(stats)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-11-21 20:21:44 +00:00
|
|
|
func (arch *Archiver) Save(t backend.Type, data []byte) (Blob, error) {
|
2014-09-23 20:39:12 +00:00
|
|
|
blob, err := arch.ch.Save(t, data)
|
|
|
|
if err != nil {
|
2014-11-21 20:21:44 +00:00
|
|
|
return Blob{}, err
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// store blob in storage map for current snapshot
|
2014-11-21 20:21:44 +00:00
|
|
|
arch.bl.Insert(blob)
|
2014-09-23 20:39:12 +00:00
|
|
|
|
|
|
|
return blob, nil
|
|
|
|
}
|
|
|
|
|
2014-11-21 20:21:44 +00:00
|
|
|
func (arch *Archiver) SaveJSON(t backend.Type, item interface{}) (Blob, error) {
|
2014-09-23 20:39:12 +00:00
|
|
|
blob, err := arch.ch.SaveJSON(t, item)
|
|
|
|
if err != nil {
|
2014-11-21 20:21:44 +00:00
|
|
|
return Blob{}, err
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// store blob in storage map for current snapshot
|
2014-11-21 20:21:44 +00:00
|
|
|
arch.bl.Insert(blob)
|
2014-09-23 20:39:12 +00:00
|
|
|
|
|
|
|
return blob, nil
|
|
|
|
}
|
|
|
|
|
2014-11-17 22:28:51 +00:00
|
|
|
// SaveFile stores the content of the file on the backend as a Blob by calling
|
|
|
|
// Save for each chunk.
|
2014-11-16 20:29:11 +00:00
|
|
|
func (arch *Archiver) SaveFile(node *Node) error {
|
2014-11-17 22:28:51 +00:00
|
|
|
file, err := os.Open(node.path)
|
|
|
|
defer file.Close()
|
2014-09-23 20:39:12 +00:00
|
|
|
if err != nil {
|
2014-11-23 11:14:56 +00:00
|
|
|
return arrar.Annotate(err, "SaveFile()")
|
2014-11-17 22:28:51 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
var blobs Blobs
|
|
|
|
|
|
|
|
// if the file is small enough, store it directly
|
|
|
|
if node.Size < chunker.MinSize {
|
|
|
|
buf, err := ioutil.ReadAll(file)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
blob, err := arch.ch.Save(backend.Data, buf)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
arch.saveUpdate(Stats{Bytes: blob.Size})
|
|
|
|
|
|
|
|
blobs = Blobs{blob}
|
|
|
|
} else {
|
|
|
|
// else store all chunks
|
2014-11-17 22:37:03 +00:00
|
|
|
chnker := chunker.New(file)
|
2014-11-22 21:05:39 +00:00
|
|
|
chans := [](<-chan Blob){}
|
2014-11-17 22:28:51 +00:00
|
|
|
|
|
|
|
for {
|
2014-11-17 22:37:03 +00:00
|
|
|
chunk, err := chnker.Next()
|
2014-11-17 22:28:51 +00:00
|
|
|
if err == io.EOF {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2014-11-22 21:05:39 +00:00
|
|
|
// acquire token, start goroutine to save chunk
|
|
|
|
token := <-arch.blobToken
|
|
|
|
resCh := make(chan Blob, 1)
|
|
|
|
|
|
|
|
go func(ch chan<- Blob) {
|
|
|
|
blob, err := arch.ch.Save(backend.Data, chunk.Data)
|
|
|
|
// TODO handle error
|
|
|
|
if err != nil {
|
|
|
|
panic(err)
|
|
|
|
}
|
2014-11-17 22:28:51 +00:00
|
|
|
|
2014-11-22 21:05:39 +00:00
|
|
|
arch.saveUpdate(Stats{Bytes: blob.Size})
|
|
|
|
arch.blobToken <- token
|
|
|
|
ch <- blob
|
|
|
|
}(resCh)
|
|
|
|
|
|
|
|
chans = append(chans, resCh)
|
|
|
|
}
|
2014-11-17 22:28:51 +00:00
|
|
|
|
2014-11-22 21:05:39 +00:00
|
|
|
blobs = []Blob{}
|
|
|
|
for _, ch := range chans {
|
|
|
|
blobs = append(blobs, <-ch)
|
2014-11-17 22:28:51 +00:00
|
|
|
}
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
node.Content = make([]backend.ID, len(blobs))
|
|
|
|
for i, blob := range blobs {
|
|
|
|
node.Content[i] = blob.ID
|
2014-11-21 20:21:44 +00:00
|
|
|
arch.bl.Insert(blob)
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
return err
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
func (arch *Archiver) loadTree(dir string) (*Tree, error) {
|
|
|
|
// open and list path
|
2014-09-23 20:39:12 +00:00
|
|
|
fd, err := os.Open(dir)
|
|
|
|
defer fd.Close()
|
|
|
|
if err != nil {
|
2014-11-23 11:14:56 +00:00
|
|
|
return nil, arch.Error(dir, nil, err)
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
entries, err := fd.Readdir(-1)
|
|
|
|
if err != nil {
|
2014-11-16 20:29:11 +00:00
|
|
|
return nil, err
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
tree := Tree{}
|
|
|
|
|
|
|
|
for _, entry := range entries {
|
|
|
|
path := filepath.Join(dir, entry.Name())
|
|
|
|
|
|
|
|
if !arch.Filter(path, entry) {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
node, err := NodeFromFileInfo(path, entry)
|
|
|
|
if err != nil {
|
2014-11-16 20:29:11 +00:00
|
|
|
// TODO: error processing
|
|
|
|
return nil, err
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
tree = append(tree, node)
|
|
|
|
|
|
|
|
if entry.IsDir() {
|
2014-11-16 20:29:11 +00:00
|
|
|
node.Tree, err = arch.loadTree(path)
|
2014-09-23 20:39:12 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
switch node.Type {
|
|
|
|
case "file":
|
|
|
|
arch.Stats.Files++
|
|
|
|
arch.Stats.Bytes += node.Size
|
|
|
|
case "dir":
|
|
|
|
arch.Stats.Directories++
|
|
|
|
default:
|
|
|
|
arch.Stats.Other++
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
arch.ScannerUpdate(arch.Stats)
|
|
|
|
|
|
|
|
return &tree, nil
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
func (arch *Archiver) LoadTree(path string) (*Tree, error) {
|
|
|
|
fi, err := os.Lstat(path)
|
|
|
|
if err != nil {
|
2014-11-23 11:14:56 +00:00
|
|
|
return nil, arrar.Annotatef(err, "Lstat(%q)", path)
|
2014-11-16 20:29:11 +00:00
|
|
|
}
|
2014-09-23 20:39:12 +00:00
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
node, err := NodeFromFileInfo(path, fi)
|
2014-09-23 20:39:12 +00:00
|
|
|
if err != nil {
|
2014-11-23 11:14:56 +00:00
|
|
|
return nil, arrar.Annotate(err, "NodeFromFileInfo()")
|
2014-11-16 20:29:11 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if node.Type != "dir" {
|
|
|
|
arch.Stats.Files = 1
|
|
|
|
arch.Stats.Bytes = node.Size
|
|
|
|
arch.ScannerUpdate(arch.Stats)
|
|
|
|
return &Tree{node}, nil
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
arch.Stats.Directories = 1
|
|
|
|
node.Tree, err = arch.loadTree(path)
|
2014-09-23 20:39:12 +00:00
|
|
|
if err != nil {
|
2014-11-23 11:14:56 +00:00
|
|
|
return nil, arrar.Annotate(err, "loadTree()")
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
arch.ScannerUpdate(arch.Stats)
|
2014-09-23 20:39:12 +00:00
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
return &Tree{node}, nil
|
|
|
|
}
|
2014-09-23 20:39:12 +00:00
|
|
|
|
2014-11-21 20:21:44 +00:00
|
|
|
func (arch *Archiver) saveTree(t *Tree) (Blob, error) {
|
2014-11-16 21:50:20 +00:00
|
|
|
var wg sync.WaitGroup
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
for _, node := range *t {
|
|
|
|
if node.Tree != nil && node.Subtree == nil {
|
|
|
|
b, err := arch.saveTree(node.Tree)
|
|
|
|
if err != nil {
|
2014-11-21 20:21:44 +00:00
|
|
|
return Blob{}, err
|
2014-11-16 20:29:11 +00:00
|
|
|
}
|
|
|
|
node.Subtree = b.ID
|
2014-11-16 21:50:20 +00:00
|
|
|
arch.saveUpdate(Stats{Directories: 1})
|
2014-11-16 20:29:11 +00:00
|
|
|
} else if node.Type == "file" && len(node.Content) == 0 {
|
2014-11-16 21:50:20 +00:00
|
|
|
// start goroutine
|
|
|
|
wg.Add(1)
|
|
|
|
go func(n *Node) {
|
|
|
|
defer wg.Done()
|
2014-11-16 20:29:11 +00:00
|
|
|
|
2014-11-16 21:50:20 +00:00
|
|
|
// get token
|
|
|
|
token := <-arch.fileToken
|
|
|
|
defer func() {
|
|
|
|
arch.fileToken <- token
|
|
|
|
}()
|
|
|
|
|
|
|
|
// TODO: handle error
|
|
|
|
arch.SaveFile(n)
|
2014-11-17 22:28:51 +00:00
|
|
|
arch.saveUpdate(Stats{Files: 1})
|
2014-11-16 21:50:20 +00:00
|
|
|
}(node)
|
2014-11-16 20:29:11 +00:00
|
|
|
} else {
|
2014-11-16 21:50:20 +00:00
|
|
|
arch.saveUpdate(Stats{Other: 1})
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-11-16 21:50:20 +00:00
|
|
|
wg.Wait()
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
blob, err := arch.SaveJSON(backend.Tree, t)
|
|
|
|
if err != nil {
|
2014-11-21 20:21:44 +00:00
|
|
|
return Blob{}, err
|
2014-11-16 20:29:11 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return blob, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (arch *Archiver) Snapshot(dir string, t *Tree) (*Snapshot, backend.ID, error) {
|
|
|
|
sn := NewSnapshot(dir)
|
|
|
|
|
|
|
|
blob, err := arch.saveTree(t)
|
2014-09-23 20:39:12 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
sn.Content = blob.ID
|
|
|
|
|
|
|
|
// save snapshot
|
2014-11-21 20:21:44 +00:00
|
|
|
sn.BlobList = arch.bl
|
2014-09-23 20:39:12 +00:00
|
|
|
blob, err = arch.SaveJSON(backend.Snapshot, sn)
|
|
|
|
if err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
|
2014-11-16 20:29:11 +00:00
|
|
|
return sn, blob.Storage, nil
|
2014-09-23 20:39:12 +00:00
|
|
|
}
|