forked from TrueCloudLab/rclone
3fcff32524
...unless had some errors or stats interval requested. Add fs.ErrorLog to differentiate between Logs which should be suppressed and errors which shouldn't.
564 lines
15 KiB
Go
564 lines
15 KiB
Go
// S3 interface
|
|
package s3
|
|
|
|
// FIXME need to prevent anything but ListDir working for s3://
|
|
|
|
import (
|
|
"errors"
|
|
"fmt"
|
|
"io"
|
|
"net/http"
|
|
"path"
|
|
"regexp"
|
|
"strconv"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/ncw/goamz/aws"
|
|
"github.com/ncw/goamz/s3"
|
|
"github.com/ncw/rclone/fs"
|
|
"github.com/ncw/swift"
|
|
)
|
|
|
|
// Register with Fs
|
|
func init() {
|
|
fs.Register(&fs.FsInfo{
|
|
Name: "s3",
|
|
NewFs: NewFs,
|
|
// AWS endpoints: http://docs.amazonwebservices.com/general/latest/gr/rande.html#s3_region
|
|
Options: []fs.Option{{
|
|
Name: "access_key_id",
|
|
Help: "AWS Access Key ID.",
|
|
}, {
|
|
Name: "secret_access_key",
|
|
Help: "AWS Secret Access Key (password). ",
|
|
}, {
|
|
Name: "endpoint",
|
|
Help: "Endpoint for S3 API.",
|
|
Examples: []fs.OptionExample{{
|
|
Value: "https://s3.amazonaws.com/",
|
|
Help: "The default endpoint - a good choice if you are unsure.\nUS Region, Northern Virginia or Pacific Northwest.\nLeave location constraint empty.",
|
|
}, {
|
|
Value: "https://s3-external-1.amazonaws.com",
|
|
Help: "US Region, Northern Virginia only.\nLeave location constraint empty.",
|
|
}, {
|
|
Value: "https://s3-us-west-2.amazonaws.com",
|
|
Help: "US West (Oregon) Region\nNeeds location constraint us-west-2.",
|
|
}, {
|
|
Value: "https://s3-us-west-1.amazonaws.com",
|
|
Help: "US West (Northern California) Region\nNeeds location constraint us-west-1.",
|
|
}, {
|
|
Value: "https://s3-eu-west-1.amazonaws.com",
|
|
Help: "EU (Ireland) Region Region\nNeeds location constraint EU or eu-west-1.",
|
|
}, {
|
|
Value: "https://s3-ap-southeast-1.amazonaws.com",
|
|
Help: "Asia Pacific (Singapore) Region\nNeeds location constraint ap-southeast-1.",
|
|
}, {
|
|
Value: "https://s3-ap-southeast-2.amazonaws.com",
|
|
Help: "Asia Pacific (Sydney) Region\nNeeds location constraint .",
|
|
}, {
|
|
Value: "https://s3-ap-northeast-1.amazonaws.com",
|
|
Help: "Asia Pacific (Tokyo) Region\nNeeds location constraint ap-northeast-1.",
|
|
}, {
|
|
Value: "https://s3-sa-east-1.amazonaws.com",
|
|
Help: "South America (Sao Paulo) Region\nNeeds location constraint sa-east-1.",
|
|
}},
|
|
}, {
|
|
Name: "location_constraint",
|
|
Help: "Location constraint - must be set to match the Endpoint.",
|
|
Examples: []fs.OptionExample{{
|
|
Value: "",
|
|
Help: "Empty for US Region, Northern Virginia or Pacific Northwest.",
|
|
}, {
|
|
Value: "us-west-2",
|
|
Help: "US West (Oregon) Region.",
|
|
}, {
|
|
Value: "us-west-1",
|
|
Help: "US West (Northern California) Region.",
|
|
}, {
|
|
Value: "eu-west-1",
|
|
Help: "EU (Ireland) Region.",
|
|
}, {
|
|
Value: "EU",
|
|
Help: "EU Region.",
|
|
}, {
|
|
Value: "ap-southeast-1",
|
|
Help: "Asia Pacific (Singapore) Region.",
|
|
}, {
|
|
Value: "ap-southeast-2",
|
|
Help: "Asia Pacific (Sydney) Region.",
|
|
}, {
|
|
Value: "ap-northeast-1",
|
|
Help: "Asia Pacific (Tokyo) Region.",
|
|
}, {
|
|
Value: "sa-east-1",
|
|
Help: "South America (Sao Paulo) Region.",
|
|
}},
|
|
}},
|
|
})
|
|
}
|
|
|
|
// Constants
|
|
const (
|
|
metaMtime = "X-Amz-Meta-Mtime" // the meta key to store mtime in
|
|
listChunkSize = 1024 // number of items to read at once
|
|
)
|
|
|
|
// FsS3 represents a remote s3 server
|
|
type FsS3 struct {
|
|
c *s3.S3 // the connection to the s3 server
|
|
b *s3.Bucket // the connection to the bucket
|
|
bucket string // the bucket we are working on
|
|
perm s3.ACL // permissions for new buckets / objects
|
|
root string // root of the bucket - ignore all objects above this
|
|
}
|
|
|
|
// FsObjectS3 describes a s3 object
|
|
type FsObjectS3 struct {
|
|
// Will definitely have everything but meta which may be nil
|
|
//
|
|
// List will read everything but meta - to fill that in need to call
|
|
// readMetaData
|
|
s3 *FsS3 // what this object is part of
|
|
remote string // The remote path
|
|
etag string // md5sum of the object
|
|
bytes int64 // size of the object
|
|
lastModified time.Time // Last modified
|
|
meta s3.Headers // The object metadata if known - may be nil
|
|
}
|
|
|
|
// ------------------------------------------------------------
|
|
|
|
// String converts this FsS3 to a string
|
|
func (f *FsS3) String() string {
|
|
if f.root == "" {
|
|
return fmt.Sprintf("S3 bucket %s", f.bucket)
|
|
}
|
|
return fmt.Sprintf("S3 bucket %s path %s", f.bucket, f.root)
|
|
}
|
|
|
|
// Pattern to match a s3 path
|
|
var matcher = regexp.MustCompile(`^([^/]*)(.*)$`)
|
|
|
|
// parseParse parses a s3 'url'
|
|
func s3ParsePath(path string) (bucket, directory string, err error) {
|
|
parts := matcher.FindStringSubmatch(path)
|
|
if parts == nil {
|
|
err = fmt.Errorf("Couldn't parse bucket out of s3 path %q", path)
|
|
} else {
|
|
bucket, directory = parts[1], parts[2]
|
|
directory = strings.Trim(directory, "/")
|
|
}
|
|
return
|
|
}
|
|
|
|
// s3Connection makes a connection to s3
|
|
func s3Connection(name string) (*s3.S3, error) {
|
|
// Make the auth
|
|
accessKeyId := fs.ConfigFile.MustValue(name, "access_key_id")
|
|
if accessKeyId == "" {
|
|
return nil, errors.New("access_key_id not found")
|
|
}
|
|
secretAccessKey := fs.ConfigFile.MustValue(name, "secret_access_key")
|
|
if secretAccessKey == "" {
|
|
return nil, errors.New("secret_access_key not found")
|
|
}
|
|
auth := aws.Auth{AccessKey: accessKeyId, SecretKey: secretAccessKey}
|
|
|
|
// FIXME look through all the regions by name and use one of them if found
|
|
|
|
// Synthesize the region
|
|
s3Endpoint := fs.ConfigFile.MustValue(name, "endpoint")
|
|
if s3Endpoint == "" {
|
|
s3Endpoint = "https://s3.amazonaws.com/"
|
|
}
|
|
region := aws.Region{
|
|
Name: "s3",
|
|
S3Endpoint: s3Endpoint,
|
|
S3LocationConstraint: false,
|
|
}
|
|
s3LocationConstraint := fs.ConfigFile.MustValue(name, "location_constraint")
|
|
if s3LocationConstraint != "" {
|
|
region.Name = s3LocationConstraint
|
|
region.S3LocationConstraint = true
|
|
}
|
|
|
|
c := s3.New(auth, region)
|
|
c.Client = fs.Config.Client()
|
|
return c, nil
|
|
}
|
|
|
|
// NewFsS3 contstructs an FsS3 from the path, bucket:path
|
|
func NewFs(name, root string) (fs.Fs, error) {
|
|
bucket, directory, err := s3ParsePath(root)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
c, err := s3Connection(name)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
f := &FsS3{
|
|
c: c,
|
|
bucket: bucket,
|
|
b: c.Bucket(bucket),
|
|
perm: s3.Private, // FIXME need user to specify
|
|
root: directory,
|
|
}
|
|
if f.root != "" {
|
|
f.root += "/"
|
|
// Check to see if the object exists
|
|
_, err = f.b.Head(directory, nil)
|
|
if err == nil {
|
|
remote := path.Base(directory)
|
|
f.root = path.Dir(directory)
|
|
if f.root == "." {
|
|
f.root = ""
|
|
} else {
|
|
f.root += "/"
|
|
}
|
|
obj := f.NewFsObject(remote)
|
|
// return a Fs Limited to this object
|
|
return fs.NewLimited(f, obj), nil
|
|
}
|
|
}
|
|
return f, nil
|
|
}
|
|
|
|
// Return an FsObject from a path
|
|
//
|
|
// May return nil if an error occurred
|
|
func (f *FsS3) newFsObjectWithInfo(remote string, info *s3.Key) fs.Object {
|
|
o := &FsObjectS3{
|
|
s3: f,
|
|
remote: remote,
|
|
}
|
|
if info != nil {
|
|
// Set info but not meta
|
|
var err error
|
|
o.lastModified, err = time.Parse(time.RFC3339, info.LastModified)
|
|
if err != nil {
|
|
fs.Log(o, "Failed to read last modified: %s", err)
|
|
o.lastModified = time.Now()
|
|
}
|
|
o.etag = info.ETag
|
|
o.bytes = info.Size
|
|
} else {
|
|
err := o.readMetaData() // reads info and meta, returning an error
|
|
if err != nil {
|
|
// logged already FsDebug("Failed to read info: %s", err)
|
|
return nil
|
|
}
|
|
}
|
|
return o
|
|
}
|
|
|
|
// Return an FsObject from a path
|
|
//
|
|
// May return nil if an error occurred
|
|
func (f *FsS3) NewFsObject(remote string) fs.Object {
|
|
return f.newFsObjectWithInfo(remote, nil)
|
|
}
|
|
|
|
// list the objects into the function supplied
|
|
//
|
|
// If directories is set it only sends directories
|
|
func (f *FsS3) list(directories bool, fn func(string, *s3.Key)) {
|
|
delimiter := ""
|
|
if directories {
|
|
delimiter = "/"
|
|
}
|
|
marker := ""
|
|
for {
|
|
objects, err := f.b.List(f.root, delimiter, marker, listChunkSize)
|
|
if err != nil {
|
|
fs.Stats.Error()
|
|
fs.ErrorLog(f, "Couldn't read bucket %q: %s", f.bucket, err)
|
|
} else {
|
|
rootLength := len(f.root)
|
|
if directories {
|
|
for _, remote := range objects.CommonPrefixes {
|
|
if !strings.HasPrefix(remote, f.root) {
|
|
fs.Log(f, "Odd name received %q", remote)
|
|
continue
|
|
}
|
|
remote := remote[rootLength:]
|
|
if strings.HasSuffix(remote, "/") {
|
|
remote = remote[:len(remote)-1]
|
|
}
|
|
fn(remote, &s3.Key{Key: remote})
|
|
}
|
|
} else {
|
|
for i := range objects.Contents {
|
|
object := &objects.Contents[i]
|
|
if !strings.HasPrefix(object.Key, f.root) {
|
|
fs.Log(f, "Odd name received %q", object.Key)
|
|
continue
|
|
}
|
|
remote := object.Key[rootLength:]
|
|
fn(remote, object)
|
|
}
|
|
}
|
|
}
|
|
if !objects.IsTruncated {
|
|
break
|
|
}
|
|
// Use NextMarker if set, otherwise use last Key
|
|
marker = objects.NextMarker
|
|
if marker == "" {
|
|
marker = objects.Contents[len(objects.Contents)-1].Key
|
|
}
|
|
}
|
|
}
|
|
|
|
// Walk the path returning a channel of FsObjects
|
|
func (f *FsS3) List() fs.ObjectsChan {
|
|
out := make(fs.ObjectsChan, fs.Config.Checkers)
|
|
if f.bucket == "" {
|
|
// Return no objects at top level list
|
|
close(out)
|
|
fs.Stats.Error()
|
|
fs.ErrorLog(f, "Can't list objects at root - choose a bucket using lsd")
|
|
} else {
|
|
go func() {
|
|
defer close(out)
|
|
f.list(false, func(remote string, object *s3.Key) {
|
|
if fs := f.newFsObjectWithInfo(remote, object); fs != nil {
|
|
out <- fs
|
|
}
|
|
})
|
|
}()
|
|
}
|
|
return out
|
|
}
|
|
|
|
// Lists the buckets
|
|
func (f *FsS3) ListDir() fs.DirChan {
|
|
out := make(fs.DirChan, fs.Config.Checkers)
|
|
if f.bucket == "" {
|
|
// List the buckets
|
|
go func() {
|
|
defer close(out)
|
|
buckets, err := f.c.ListBuckets()
|
|
if err != nil {
|
|
fs.Stats.Error()
|
|
fs.ErrorLog(f, "Couldn't list buckets: %s", err)
|
|
} else {
|
|
for _, bucket := range buckets {
|
|
out <- &fs.Dir{
|
|
Name: bucket.Name,
|
|
When: bucket.CreationDate,
|
|
Bytes: -1,
|
|
Count: -1,
|
|
}
|
|
}
|
|
}
|
|
}()
|
|
} else {
|
|
// List the directories in the path in the bucket
|
|
go func() {
|
|
defer close(out)
|
|
f.list(true, func(remote string, object *s3.Key) {
|
|
out <- &fs.Dir{
|
|
Name: remote,
|
|
Bytes: object.Size,
|
|
Count: 0,
|
|
}
|
|
})
|
|
}()
|
|
}
|
|
return out
|
|
}
|
|
|
|
// Put the FsObject into the bucket
|
|
func (f *FsS3) Put(in io.Reader, remote string, modTime time.Time, size int64) (fs.Object, error) {
|
|
// Temporary FsObject under construction
|
|
fs := &FsObjectS3{s3: f, remote: remote}
|
|
return fs, fs.Update(in, modTime, size)
|
|
}
|
|
|
|
// Mkdir creates the bucket if it doesn't exist
|
|
func (f *FsS3) Mkdir() error {
|
|
err := f.b.PutBucket(f.perm)
|
|
if err, ok := err.(*s3.Error); ok {
|
|
if err.Code == "BucketAlreadyOwnedByYou" {
|
|
return nil
|
|
}
|
|
}
|
|
return err
|
|
}
|
|
|
|
// Rmdir deletes the bucket
|
|
//
|
|
// Returns an error if it isn't empty
|
|
func (f *FsS3) Rmdir() error {
|
|
return f.b.DelBucket()
|
|
}
|
|
|
|
// Return the precision
|
|
func (f *FsS3) Precision() time.Duration {
|
|
return time.Nanosecond
|
|
}
|
|
|
|
// ------------------------------------------------------------
|
|
|
|
// Return the parent Fs
|
|
func (o *FsObjectS3) Fs() fs.Fs {
|
|
return o.s3
|
|
}
|
|
|
|
// Return a string version
|
|
func (o *FsObjectS3) String() string {
|
|
if o == nil {
|
|
return "<nil>"
|
|
}
|
|
return o.remote
|
|
}
|
|
|
|
// Return the remote path
|
|
func (o *FsObjectS3) Remote() string {
|
|
return o.remote
|
|
}
|
|
|
|
var matchMd5 = regexp.MustCompile(`^[0-9a-f]{32}$`)
|
|
|
|
// Md5sum returns the Md5sum of an object returning a lowercase hex string
|
|
func (o *FsObjectS3) Md5sum() (string, error) {
|
|
etag := strings.Trim(strings.ToLower(o.etag), `"`)
|
|
// Check the etag is a valid md5sum
|
|
if !matchMd5.MatchString(etag) {
|
|
fs.Debug(o, "Invalid md5sum (probably multipart uploaded) - ignoring: %q", etag)
|
|
return "", nil
|
|
}
|
|
return etag, nil
|
|
}
|
|
|
|
// Size returns the size of an object in bytes
|
|
func (o *FsObjectS3) Size() int64 {
|
|
return o.bytes
|
|
}
|
|
|
|
// readMetaData gets the metadata if it hasn't already been fetched
|
|
//
|
|
// if we get a 404 error then we retry a few times for eventual
|
|
// consistency reasons
|
|
//
|
|
// it also sets the info
|
|
func (o *FsObjectS3) readMetaData() (err error) {
|
|
if o.meta != nil {
|
|
return nil
|
|
}
|
|
var headers s3.Headers
|
|
|
|
// Try reading the metadata a few times (with exponential
|
|
// backoff) to get around eventual consistency on 404 error
|
|
for tries := uint(0); tries < 10; tries++ {
|
|
headers, err = o.s3.b.Head(o.s3.root+o.remote, nil)
|
|
if s3Err, ok := err.(*s3.Error); ok {
|
|
if s3Err.StatusCode == http.StatusNotFound {
|
|
time.Sleep(5 * time.Millisecond << tries)
|
|
continue
|
|
}
|
|
}
|
|
break
|
|
}
|
|
if err != nil {
|
|
fs.Debug(o, "Failed to read info: %s", err)
|
|
return err
|
|
}
|
|
var size int64
|
|
// Ignore missing Content-Length assuming it is 0
|
|
// Some versions of ceph do this due their apache proxies
|
|
if contentLength, ok := headers["Content-Length"]; ok {
|
|
size, err = strconv.ParseInt(contentLength, 10, 64)
|
|
if err != nil {
|
|
fs.Debug(o, "Failed to read size from: %q", headers)
|
|
return err
|
|
}
|
|
}
|
|
o.etag = headers["Etag"]
|
|
o.bytes = size
|
|
o.meta = headers
|
|
if o.lastModified, err = time.Parse(http.TimeFormat, headers["Last-Modified"]); err != nil {
|
|
fs.Log(o, "Failed to read last modified from HEAD: %s", err)
|
|
o.lastModified = time.Now()
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// ModTime returns the modification time of the object
|
|
//
|
|
// It attempts to read the objects mtime and if that isn't present the
|
|
// LastModified returned in the http headers
|
|
func (o *FsObjectS3) ModTime() time.Time {
|
|
err := o.readMetaData()
|
|
if err != nil {
|
|
fs.Log(o, "Failed to read metadata: %s", err)
|
|
return time.Now()
|
|
}
|
|
// read mtime out of metadata if available
|
|
d, ok := o.meta[metaMtime]
|
|
if !ok {
|
|
// fs.Debug(o, "No metadata")
|
|
return o.lastModified
|
|
}
|
|
modTime, err := swift.FloatStringToTime(d)
|
|
if err != nil {
|
|
fs.Log(o, "Failed to read mtime from object: %s", err)
|
|
return o.lastModified
|
|
}
|
|
return modTime
|
|
}
|
|
|
|
// Sets the modification time of the local fs object
|
|
func (o *FsObjectS3) SetModTime(modTime time.Time) {
|
|
err := o.readMetaData()
|
|
if err != nil {
|
|
fs.Stats.Error()
|
|
fs.ErrorLog(o, "Failed to read metadata: %s", err)
|
|
return
|
|
}
|
|
o.meta[metaMtime] = swift.TimeToFloatString(modTime)
|
|
_, err = o.s3.b.Update(o.s3.root+o.remote, o.s3.perm, o.meta)
|
|
if err != nil {
|
|
fs.Stats.Error()
|
|
fs.ErrorLog(o, "Failed to update remote mtime: %s", err)
|
|
}
|
|
}
|
|
|
|
// Is this object storable
|
|
func (o *FsObjectS3) Storable() bool {
|
|
return true
|
|
}
|
|
|
|
// Open an object for read
|
|
func (o *FsObjectS3) Open() (in io.ReadCloser, err error) {
|
|
in, err = o.s3.b.GetReader(o.s3.root + o.remote)
|
|
return
|
|
}
|
|
|
|
// Update the Object from in with modTime and size
|
|
func (o *FsObjectS3) Update(in io.Reader, modTime time.Time, size int64) error {
|
|
// Set the mtime in the headers
|
|
headers := s3.Headers{
|
|
metaMtime: swift.TimeToFloatString(modTime),
|
|
}
|
|
|
|
_, err := o.s3.b.PutReaderHeaders(o.s3.root+o.remote, in, size, fs.MimeType(o), o.s3.perm, headers)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
// Read the metadata from the newly created object
|
|
o.meta = nil // wipe old metadata
|
|
err = o.readMetaData()
|
|
return err
|
|
}
|
|
|
|
// Remove an object
|
|
func (o *FsObjectS3) Remove() error {
|
|
return o.s3.b.Del(o.s3.root + o.remote)
|
|
}
|
|
|
|
// Check the interfaces are satisfied
|
|
var _ fs.Fs = &FsS3{}
|
|
var _ fs.Object = &FsObjectS3{}
|