This is done by pacing the requests to Drive and backing them off with an exponentially increasing delay. Put and Modify operations can now also be retried.
// Drive interface
package drive
// FIXME need to deal with some corner cases
// * multiple files with the same name
// * files can be in multiple directories
// * can have directory loops
// * files with / in name
import (
// Constants
const (
// OAuth client credentials used as the defaults for driveAuth.
// NOTE(review): the client secret is hard-coded in source - confirm this is intended.
rcloneClientId = ""
rcloneClientSecret = "X4Z3ca8xfWDb1Voo-F9a7ZxJ"
// MIME type compared against a drive item's MimeType to recognise directories
driveFolderType = "application/"
// Layout used to parse modification dates held on drive items
timeFormatIn = time.RFC3339
// Layout used to format modification dates sent to drive
timeFormatOut = "2006-01-02T15:04:05.000000000Z07:00"
// Lower and upper bounds that paceRefresh applies to the pacing sleep time
minSleep = 10 * time.Millisecond
maxSleep = 2 * time.Second
decayConstant = 2 // bigger for slower decay, exponential
// Globals
var (
// Flags
// driveFullList makes List use listDirFull instead of
// listDirRecursive when the root is ""
driveFullList = pflag.BoolP("drive-full-list", "", true, "Use a full listing for directory list. More data but usually quicker.")
// Description of how to auth for this app
// The default credentials are rclone's own client id and secret
driveAuth = &googleauth.Auth{
Scope: "",
DefaultClientId: rcloneClientId,
DefaultClientSecret: rcloneClientSecret,
// Register with Fs
//
// The registration describes the backend: its name ("drive"), its
// constructor (NewFs), a config callback and the options which the
// user can set (client_id and client_secret, both of which may be
// left blank to use rclone's).
func init() {
Name: "drive",
NewFs: NewFs,
Config: func(name string) {
Options: []fs.Option{{
Name: "client_id",
Help: "Google Application Client Id - leave blank to use rclone's.",
}, {
Name: "client_secret",
Help: "Google Application Client Secret - leave blank to use rclone's.",
// FsDrive represents a remote drive server
//
// As well as the connection it carries the directory cache and the
// pacing state (pacer, sleepTime) used to rate limit the API calls.
type FsDrive struct {
svc *drive.Service // the connection to the drive server
root string // the path we are working on
client *http.Client // authorized client
about *drive.About // information about the drive, including the root
rootId string // Id of the root directory
foundRoot bool // Whether we have found the root or not
findRootLock sync.Mutex // Protect findRoot from concurrent use
dirCache dirCache // Map of directory path to directory id and back
findDirLock sync.Mutex // Protect findDir from concurrent use
pacer chan struct{} // Token channel to pace the operations - made with capacity 1 in NewFs
sleepTime time.Duration // Time to sleep for each transaction - adjusted by paceRefresh
// FsObjectDrive describes a drive object
//
// The metadata fields are filled in from a drive.File by setMetaData.
type FsObjectDrive struct {
drive *FsDrive // what this object is part of
remote string // The remote path
id string // Drive Id of this object
url string // Download URL of this object
md5sum string // md5sum of the object, stored in lower case
bytes int64 // size of the object
modifiedDate string // RFC3339 time it was last modified - parsed with timeFormatIn
// dirCache caches paths to directory Ids and vice versa
//
// Put keeps the two maps in step with each other.
type dirCache struct {
cache map[string]string // directory path -> directory Id
invCache map[string]string // directory Id -> directory path
// newDirCache makes a new dirCache and returns it by value
//
// NOTE(review): the maps inside dirCache are only seen being
// allocated in Flush - confirm they are initialised before the first
// Put, since writing to a nil map panics.
func newDirCache() dirCache {
d := dirCache{}
return d
// Get gets an Id given a path
//
// ok is false if the path isn't in the cache.
func (m *dirCache) Get(path string) (id string, ok bool) {
id, ok = m.cache[path]
// GetInv gets a path given an Id
//
// NOTE: the names in the signature are the wrong way round for this
// inverse lookup - the parameter called path is the directory Id used
// as the key into invCache, and the result called id is the directory
// path found there. ok is false if the Id isn't in the cache.
func (m *dirCache) GetInv(path string) (id string, ok bool) {
id, ok = m.invCache[path]
// Put a path, id into the map
//
// Both directions are stored: path -> id in cache and id -> path in
// invCache.
func (m *dirCache) Put(path, id string) {
m.cache[path] = id
m.invCache[id] = path
// Flush the map of all data
//
// Both maps are replaced with newly made empty ones.
func (m *dirCache) Flush() {
m.cache = make(map[string]string)
m.invCache = make(map[string]string)
// String converts this FsDrive to a string
//
// The result includes the root path being worked on.
func (f *FsDrive) String() string {
return fmt.Sprintf("Google drive root '%s'", f.root)
// paceWait waits for the pace
//
// It starts a goroutine which puts a token back into f.pacer.
func (f *FsDrive) paceWait() {
// pacer starts with a token in and whenever we take one out
// XXX ms later we put another in. We could do this with a
// Ticker more accurately, but then we'd have to work out how
// not to run it when it wasn't needed
// Restart the timer
go func(t time.Duration) {
// fs.Debug(f, "New sleep for %v at %v", t, time.Now())
f.pacer <- struct{}{}
// paceRefresh refreshes the pace given an error that was returned. It
// returns a boolean as to whether the operation should be retried.
//
// If err is nil the sleep time decays towards minSleep: it is
// multiplied by (2^decayConstant - 1) / 2^decayConstant, which is 3/4
// for a decayConstant of 2.
//
// If err is a *googleapi.Error whose first reason is
// "rateLimitExceeded" or "userRateLimitExceeded" the sleep time is
// doubled, up to maxSleep, and a retry is requested.
func (f *FsDrive) paceRefresh(err error) bool {
again := false
oldSleepTime := f.sleepTime
if err == nil {
// Decay the sleep time, computed with shifts to stay in integer arithmetic
f.sleepTime = (f.sleepTime<<decayConstant - f.sleepTime) >> decayConstant
if f.sleepTime < minSleep {
f.sleepTime = minSleep
// Only log when the sleep time actually changed
if f.sleepTime != oldSleepTime {
fs.Debug(f, "Reducing sleep to %v", f.sleepTime)
} else {
fs.Debug(f, "Error recived: %v", err)
if gerr, ok := err.(*googleapi.Error); ok {
if len(gerr.Errors) > 0 {
// Only the first reported error is examined
reason := gerr.Errors[0].Reason
if reason == "rateLimitExceeded" || reason == "userRateLimitExceeded" {
f.sleepTime *= 2
if f.sleepTime > maxSleep {
f.sleepTime = maxSleep
if f.sleepTime != oldSleepTime {
fs.Debug(f, "Rate limited, increasing sleep to %v", f.sleepTime)
again = true
return again
// pace paces the remote operations to not exceed Google's limits and
// retries on 403 rate limit exceeded
//
// This calls fn, expecting it to place its error in perr
//
// The error in perr is passed to paceRefresh which decides whether
// the loop should go round again.
func (f *FsDrive) pace(perr *error, fn func()) {
for {
if !f.paceRefresh(*perr) {
// parseDrivePath parses a drive 'url'
//
// The root is the path with any leading and trailing "/" removed.
func parseDrivePath(path string) (root string, err error) {
root = strings.Trim(path, "/")
// listAllFn is the user function to process a File item from listAll
//
// Should return true to finish processing
type listAllFn func(*drive.File) bool
// listAll lists the directory required calling the user function on
// each item found
//
// If the user fn ever returns true then it early exits with found = true
//
// The search query always excludes trashed items and is narrowed by
// the parameters:
//
//   dirId           - if not "" only items with this parent
//   title           - if not "" only items with exactly this title
//   directoriesOnly - only items whose mimeType is driveFolderType
//   filesOnly       - only items whose mimeType isn't driveFolderType
//
// A listing error is returned wrapped as "Couldn't list directory".
func (f *FsDrive) listAll(dirId string, title string, directoriesOnly bool, filesOnly bool, fn listAllFn) (found bool, err error) {
query := fmt.Sprintf("trashed=false")
if dirId != "" {
query += fmt.Sprintf(" and '%s' in parents", dirId)
if title != "" {
// Escaping the backslash isn't documented but seems to work
// Backslashes must be escaped before quotes so the backslash
// added for a quote isn't itself doubled
title = strings.Replace(title, `\`, `\\`, -1)
title = strings.Replace(title, `'`, `\'`, -1)
query += fmt.Sprintf(" and title='%s'", title)
if directoriesOnly {
query += fmt.Sprintf(" and mimeType='%s'", driveFolderType)
if filesOnly {
query += fmt.Sprintf(" and mimeType!='%s'", driveFolderType)
// fmt.Printf("listAll Query = %q\n", query)
// Ask for up to 1000 results per page
list := f.svc.Files.List().Q(query).MaxResults(1000)
for {
var files *drive.FileList
// Fetch a page of results through the pacer
f.pace(&err, func() {
files, err = list.Do()
if err != nil {
return false, fmt.Errorf("Couldn't list directory: %s", err)
for _, item := range files.Items {
if fn(item) {
found = true
break OUTER
// An empty NextPageToken means there are no more pages
if files.NextPageToken == "" {
// NewFs constructs an FsDrive from the path, container:path
//
// It makes an authorized drive client, reads the About information
// and then looks for the root directory. If the root can't be found
// as a directory it is assumed to point to a file, in which case an
// Fs limited to that one object is returned if the file exists,
// otherwise the original Fs is returned.
func NewFs(name, path string) (fs.Fs, error) {
t, err := driveAuth.NewTransport(name)
if err != nil {
return nil, err
root, err := parseDrivePath(path)
if err != nil {
return nil, err
f := &FsDrive{
root: root,
dirCache: newDirCache(),
pacer: make(chan struct{}, 1),
sleepTime: minSleep,
// Put the first pacing token in
f.pacer <- struct{}{}
// Create a new authorized Drive client.
f.client = t.Client()
f.svc, err = drive.New(f.client)
if err != nil {
return nil, fmt.Errorf("Couldn't create Drive client: %s", err)
// Read About so we know the root path
f.pace(&err, func() {
f.about, err = f.svc.About.Get().Do()
if err != nil {
return nil, fmt.Errorf("Couldn't read info about Drive: %s", err)
// Find the Id of the true root and clear everything
// Find the current root
err = f.findRoot(false)
if err != nil {
// Assume it is a file
newRoot, remote := splitPath(root)
// NOTE(review): this copies the FsDrive by value, including
// its two mutexes, while the maps inside dirCache stay shared
// with f - confirm this is intended
newF := *f
newF.root = newRoot
// Make new Fs which is the parent
err = newF.findRoot(false)
if err != nil {
// No root so return old f
return f, nil
obj, err := newF.newFsObjectWithInfoErr(remote, nil)
if err != nil {
// File doesn't exist so return old f
return f, nil
// return a Fs Limited to this object
return fs.NewLimited(&newF, obj), nil
// fmt.Printf("Root id %s", f.rootId)
return f, nil
// newFsObjectWithInfoErr returns an FsObject from a path
//
// If info is nil then the metadata is read with readMetaData and any
// error from that is returned with a nil object.
//
// NOTE: the local variable fs shadows the imported fs package for the
// rest of this function.
func (f *FsDrive) newFsObjectWithInfoErr(remote string, info *drive.File) (fs.Object, error) {
fs := &FsObjectDrive{
drive: f,
remote: remote,
if info != nil {
} else {
err := fs.readMetaData() // reads info and meta, returning an error
if err != nil {
// logged already fs.Debug("Failed to read info: %s", err)
return nil, err
return fs, nil
// newFsObjectWithInfo returns an FsObject from a path
//
// May return nil if an error occurred
//
// This is newFsObjectWithInfoErr with the error discarded.
func (f *FsDrive) newFsObjectWithInfo(remote string, info *drive.File) fs.Object {
fs, _ := f.newFsObjectWithInfoErr(remote, info)
// Errors have already been logged
return fs
// NewFsObject returns an FsObject from a path
//
// May return nil if an error occurred
//
// No file info is passed on, so the metadata is read from drive.
func (f *FsDrive) NewFsObject(remote string) fs.Object {
return f.newFsObjectWithInfo(remote, nil)
// listDirRecursive lists the directory using a recursive list from
// the root
//
// Path should be directory path either "" or "path/"
//
// This fetches the minimum amount of stuff but does more API calls
// which makes it slow
//
// Objects found are sent to out. The first error met, either from
// listing this directory or from a sub directory, is returned.
func (f *FsDrive) listDirRecursive(dirId string, path string, out fs.ObjectsChan) error {
// subError carries an error out of the callback
var subError error
// Make the API request
_, err := f.listAll(dirId, "", false, false, func(item *drive.File) bool {
// Recurse on directories
// FIXME should do this in parallel
// use a wg to sync then collect error
if item.MimeType == driveFolderType {
subError = f.listDirRecursive(item.Id, path+item.Title+"/", out)
if subError != nil {
// Returning true stops the listing early
return true
} else {
// If item has no MD5 sum it isn't stored on drive, so ignore it
if item.Md5Checksum != "" {
if fs := f.newFsObjectWithInfo(path+item.Title, item); fs != nil {
out <- fs
return false
if err != nil {
return err
if subError != nil {
return subError
return nil
// listDirFull lists the directory using a full listing and filtering
// out unwanted items
//
// Path should be directory path either "" or "path/"
//
// This is fast in terms of number of API calls, but slow in terms of
// fetching more data than it needs
//
// Items can arrive before their parent directory. Such items are held
// as orphans keyed on the parent Id and are output when the parent
// directory turns up.
func (f *FsDrive) listDirFull(dirId string, path string, out fs.ObjectsChan) error {
// Orphans waiting for their parent
orphans := make(map[string][]*drive.File)
var outputItem func(*drive.File, string) // forward def for recursive fn
// Output an item or directory
outputItem = func(item *drive.File, directory string) {
// fmt.Printf("found %q %q parent %q dir %q ok %s\n", item.Title, item.Id, parentId, directory, ok)
// This path shadows the path parameter of listDirFull
path := item.Title
if directory != "" {
path = directory + "/" + path
if item.MimeType == driveFolderType {
// Put the directory into the dircache
f.dirCache.Put(path, item.Id)
// fmt.Printf("directory %s %s %s\n", path, item.Title, item.Id)
// Collect the orphans if any
for _, orphan := range orphans[item.Id] {
// fmt.Printf("rescuing orphan %s %s %s\n", path, orphan.Title, orphan.Id)
outputItem(orphan, path)
delete(orphans, item.Id)
} else {
// fmt.Printf("file %s %s %s\n", path, item.Title, item.Id)
// If item has no MD5 sum it isn't stored on drive, so ignore it
if item.Md5Checksum != "" {
if fs := f.newFsObjectWithInfo(path, item); fs != nil {
out <- fs
// Make the API request
// An empty dirId and title means the listing isn't narrowed to a directory
_, err := f.listAll("", "", false, false, func(item *drive.File) bool {
if len(item.Parents) == 0 {
// fmt.Printf("no parents %s %s: %#v\n", item.Title, item.Id, item)
return false
// Only the first parent is considered
parentId := item.Parents[0].Id
directory, ok := f.dirCache.GetInv(parentId)
if !ok {
// Haven't found the parent yet so add to orphans
// fmt.Printf("orphan[%s] %s %s\n", parentId, item.Title, item.Id)
orphans[parentId] = append(orphans[parentId], item)
} else {
outputItem(item, directory)
return false
if err != nil {
return err
if len(orphans) > 0 {
// fmt.Printf("Orphans!!!! %v", orphans)
return nil
// splitPath splits a path into directory, leaf
//
// Path shouldn't start or end with a /
//
// If there are no slashes then directory will be "" and leaf = path
//
// The split is made at the last slash, so "a/b/c" gives a directory
// of "a/b" and a leaf of "c".
func splitPath(path string) (directory, leaf string) {
lastSlash := strings.LastIndex(path, "/")
if lastSlash >= 0 {
directory = path[:lastSlash]
leaf = path[lastSlash+1:]
} else {
directory = ""
leaf = path
// findDir finds the directory passed in returning the directory Id
// starting from pathId
//
// Path shouldn't start or end with a /
//
// If create is set it will make the directory if not found
//
// Algorithm:
//  Look in the cache for the path, if found return the pathId
//  If not found strip the last path off the path and recurse
//  Now have a parent directory id, so look in the parent for self and return it
func (f *FsDrive) findDir(path string, create bool) (pathId string, err error) {
// Try the cache first
pathId = f._findDirInCache(path)
if pathId != "" {
defer f.findDirLock.Unlock()
return f._findDir(path, create)
// _findDirInCache looks for the root and in the cache - safe to call
// without the findDirLock
//
// It returns the directory Id, or "" if the path is neither the root
// nor in the cache.
func (f *FsDrive) _findDirInCache(path string) string {
// fmt.Println("Finding",path,"create",create,"cache",cache)
// If it is the root, then return it
if path == "" {
// fmt.Println("Root")
return f.rootId
// If it is in the cache then return it
pathId, ok := f.dirCache.Get(path)
if ok {
// fmt.Println("Cache hit on", path)
return pathId
return ""
// _findDir is the unlocked findDir - must have findDirLock
//
// It looks in the cache, then recurses to find the Id of the parent
// directory and lists the parent looking for a directory called leaf.
// If the directory isn't found it is created if create is set,
// otherwise an error is returned. The Id found or created is stored
// in the cache.
func (f *FsDrive) _findDir(path string, create bool) (pathId string, err error) {
pathId = f._findDirInCache(path)
if pathId != "" {
// Split the path into directory, leaf
directory, leaf := splitPath(path)
// Recurse and find pathId for directory
pathId, err = f._findDir(directory, create)
if err != nil {
return pathId, err
// Find the leaf in pathId
// Only directories are listed, and the title is checked again in the callback
found, err := f.listAll(pathId, leaf, true, false, func(item *drive.File) bool {
if item.Title == leaf {
pathId = item.Id
return true
return false
if err != nil {
return pathId, err
// If not found create the directory if required or return an error
if !found {
if create {
// fmt.Println("Making", path)
// Define the metadata for the directory we are going to create.
createInfo := &drive.File{
Title: leaf,
Description: leaf,
MimeType: driveFolderType,
Parents: []*drive.ParentReference{{Id: pathId}},
var info *drive.File
// Make the directory through the pacer
f.pace(&err, func() {
info, err = f.svc.Files.Insert(createInfo).Do()
if err != nil {
return pathId, fmt.Errorf("Failed to make directory: %v", err)
pathId = info.Id
} else {
return pathId, fmt.Errorf("Couldn't find directory: %q", path)
// Store the directory in the cache
f.dirCache.Put(path, pathId)
// fmt.Println("Dir", path, "is", pathId)
return pathId, nil
// findRoot finds the root directory if not already found
//
// Resets the root directory
//
// If create is set it will make the directory if not found
//
// Once the root is found its Id is stored in rootId, put in the
// dirCache under "" and foundRoot is set, so later calls return
// straight away.
func (f *FsDrive) findRoot(create bool) error {
defer f.findRootLock.Unlock()
if f.foundRoot {
return nil
rootId, err := f.findDir(f.root, create)
if err != nil {
return err
f.rootId = rootId
// Put the root directory in
f.dirCache.Put("", f.rootId)
f.foundRoot = true
return nil
// resetRoot resets the root directory to the absolute root and clears
// the dirCache
//
// The absolute root Id comes from the About information. foundRoot is
// cleared, so the next findRoot will look for the root again.
func (f *FsDrive) resetRoot() {
defer f.findRootLock.Unlock()
f.foundRoot = false
// Put the true root in
f.rootId = f.about.RootFolderId
// Put the root directory in
f.dirCache.Put("", f.rootId)
// List walks the path returning a channel of FsObjects
//
// The listing runs in a goroutine which closes the channel when it
// has finished. Errors are logged rather than returned.
//
// A full listing is used if the root is "" and the drive-full-list
// flag is set, otherwise a recursive listing is used.
func (f *FsDrive) List() fs.ObjectsChan {
// The channel is buffered with fs.Config.Checkers entries
out := make(fs.ObjectsChan, fs.Config.Checkers)
go func() {
defer close(out)
err := f.findRoot(false)
if err != nil {
log.Printf("Couldn't find root: %s", err)
} else {
if f.root == "" && *driveFullList {
err = f.listDirFull(f.rootId, "", out)
} else {
err = f.listDirRecursive(f.rootId, "", out)
if err != nil {
log.Printf("List failed: %s", err)
return out
// ListDir lists the directories in the root returning a channel of
// fs.Dir
//
// The listing runs in a goroutine which closes the channel when it
// has finished. Errors are logged rather than returned.
//
// Bytes and Count are set to -1 in each fs.Dir.
func (f *FsDrive) ListDir() fs.DirChan {
out := make(fs.DirChan, fs.Config.Checkers)
go func() {
defer close(out)
err := f.findRoot(false)
if err != nil {
log.Printf("Couldn't find root: %s", err)
} else {
// List directories only
_, err := f.listAll(f.rootId, "", true, false, func(item *drive.File) bool {
dir := &fs.Dir{
Name: item.Title,
Bytes: -1,
Count: -1,
// The error from parsing the date is discarded
dir.When, _ = time.Parse(timeFormatIn, item.ModifiedDate)
out <- dir
return false
if err != nil {
log.Printf("ListDir failed: %s", err)
return out
// Put the object
//
// This assumes that the object doesn't already exist - if you call it
// when it does exist then it will create a duplicate. Call
// object.Update() in this case.
//
// Copy the reader in to the new object which is returned
//
// The new object may have been created if an error is returned
//
// The upload isn't retried here. If paceRefresh says the operation
// should be retried then a retry error is returned instead.
func (f *FsDrive) Put(in io.Reader, remote string, modTime time.Time, size int64) (fs.Object, error) {
// Temporary FsObject under construction
o := &FsObjectDrive{drive: f, remote: remote}
directory, leaf := splitPath(o.remote)
// Find the parent directory, making it if necessary
directoryId, err := f.findDir(directory, true)
if err != nil {
return o, fmt.Errorf("Couldn't find or make directory: %s", err)
// Guess the mime type
mimeType := mime.TypeByExtension(path.Ext(o.remote))
if mimeType == "" {
mimeType = "application/octet-stream"
modifiedDate := modTime.Format(timeFormatOut)
// Define the metadata for the file we are going to create.
createInfo := &drive.File{
Title: leaf,
Description: leaf,
Parents: []*drive.ParentReference{{Id: directoryId}},
MimeType: mimeType,
ModifiedDate: modifiedDate,
// Make the API request to upload metadata and file data.
in = &fs.SeekWrapper{In: in, Size: size}
var info *drive.File
// Don't retry, return a retry error instead
info, err = f.svc.Files.Insert(createInfo).Media(in).Do()
if f.paceRefresh(err) {
return o, fs.RetryErrorf("Upload failed - retry: %s", err)
if err != nil {
return o, fmt.Errorf("Upload failed: %s", err)
return o, nil
// Mkdir creates the container if it doesn't exist
//
// This is done by finding the root with create set.
func (f *FsDrive) Mkdir() error {
return f.findRoot(true)
// Rmdir deletes the container
//
// Returns an error if it isn't empty
//
// The directory is only deleted if it isn't the root of the drive,
// ie f.root isn't "".
func (f *FsDrive) Rmdir() error {
err := f.findRoot(false)
if err != nil {
return err
var children *drive.ChildList
// Any child at all means the directory isn't empty, so ask for
// at most 10 of them
f.pace(&err, func() {
children, err = f.svc.Children.List(f.rootId).MaxResults(10).Do()
if err != nil {
return err
if len(children.Items) > 0 {
return fmt.Errorf("Directory not empty: %#v", children.Items)
// Delete the directory if it isn't the root
if f.root != "" {
f.pace(&err, func() {
err = f.svc.Files.Delete(f.rootId).Do()
if err != nil {
return err
return nil
// Precision returns the precision of the modification times, which
// is one millisecond
func (fs *FsDrive) Precision() time.Duration {
return time.Millisecond
// Purge deletes all the files and the container
//
// Optional interface: Only implement this if you have a way of
// deleting all the files quicker than just running Remove() on the
// result of List()
//
// Purging the root of the drive (f.root of "") is refused with an
// error. Otherwise the root directory itself is deleted.
func (f *FsDrive) Purge() error {
if f.root == "" {
return fmt.Errorf("Can't purge root directory")
err := f.findRoot(false)
if err != nil {
return err
f.pace(&err, func() {
err = f.svc.Files.Delete(f.rootId).Do()
if err != nil {
return err
return nil
// Fs returns the parent Fs
func (o *FsObjectDrive) Fs() fs.Fs {
// String returns a string version of the object
//
// This is the remote path, or "<nil>" for a nil object.
func (o *FsObjectDrive) String() string {
if o == nil {
return "<nil>"
return o.remote
// Remote returns the remote path
func (o *FsObjectDrive) Remote() string {
return o.remote
// Md5sum returns the Md5sum of an object returning a lowercase hex string
//
// The value stored in the object is returned and the error is always nil.
func (o *FsObjectDrive) Md5sum() (string, error) {
return o.md5sum, nil
// Size returns the size of an object in bytes
//
// This is the value stored in the object.
func (o *FsObjectDrive) Size() int64 {
return o.bytes
// setMetaData sets the fs data from a drive.File
//
// The download URL, MD5 checksum, size and modified date are copied
// from info. The MD5 checksum is converted to lower case.
func (o *FsObjectDrive) setMetaData(info *drive.File) {
| = info.Id
o.url = info.DownloadUrl
o.md5sum = strings.ToLower(info.Md5Checksum)
o.bytes = info.FileSize
o.modifiedDate = info.ModifiedDate
// readMetaData gets the info if it hasn't already been fetched
//
// The remote path is split into directory and leaf and the listing is
// searched for an item whose title is the leaf. Failing to find the
// directory or the object is logged at debug level and returned as
// an error.
func (o *FsObjectDrive) readMetaData() (err error) {
if != "" {
return nil
directory, leaf := splitPath(o.remote)
directoryId, err :=, false)
if err != nil {
fs.Debug(o, "Couldn't find directory: %s", err)
return fmt.Errorf("Couldn't find directory: %s", err)
found, err :=, leaf, false, true, func(item *drive.File) bool {
if item.Title == leaf {
return true
return false
if err != nil {
return err
if !found {
fs.Debug(o, "Couldn't find object")
return fmt.Errorf("Couldn't find object")
return nil
// ModTime returns the modification time of the object
//
// It reads the metadata if necessary and parses the modified date
// stored in the object. If the metadata can't be read or the date
// can't be parsed then the failure is logged and the current time is
// returned.
func (o *FsObjectDrive) ModTime() time.Time {
err := o.readMetaData()
if err != nil {
fs.Log(o, "Failed to read metadata: %s", err)
return time.Now()
modTime, err := time.Parse(timeFormatIn, o.modifiedDate)
if err != nil {
fs.Log(o, "Failed to read mtime from object: %s", err)
return time.Now()
return modTime
// SetModTime sets the modification time of the drive object
//
// There is no error return, so failures are logged instead.
func (o *FsObjectDrive) SetModTime(modTime time.Time) {
err := o.readMetaData()
if err != nil {
fs.Log(o, "Failed to read metadata: %s", err)
// New metadata
// Only the modified date is filled in
updateInfo := &drive.File{
ModifiedDate: modTime.Format(timeFormatOut),
// Set modified date
var info *drive.File
|, func() {
info, err =, updateInfo).SetModifiedDate(true).Do()
if err != nil {
fs.Log(o, "Failed to update remote mtime: %s", err)
// Update info from read data
// Storable says whether this object is storable, which is always
// true for drive objects
func (o *FsObjectDrive) Storable() bool {
return true
// Open an object for read
//
// A GET request is made for the download URL of the object with the
// rclone User-Agent set. Any status other than 200 is returned as an
// error after closing the response body. On success the caller gets
// the response body to read from.
func (o *FsObjectDrive) Open() (in io.ReadCloser, err error) {
req, err := http.NewRequest("GET", o.url, nil)
if err != nil {
return nil, err
req.Header.Set("User-Agent", fs.UserAgent)
var res *http.Response
|, func() {
res, err =
if err != nil {
return nil, err
if res.StatusCode != 200 {
_ = res.Body.Close() // ignore error
return nil, fmt.Errorf("Bad response: %d: %s", res.StatusCode, res.Status)
return res.Body, nil
// Update the already existing object
//
// Copy the reader into the object updating modTime and size
//
// The new object may have been created if an error is returned
//
// The upload isn't retried here - a retry error is returned instead
// so that the caller can decide to try again.
func (o *FsObjectDrive) Update(in io.Reader, modTime time.Time, size int64) error {
// Only the modified date is filled in
updateInfo := &drive.File{
ModifiedDate: modTime.Format(timeFormatOut),
// Make the API request to upload metadata and file data.
in = &fs.SeekWrapper{In: in, Size: size}
var err error
var info *drive.File
// Don't retry, return a retry error instead
info, err =, updateInfo).SetModifiedDate(true).Media(in).Do()
if {
return fs.RetryErrorf("Update failed - retry: %s", err)
if err != nil {
return fmt.Errorf("Update failed: %s", err)
return nil
// Remove an object
//
// The error from the operation is returned.
func (o *FsObjectDrive) Remove() error {
var err error
|, func() {
err =
return err
// Check the interfaces are satisfied
//
// These assignments make the compiler check that FsDrive implements
// fs.Fs and fs.Purger and that FsObjectDrive implements fs.Object.
var _ fs.Fs = &FsDrive{}
var _ fs.Purger = &FsDrive{}
var _ fs.Object = &FsObjectDrive{}