2021-03-31 18:24:41 +00:00
|
|
|
package downloader
|
2019-12-13 16:02:48 +00:00
|
|
|
|
|
|
|
import (
|
2021-03-31 18:24:41 +00:00
|
|
|
"context"
|
2021-04-29 15:32:01 +00:00
|
|
|
"errors"
|
|
|
|
"fmt"
|
2019-12-13 16:02:48 +00:00
|
|
|
"io"
|
|
|
|
"net/http"
|
2020-02-04 11:02:29 +00:00
|
|
|
"path"
|
2019-12-13 16:02:48 +00:00
|
|
|
"strconv"
|
2020-11-09 13:43:23 +00:00
|
|
|
"strings"
|
2020-02-14 10:06:43 +00:00
|
|
|
"time"
|
2019-12-13 16:02:48 +00:00
|
|
|
|
2021-05-28 08:57:28 +00:00
|
|
|
"github.com/nspcc-dev/neofs-api-go/pkg/client"
|
2021-06-04 12:55:56 +00:00
|
|
|
cid "github.com/nspcc-dev/neofs-api-go/pkg/container/id"
|
2020-11-09 13:43:23 +00:00
|
|
|
"github.com/nspcc-dev/neofs-api-go/pkg/object"
|
2021-05-18 11:18:50 +00:00
|
|
|
"github.com/nspcc-dev/neofs-http-gw/tokens"
|
2021-05-28 20:24:04 +00:00
|
|
|
"github.com/nspcc-dev/neofs-sdk-go/pkg/pool"
|
2020-02-28 17:03:56 +00:00
|
|
|
"github.com/valyala/fasthttp"
|
2019-12-13 16:02:48 +00:00
|
|
|
"go.uber.org/zap"
|
2020-04-22 10:34:48 +00:00
|
|
|
"google.golang.org/grpc/codes"
|
|
|
|
"google.golang.org/grpc/status"
|
2019-12-13 16:02:48 +00:00
|
|
|
)
|
|
|
|
|
2020-12-03 15:00:43 +00:00
|
|
|
type (
|
|
|
|
detector struct {
|
2021-06-23 10:51:53 +00:00
|
|
|
io.Reader
|
|
|
|
err error
|
2020-12-03 15:00:43 +00:00
|
|
|
contentType string
|
2021-06-23 10:51:53 +00:00
|
|
|
done chan struct{}
|
|
|
|
data []byte
|
2020-12-03 15:00:43 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
request struct {
|
|
|
|
*fasthttp.RequestCtx
|
2021-05-28 08:57:28 +00:00
|
|
|
log *zap.Logger
|
2020-12-03 15:00:43 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
objectIDs []*object.ID
|
2021-06-23 10:51:53 +00:00
|
|
|
|
|
|
|
errReader struct {
|
|
|
|
data []byte
|
|
|
|
err error
|
|
|
|
offset int
|
|
|
|
}
|
2020-12-03 15:00:43 +00:00
|
|
|
)
|
2020-11-09 13:43:23 +00:00
|
|
|
|
2021-06-23 10:51:53 +00:00
|
|
|
func newReader(data []byte, err error) *errReader {
|
|
|
|
return &errReader{data: data, err: err}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *errReader) Read(b []byte) (int, error) {
|
|
|
|
if r.offset >= len(r.data) {
|
|
|
|
return 0, io.EOF
|
|
|
|
}
|
|
|
|
n := copy(b, r.data[r.offset:])
|
|
|
|
r.offset += n
|
|
|
|
if r.offset >= len(r.data) {
|
|
|
|
return n, r.err
|
|
|
|
}
|
|
|
|
return n, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// contentTypeDetectSize is the size, in bytes, of the buffer newDetector
// allocates for content-type sniffing.
const contentTypeDetectSize = 512
|
|
|
|
|
|
|
|
func newDetector() *detector {
|
|
|
|
return &detector{done: make(chan struct{}), data: make([]byte, contentTypeDetectSize)}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *detector) Wait() {
|
|
|
|
<-d.done
|
2020-11-09 13:43:23 +00:00
|
|
|
}
|
|
|
|
|
2021-06-23 10:51:53 +00:00
|
|
|
func (d *detector) SetReader(reader io.Reader) {
|
|
|
|
d.Reader = reader
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *detector) Detect() {
|
|
|
|
n, err := d.Reader.Read(d.data)
|
|
|
|
if err != nil && err != io.EOF {
|
|
|
|
d.err = err
|
|
|
|
return
|
|
|
|
}
|
|
|
|
d.data = d.data[:n]
|
|
|
|
d.contentType = http.DetectContentType(d.data)
|
|
|
|
close(d.done)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *detector) MultiReader() io.Reader {
|
|
|
|
return io.MultiReader(newReader(d.data, d.err), d.Reader)
|
2020-11-09 13:43:23 +00:00
|
|
|
}
|
|
|
|
|
2021-04-29 20:46:38 +00:00
|
|
|
// isValidToken reports whether s consists solely of characters allowed in an
// HTTP token: visible ASCII (0x21..0x7E) excluding the separator characters
// ()<>@,;:\"/[]?={}. Space, control characters (including DEL, 0x7F) and any
// non-ASCII rune make the string invalid. An empty string is accepted.
func isValidToken(s string) bool {
	for _, c := range s {
		// c >= 127 also rejects DEL, which is a control character.
		if c <= ' ' || c >= 127 {
			return false
		}
		if strings.ContainsRune("()<>@,;:\\\"/[]?={}", c) {
			return false
		}
	}
	return true
}
|
|
|
|
|
|
|
|
// isValidValue reports whether s can be emitted as a header value without any
// escaping: every rune must be printable ASCII (space through '~') and must
// not be a double quote. Control characters (including DEL, 0x7F) and
// non-ASCII runes are rejected. An empty string is accepted.
func isValidValue(s string) bool {
	for _, c := range s {
		// HTTP specification allows for more technically, but we don't want to escape things.
		// c >= 127 also rejects DEL, which is a control character.
		if c < ' ' || c >= 127 || c == '"' {
			return false
		}
	}
	return true
}
|
|
|
|
|
2021-06-15 08:28:30 +00:00
|
|
|
func (r *request) receiveFile(clnt client.Object, objectAddress *object.Address) {
|
2019-12-13 16:02:48 +00:00
|
|
|
var (
|
2020-12-03 15:00:43 +00:00
|
|
|
err error
|
|
|
|
dis = "inline"
|
|
|
|
start = time.Now()
|
2020-11-09 13:43:23 +00:00
|
|
|
filename string
|
2021-05-28 08:57:28 +00:00
|
|
|
obj *object.Object
|
2019-12-13 16:02:48 +00:00
|
|
|
)
|
2021-03-31 16:58:42 +00:00
|
|
|
if err = tokens.StoreBearerToken(r.RequestCtx); err != nil {
|
2021-03-30 22:46:33 +00:00
|
|
|
r.log.Error("could not fetch and store bearer token", zap.Error(err))
|
|
|
|
r.Error("could not fetch and store bearer token", fasthttp.StatusBadRequest)
|
2021-02-16 15:20:15 +00:00
|
|
|
return
|
|
|
|
}
|
2021-06-23 10:51:53 +00:00
|
|
|
readDetector := newDetector()
|
2021-05-28 08:57:28 +00:00
|
|
|
options := new(client.GetObjectParams).
|
|
|
|
WithAddress(objectAddress).
|
2021-06-23 10:51:53 +00:00
|
|
|
WithPayloadReaderHandler(func(reader io.Reader) {
|
|
|
|
readDetector.SetReader(reader)
|
|
|
|
readDetector.Detect()
|
|
|
|
})
|
2021-05-28 08:57:28 +00:00
|
|
|
|
|
|
|
obj, err = clnt.GetObject(
|
|
|
|
r.RequestCtx,
|
|
|
|
options,
|
|
|
|
)
|
2020-11-09 13:43:23 +00:00
|
|
|
if err != nil {
|
2021-03-30 22:46:33 +00:00
|
|
|
r.log.Error(
|
|
|
|
"could not receive object",
|
2020-02-25 15:35:46 +00:00
|
|
|
zap.Stringer("elapsed", time.Since(start)),
|
2021-03-30 22:46:33 +00:00
|
|
|
zap.Error(err),
|
|
|
|
)
|
2020-04-22 10:34:48 +00:00
|
|
|
var (
|
2021-04-29 15:32:01 +00:00
|
|
|
msg = fmt.Sprintf("could not receive object: %v", err)
|
|
|
|
code = fasthttp.StatusBadRequest
|
|
|
|
cause = err
|
2020-04-22 10:34:48 +00:00
|
|
|
)
|
2021-04-29 15:32:01 +00:00
|
|
|
for unwrap := errors.Unwrap(err); unwrap != nil; unwrap = errors.Unwrap(cause) {
|
|
|
|
cause = unwrap
|
|
|
|
}
|
|
|
|
if st, ok := status.FromError(cause); ok && st != nil {
|
2020-04-22 10:34:48 +00:00
|
|
|
if st.Code() == codes.NotFound {
|
|
|
|
code = fasthttp.StatusNotFound
|
|
|
|
}
|
|
|
|
msg = st.Message()
|
2019-12-13 16:02:48 +00:00
|
|
|
}
|
2020-12-03 15:00:43 +00:00
|
|
|
r.Error(msg, code)
|
2020-02-28 17:03:56 +00:00
|
|
|
return
|
2019-12-13 16:02:48 +00:00
|
|
|
}
|
2020-12-03 15:00:43 +00:00
|
|
|
if r.Request.URI().QueryArgs().GetBool("download") {
|
|
|
|
dis = "attachment"
|
2020-11-09 13:43:23 +00:00
|
|
|
}
|
2021-06-23 10:51:53 +00:00
|
|
|
r.Response.SetBodyStream(readDetector.MultiReader(), int(obj.PayloadSize()))
|
2020-12-03 15:00:43 +00:00
|
|
|
r.Response.Header.Set("Content-Length", strconv.FormatUint(obj.PayloadSize(), 10))
|
2021-06-23 10:51:53 +00:00
|
|
|
var contentType string
|
2020-11-23 09:32:03 +00:00
|
|
|
for _, attr := range obj.Attributes() {
|
|
|
|
key := attr.Key()
|
|
|
|
val := attr.Value()
|
2021-04-29 20:46:38 +00:00
|
|
|
if !isValidToken(key) || !isValidValue(val) {
|
|
|
|
continue
|
|
|
|
}
|
2021-04-30 09:55:51 +00:00
|
|
|
r.Response.Header.Set("X-Attribute-"+key, val)
|
2020-11-23 09:32:03 +00:00
|
|
|
switch key {
|
|
|
|
case object.AttributeFileName:
|
2020-11-09 13:43:23 +00:00
|
|
|
filename = val
|
2020-11-23 09:32:03 +00:00
|
|
|
case object.AttributeTimestamp:
|
|
|
|
value, err := strconv.ParseInt(val, 10, 64)
|
|
|
|
if err != nil {
|
2020-12-03 15:00:43 +00:00
|
|
|
r.log.Info("couldn't parse creation date",
|
2020-11-23 09:32:03 +00:00
|
|
|
zap.String("key", key),
|
|
|
|
zap.String("val", val),
|
|
|
|
zap.Error(err))
|
|
|
|
continue
|
|
|
|
}
|
2020-12-03 15:00:43 +00:00
|
|
|
r.Response.Header.Set("Last-Modified",
|
2020-11-23 09:32:03 +00:00
|
|
|
time.Unix(value, 0).Format(time.RFC1123))
|
2021-06-21 13:56:51 +00:00
|
|
|
case object.AttributeContentType:
|
2021-06-23 10:51:53 +00:00
|
|
|
contentType = val
|
2020-02-28 17:03:56 +00:00
|
|
|
}
|
2020-11-09 13:43:23 +00:00
|
|
|
}
|
2021-04-29 20:09:37 +00:00
|
|
|
r.Response.Header.Set("x-object-id", obj.ID().String())
|
|
|
|
r.Response.Header.Set("x-owner-id", obj.OwnerID().String())
|
|
|
|
r.Response.Header.Set("x-container-id", obj.ContainerID().String())
|
2021-06-23 10:51:53 +00:00
|
|
|
|
|
|
|
if len(contentType) == 0 {
|
|
|
|
if readDetector.err != nil {
|
|
|
|
r.log.Error("could not read object", zap.Error(err))
|
|
|
|
r.Error("could not read object", fasthttp.StatusBadRequest)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
readDetector.Wait()
|
|
|
|
contentType = readDetector.contentType
|
|
|
|
}
|
|
|
|
r.SetContentType(contentType)
|
|
|
|
|
2020-12-03 15:00:43 +00:00
|
|
|
r.Response.Header.Set("Content-Disposition", dis+"; filename="+path.Base(filename))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (o objectIDs) Slice() []string {
|
|
|
|
res := make([]string, 0, len(o))
|
|
|
|
for _, oid := range o {
|
|
|
|
res = append(res, oid.String())
|
|
|
|
}
|
|
|
|
return res
|
|
|
|
}
|
|
|
|
|
2021-05-13 12:22:03 +00:00
|
|
|
// Downloader is a download request handler.
|
2021-03-31 18:24:41 +00:00
|
|
|
type Downloader struct {
|
2021-05-28 20:24:04 +00:00
|
|
|
log *zap.Logger
|
|
|
|
pool pool.Pool
|
2021-03-31 18:24:41 +00:00
|
|
|
}
|
|
|
|
|
2021-05-13 12:22:03 +00:00
|
|
|
// New creates an instance of Downloader using specified options.
|
2021-05-28 20:24:04 +00:00
|
|
|
func New(ctx context.Context, log *zap.Logger, conns pool.Pool) (*Downloader, error) {
|
2021-03-31 18:24:41 +00:00
|
|
|
var err error
|
2021-05-28 20:24:04 +00:00
|
|
|
d := &Downloader{log: log, pool: conns}
|
2021-03-31 18:24:41 +00:00
|
|
|
if err != nil {
|
2021-04-29 15:32:01 +00:00
|
|
|
return nil, fmt.Errorf("failed to get neofs client's reusable artifacts: %w", err)
|
2021-03-31 18:24:41 +00:00
|
|
|
}
|
|
|
|
return d, nil
|
|
|
|
}
|
|
|
|
|
2021-04-07 12:54:30 +00:00
|
|
|
func (d *Downloader) newRequest(ctx *fasthttp.RequestCtx, log *zap.Logger) *request {
|
2020-12-03 15:00:43 +00:00
|
|
|
return &request{
|
2021-05-28 08:57:28 +00:00
|
|
|
RequestCtx: ctx,
|
|
|
|
log: log,
|
2020-12-03 15:00:43 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-05-13 12:22:03 +00:00
|
|
|
// DownloadByAddress handles download requests using simple cid/oid format.
|
2021-04-07 12:54:30 +00:00
|
|
|
func (d *Downloader) DownloadByAddress(c *fasthttp.RequestCtx) {
|
2020-12-03 15:00:43 +00:00
|
|
|
var (
|
2021-03-30 22:46:33 +00:00
|
|
|
err error
|
|
|
|
address = object.NewAddress()
|
|
|
|
cid, _ = c.UserValue("cid").(string)
|
|
|
|
oid, _ = c.UserValue("oid").(string)
|
|
|
|
val = strings.Join([]string{cid, oid}, "/")
|
2021-04-07 12:54:30 +00:00
|
|
|
log = d.log.With(zap.String("cid", cid), zap.String("oid", oid))
|
2020-12-03 15:00:43 +00:00
|
|
|
)
|
2021-03-30 22:46:33 +00:00
|
|
|
if err = address.Parse(val); err != nil {
|
2020-12-03 15:00:43 +00:00
|
|
|
log.Error("wrong object address", zap.Error(err))
|
|
|
|
c.Error("wrong object address", fasthttp.StatusBadRequest)
|
|
|
|
return
|
|
|
|
}
|
2021-05-28 08:57:28 +00:00
|
|
|
|
2021-06-15 08:28:30 +00:00
|
|
|
d.newRequest(c, log).receiveFile(d.pool, address)
|
2020-12-03 15:00:43 +00:00
|
|
|
}
|
|
|
|
|
2021-05-13 12:22:03 +00:00
|
|
|
// DownloadByAttribute handles attribute-based download requests.
|
2021-04-07 12:54:30 +00:00
|
|
|
func (d *Downloader) DownloadByAttribute(c *fasthttp.RequestCtx) {
|
2020-12-03 15:00:43 +00:00
|
|
|
var (
|
|
|
|
err error
|
2021-03-30 22:46:33 +00:00
|
|
|
scid, _ = c.UserValue("cid").(string)
|
2020-12-03 15:00:43 +00:00
|
|
|
key, _ = c.UserValue("attr_key").(string)
|
|
|
|
val, _ = c.UserValue("attr_val").(string)
|
2021-04-07 12:54:30 +00:00
|
|
|
log = d.log.With(zap.String("cid", scid), zap.String("attr_key", key), zap.String("attr_val", val))
|
2021-05-28 08:57:28 +00:00
|
|
|
ids []*object.ID
|
2020-12-03 15:00:43 +00:00
|
|
|
)
|
2021-06-04 12:55:56 +00:00
|
|
|
cid := cid.New()
|
2021-03-30 22:46:33 +00:00
|
|
|
if err = cid.Parse(scid); err != nil {
|
2020-12-03 15:00:43 +00:00
|
|
|
log.Error("wrong container id", zap.Error(err))
|
|
|
|
c.Error("wrong container id", fasthttp.StatusBadRequest)
|
|
|
|
return
|
2021-03-30 22:46:33 +00:00
|
|
|
}
|
2021-05-28 08:57:28 +00:00
|
|
|
|
|
|
|
options := object.NewSearchFilters()
|
|
|
|
options.AddRootFilter()
|
|
|
|
options.AddFilter(key, val, object.MatchStringEqual)
|
|
|
|
|
|
|
|
sops := new(client.SearchObjectParams).WithContainerID(cid).WithSearchFilters(options)
|
2021-06-15 08:28:30 +00:00
|
|
|
if ids, err = d.pool.SearchObject(c, sops); err != nil {
|
2020-12-03 15:00:43 +00:00
|
|
|
log.Error("something went wrong", zap.Error(err))
|
|
|
|
c.Error("something went wrong", fasthttp.StatusBadRequest)
|
|
|
|
return
|
|
|
|
} else if len(ids) == 0 {
|
2021-01-23 13:28:12 +00:00
|
|
|
log.Debug("object not found")
|
2021-03-30 22:46:33 +00:00
|
|
|
c.Error("object not found", fasthttp.StatusNotFound)
|
2020-12-03 15:00:43 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
if len(ids) > 1 {
|
|
|
|
log.Debug("found multiple objects",
|
|
|
|
zap.Strings("object_ids", objectIDs(ids).Slice()),
|
|
|
|
zap.Stringer("show_object_id", ids[0]))
|
|
|
|
}
|
2021-03-30 22:46:33 +00:00
|
|
|
address := object.NewAddress()
|
|
|
|
address.SetContainerID(cid)
|
|
|
|
address.SetObjectID(ids[0])
|
2021-05-28 08:57:28 +00:00
|
|
|
|
2021-06-15 08:28:30 +00:00
|
|
|
d.newRequest(c, log).receiveFile(d.pool, address)
|
2019-12-13 16:02:48 +00:00
|
|
|
}
|