2018-05-28 06:53:10 +00:00
|
|
|
package weed_server
|
|
|
|
|
|
|
|
import (
|
2019-03-15 22:55:34 +00:00
|
|
|
"context"
|
2020-04-08 15:12:00 +00:00
|
|
|
"crypto/md5"
|
2020-08-08 17:45:37 +00:00
|
|
|
"hash"
|
2018-05-28 06:53:10 +00:00
|
|
|
"io"
|
2020-04-08 15:12:00 +00:00
|
|
|
"io/ioutil"
|
2018-05-28 06:53:10 +00:00
|
|
|
"net/http"
|
2020-08-08 19:02:06 +00:00
|
|
|
"os"
|
2018-05-28 06:53:10 +00:00
|
|
|
"path"
|
|
|
|
"strconv"
|
2018-07-22 00:47:59 +00:00
|
|
|
"strings"
|
2018-05-28 06:59:49 +00:00
|
|
|
"time"
|
|
|
|
|
2020-09-01 07:21:19 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/filer"
|
2018-05-28 06:53:10 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/operation"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/pb/filer_pb"
|
2019-02-15 08:09:19 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/security"
|
2019-06-23 05:53:52 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/stats"
|
2020-03-23 07:01:34 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/util"
|
2018-05-28 06:53:10 +00:00
|
|
|
)
|
|
|
|
|
2019-03-18 07:35:15 +00:00
|
|
|
func (fs *FilerServer) autoChunk(ctx context.Context, w http.ResponseWriter, r *http.Request,
|
2020-08-08 19:02:06 +00:00
|
|
|
replication string, collection string, dataCenter string, ttlSec int32, ttlString string, fsync bool) {
|
2018-05-28 06:53:10 +00:00
|
|
|
|
|
|
|
// autoChunking can be set at the command-line level or as a query param. Query param overrides command-line
|
|
|
|
query := r.URL.Query()
|
|
|
|
|
|
|
|
parsedMaxMB, _ := strconv.ParseInt(query.Get("maxMB"), 10, 32)
|
|
|
|
maxMB := int32(parsedMaxMB)
|
2018-07-07 09:18:47 +00:00
|
|
|
if maxMB <= 0 && fs.option.MaxMB > 0 {
|
|
|
|
maxMB = int32(fs.option.MaxMB)
|
2018-05-28 06:53:10 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
chunkSize := 1024 * 1024 * maxMB
|
|
|
|
|
2020-08-08 17:45:37 +00:00
|
|
|
stats.FilerRequestCounter.WithLabelValues("postAutoChunk").Inc()
|
|
|
|
start := time.Now()
|
|
|
|
defer func() {
|
|
|
|
stats.FilerRequestHistogram.WithLabelValues("postAutoChunk").Observe(time.Since(start).Seconds())
|
|
|
|
}()
|
|
|
|
|
|
|
|
var reply *FilerPostResult
|
|
|
|
var err error
|
2020-08-08 19:02:06 +00:00
|
|
|
var md5bytes []byte
|
2020-08-08 17:45:37 +00:00
|
|
|
if r.Method == "POST" {
|
2020-08-08 19:02:06 +00:00
|
|
|
reply, md5bytes, err = fs.doPostAutoChunk(ctx, w, r, chunkSize, replication, collection, dataCenter, ttlSec, ttlString, fsync)
|
2020-08-08 17:45:37 +00:00
|
|
|
} else {
|
2020-08-08 19:02:06 +00:00
|
|
|
reply, md5bytes, err = fs.doPutAutoChunk(ctx, w, r, chunkSize, replication, collection, dataCenter, ttlSec, ttlString, fsync)
|
2020-08-08 17:45:37 +00:00
|
|
|
}
|
2018-05-28 06:53:10 +00:00
|
|
|
if err != nil {
|
|
|
|
writeJsonError(w, r, http.StatusInternalServerError, err)
|
|
|
|
} else if reply != nil {
|
2020-08-08 19:02:06 +00:00
|
|
|
if len(md5bytes) > 0 {
|
|
|
|
w.Header().Set("Content-MD5", util.Base64Encode(md5bytes))
|
|
|
|
}
|
2018-05-28 06:53:10 +00:00
|
|
|
writeJsonQuiet(w, r, http.StatusCreated, reply)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
func (fs *FilerServer) doPostAutoChunk(ctx context.Context, w http.ResponseWriter, r *http.Request, chunkSize int32, replication string, collection string, dataCenter string, ttlSec int32, ttlString string, fsync bool) (filerResult *FilerPostResult, md5bytes []byte, replyerr error) {
|
2018-05-28 06:53:10 +00:00
|
|
|
|
|
|
|
multipartReader, multipartReaderErr := r.MultipartReader()
|
|
|
|
if multipartReaderErr != nil {
|
2020-08-08 19:02:06 +00:00
|
|
|
return nil, nil, multipartReaderErr
|
2018-05-28 06:53:10 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
part1, part1Err := multipartReader.NextPart()
|
|
|
|
if part1Err != nil {
|
2020-08-08 19:02:06 +00:00
|
|
|
return nil, nil, part1Err
|
2018-05-28 06:53:10 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fileName := part1.FileName()
|
|
|
|
if fileName != "" {
|
|
|
|
fileName = path.Base(fileName)
|
|
|
|
}
|
2020-03-09 04:39:33 +00:00
|
|
|
contentType := part1.Header.Get("Content-Type")
|
2020-08-08 17:45:37 +00:00
|
|
|
if contentType == "application/octet-stream" {
|
|
|
|
contentType = ""
|
|
|
|
}
|
2020-03-09 04:39:33 +00:00
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
fileChunks, md5Hash, chunkOffset, err := fs.uploadReaderToChunks(w, r, part1, chunkSize, replication, collection, dataCenter, ttlString, fileName, contentType, fsync)
|
2020-08-08 17:45:37 +00:00
|
|
|
if err != nil {
|
2020-08-08 19:02:06 +00:00
|
|
|
return nil, nil, err
|
2020-08-08 17:45:37 +00:00
|
|
|
}
|
2018-05-28 06:53:10 +00:00
|
|
|
|
2020-09-01 07:21:19 +00:00
|
|
|
fileChunks, replyerr = filer.MaybeManifestize(fs.saveAsChunk(replication, collection, dataCenter, ttlString, fsync), fileChunks)
|
2020-08-08 17:45:37 +00:00
|
|
|
if replyerr != nil {
|
|
|
|
glog.V(0).Infof("manifestize %s: %v", r.RequestURI, replyerr)
|
|
|
|
return
|
|
|
|
}
|
2018-05-28 06:53:10 +00:00
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
md5bytes = md5Hash.Sum(nil)
|
|
|
|
filerResult, replyerr = fs.saveMetaData(ctx, r, fileName, replication, collection, ttlSec, contentType, md5bytes, fileChunks, chunkOffset)
|
2018-05-28 06:53:10 +00:00
|
|
|
|
2020-08-08 17:45:37 +00:00
|
|
|
return
|
|
|
|
}
|
2018-05-28 06:53:10 +00:00
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
func (fs *FilerServer) doPutAutoChunk(ctx context.Context, w http.ResponseWriter, r *http.Request, chunkSize int32, replication string, collection string, dataCenter string, ttlSec int32, ttlString string, fsync bool) (filerResult *FilerPostResult, md5bytes []byte, replyerr error) {
|
2020-02-04 01:04:06 +00:00
|
|
|
|
2020-08-08 17:45:37 +00:00
|
|
|
fileName := ""
|
|
|
|
contentType := ""
|
2020-03-03 04:27:14 +00:00
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
fileChunks, md5Hash, chunkOffset, err := fs.uploadReaderToChunks(w, r, r.Body, chunkSize, replication, collection, dataCenter, ttlString, fileName, contentType, fsync)
|
2020-08-08 17:45:37 +00:00
|
|
|
if err != nil {
|
2020-08-08 19:02:06 +00:00
|
|
|
return nil, nil, err
|
2018-05-28 06:53:10 +00:00
|
|
|
}
|
|
|
|
|
2020-09-01 07:21:19 +00:00
|
|
|
fileChunks, replyerr = filer.MaybeManifestize(fs.saveAsChunk(replication, collection, dataCenter, ttlString, fsync), fileChunks)
|
2020-07-20 00:59:43 +00:00
|
|
|
if replyerr != nil {
|
|
|
|
glog.V(0).Infof("manifestize %s: %v", r.RequestURI, replyerr)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
md5bytes = md5Hash.Sum(nil)
|
|
|
|
filerResult, replyerr = fs.saveMetaData(ctx, r, fileName, replication, collection, ttlSec, contentType, md5bytes, fileChunks, chunkOffset)
|
2020-08-08 17:45:37 +00:00
|
|
|
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
func (fs *FilerServer) saveMetaData(ctx context.Context, r *http.Request, fileName string, replication string, collection string, ttlSec int32, contentType string, md5bytes []byte, fileChunks []*filer_pb.FileChunk, chunkOffset int64) (filerResult *FilerPostResult, replyerr error) {
|
|
|
|
|
|
|
|
// detect file mode
|
|
|
|
modeStr := r.URL.Query().Get("mode")
|
|
|
|
if modeStr == "" {
|
|
|
|
modeStr = "0660"
|
|
|
|
}
|
|
|
|
mode, err := strconv.ParseUint(modeStr, 8, 32)
|
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("Invalid mode format: %s, use 0660 by default", modeStr)
|
|
|
|
mode = 0660
|
|
|
|
}
|
|
|
|
|
|
|
|
// fix the path
|
2018-05-28 06:53:10 +00:00
|
|
|
path := r.URL.Path
|
2018-07-22 00:47:59 +00:00
|
|
|
if strings.HasSuffix(path, "/") {
|
|
|
|
if fileName != "" {
|
|
|
|
path += fileName
|
2018-05-28 06:53:10 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
// fix the crTime
|
|
|
|
existingEntry, err := fs.filer.FindEntry(ctx, util.FullPath(path))
|
|
|
|
crTime := time.Now()
|
|
|
|
if err == nil && existingEntry != nil {
|
|
|
|
crTime = existingEntry.Crtime
|
|
|
|
}
|
|
|
|
|
2018-05-28 06:53:10 +00:00
|
|
|
glog.V(4).Infoln("saving", path)
|
2020-09-01 07:21:19 +00:00
|
|
|
entry := &filer.Entry{
|
2020-03-23 07:01:34 +00:00
|
|
|
FullPath: util.FullPath(path),
|
2020-09-01 07:21:19 +00:00
|
|
|
Attr: filer.Attr{
|
2018-06-10 23:57:32 +00:00
|
|
|
Mtime: time.Now(),
|
2020-08-08 19:02:06 +00:00
|
|
|
Crtime: crTime,
|
|
|
|
Mode: os.FileMode(mode),
|
2018-07-22 00:47:59 +00:00
|
|
|
Uid: OS_UID,
|
|
|
|
Gid: OS_GID,
|
2018-06-10 23:57:32 +00:00
|
|
|
Replication: replication,
|
|
|
|
Collection: collection,
|
2020-03-09 07:16:10 +00:00
|
|
|
TtlSec: ttlSec,
|
2020-03-09 04:39:33 +00:00
|
|
|
Mime: contentType,
|
2020-08-08 19:02:06 +00:00
|
|
|
Md5: md5bytes,
|
2018-05-28 06:53:10 +00:00
|
|
|
},
|
|
|
|
Chunks: fileChunks,
|
|
|
|
}
|
2020-02-04 01:04:06 +00:00
|
|
|
|
|
|
|
filerResult = &FilerPostResult{
|
|
|
|
Name: fileName,
|
|
|
|
Size: chunkOffset,
|
|
|
|
}
|
|
|
|
|
2020-08-29 06:48:48 +00:00
|
|
|
if dbErr := fs.filer.CreateEntry(ctx, entry, false, false, nil); dbErr != nil {
|
2019-12-13 08:23:05 +00:00
|
|
|
fs.filer.DeleteChunks(entry.Chunks)
|
2019-06-23 05:53:52 +00:00
|
|
|
replyerr = dbErr
|
|
|
|
filerResult.Error = dbErr.Error()
|
|
|
|
glog.V(0).Infof("failing to write %s to filer server : %v", path, dbErr)
|
2018-05-28 06:53:10 +00:00
|
|
|
}
|
2020-08-08 17:45:37 +00:00
|
|
|
return filerResult, replyerr
|
|
|
|
}
|
2018-05-28 06:53:10 +00:00
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
func (fs *FilerServer) uploadReaderToChunks(w http.ResponseWriter, r *http.Request, reader io.Reader, chunkSize int32, replication string, collection string, dataCenter string, ttlString string, fileName string, contentType string, fsync bool) ([]*filer_pb.FileChunk, hash.Hash, int64, error) {
|
2020-08-08 17:45:37 +00:00
|
|
|
var fileChunks []*filer_pb.FileChunk
|
|
|
|
|
|
|
|
md5Hash := md5.New()
|
|
|
|
var partReader = ioutil.NopCloser(io.TeeReader(reader, md5Hash))
|
|
|
|
|
|
|
|
chunkOffset := int64(0)
|
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
for {
|
2020-08-08 17:45:37 +00:00
|
|
|
limitedReader := io.LimitReader(partReader, int64(chunkSize))
|
|
|
|
|
|
|
|
// assign one file id for one chunk
|
|
|
|
fileId, urlLocation, auth, assignErr := fs.assignNewFileInfo(replication, collection, dataCenter, ttlString, fsync)
|
|
|
|
if assignErr != nil {
|
|
|
|
return nil, nil, 0, assignErr
|
|
|
|
}
|
|
|
|
|
|
|
|
// upload the chunk to the volume server
|
|
|
|
uploadResult, uploadErr := fs.doUpload(urlLocation, w, r, limitedReader, fileName, contentType, nil, auth)
|
|
|
|
if uploadErr != nil {
|
|
|
|
return nil, nil, 0, uploadErr
|
|
|
|
}
|
|
|
|
|
|
|
|
// if last chunk exhausted the reader exactly at the border
|
|
|
|
if uploadResult.Size == 0 {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
|
|
|
|
// Save to chunk manifest structure
|
|
|
|
fileChunks = append(fileChunks, uploadResult.ToPbFileChunk(fileId, chunkOffset))
|
|
|
|
|
2020-08-08 19:02:06 +00:00
|
|
|
glog.V(4).Infof("uploaded %s chunk %d to %s [%d,%d)", fileName, len(fileChunks), fileId, chunkOffset, chunkOffset+int64(uploadResult.Size))
|
2020-08-08 17:45:37 +00:00
|
|
|
|
|
|
|
// reset variables for the next chunk
|
|
|
|
chunkOffset = chunkOffset + int64(uploadResult.Size)
|
|
|
|
|
|
|
|
// if last chunk was not at full chunk size, but already exhausted the reader
|
|
|
|
if int64(uploadResult.Size) < int64(chunkSize) {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return fileChunks, md5Hash, chunkOffset, nil
|
2018-05-28 06:53:10 +00:00
|
|
|
}
|
|
|
|
|
2020-03-08 22:42:44 +00:00
|
|
|
func (fs *FilerServer) doUpload(urlLocation string, w http.ResponseWriter, r *http.Request, limitedReader io.Reader, fileName string, contentType string, pairMap map[string]string, auth security.EncodedJwt) (*operation.UploadResult, error) {
|
2018-05-28 06:53:10 +00:00
|
|
|
|
2019-06-23 05:53:52 +00:00
|
|
|
stats.FilerRequestCounter.WithLabelValues("postAutoChunkUpload").Inc()
|
|
|
|
start := time.Now()
|
2019-06-23 08:57:51 +00:00
|
|
|
defer func() {
|
|
|
|
stats.FilerRequestHistogram.WithLabelValues("postAutoChunkUpload").Observe(time.Since(start).Seconds())
|
|
|
|
}()
|
2019-06-23 05:53:52 +00:00
|
|
|
|
2020-03-28 20:41:58 +00:00
|
|
|
uploadResult, err, _ := operation.Upload(urlLocation, fileName, fs.option.Cipher, limitedReader, false, contentType, pairMap, auth)
|
|
|
|
return uploadResult, err
|
2018-05-28 06:53:10 +00:00
|
|
|
}
|
2020-07-20 00:59:43 +00:00
|
|
|
|
2020-09-01 07:21:19 +00:00
|
|
|
func (fs *FilerServer) saveAsChunk(replication string, collection string, dataCenter string, ttlString string, fsync bool) filer.SaveDataAsChunkFunctionType {
|
2020-07-20 00:59:43 +00:00
|
|
|
|
|
|
|
return func(reader io.Reader, name string, offset int64) (*filer_pb.FileChunk, string, string, error) {
|
|
|
|
// assign one file id for one chunk
|
|
|
|
fileId, urlLocation, auth, assignErr := fs.assignNewFileInfo(replication, collection, dataCenter, ttlString, fsync)
|
|
|
|
if assignErr != nil {
|
|
|
|
return nil, "", "", assignErr
|
|
|
|
}
|
|
|
|
|
|
|
|
// upload the chunk to the volume server
|
|
|
|
uploadResult, uploadErr, _ := operation.Upload(urlLocation, name, fs.option.Cipher, reader, false, "", nil, auth)
|
|
|
|
if uploadErr != nil {
|
|
|
|
return nil, "", "", uploadErr
|
|
|
|
}
|
|
|
|
|
|
|
|
return uploadResult.ToPbFileChunk(fileId, offset), collection, replication, nil
|
|
|
|
}
|
|
|
|
}
|