2018-05-28 19:30:17 +00:00
|
|
|
package filesys
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
|
|
|
"context"
|
2018-07-22 00:39:10 +00:00
|
|
|
"fmt"
|
2020-01-23 07:00:04 +00:00
|
|
|
"io"
|
2019-02-15 17:59:22 +00:00
|
|
|
"sync"
|
2018-07-22 00:39:10 +00:00
|
|
|
"time"
|
2018-05-28 19:30:17 +00:00
|
|
|
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
2018-07-22 00:39:10 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/operation"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/pb/filer_pb"
|
2019-02-15 17:59:22 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/security"
|
2018-05-28 19:30:17 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
type ContinuousDirtyPages struct {
|
2020-02-25 06:28:45 +00:00
|
|
|
intervals *ContinuousIntervals
|
|
|
|
f *File
|
|
|
|
lock sync.Mutex
|
|
|
|
collection string
|
|
|
|
replication string
|
2018-05-28 19:30:17 +00:00
|
|
|
}
|
|
|
|
|
2018-05-29 08:21:21 +00:00
|
|
|
func newDirtyPages(file *File) *ContinuousDirtyPages {
|
|
|
|
return &ContinuousDirtyPages{
|
2020-01-23 07:00:04 +00:00
|
|
|
intervals: &ContinuousIntervals{},
|
|
|
|
f: file,
|
2018-05-28 19:30:17 +00:00
|
|
|
}
|
2018-05-29 08:21:21 +00:00
|
|
|
}
|
2018-05-28 19:30:17 +00:00
|
|
|
|
2018-12-28 11:27:48 +00:00
|
|
|
func (pages *ContinuousDirtyPages) releaseResource() {
|
2018-11-15 06:48:54 +00:00
|
|
|
}
|
|
|
|
|
2019-01-01 10:14:40 +00:00
|
|
|
// counter is a package-level int32 that starts at zero.
// NOTE(review): no use of it is visible in this part of the file — confirm it is still needed.
var counter int32
|
|
|
|
|
2020-02-26 06:23:59 +00:00
|
|
|
func (pages *ContinuousDirtyPages) AddPage(offset int64, data []byte) (chunks []*filer_pb.FileChunk, err error) {
|
2018-05-31 05:02:21 +00:00
|
|
|
|
2018-09-07 20:11:43 +00:00
|
|
|
pages.lock.Lock()
|
|
|
|
defer pages.lock.Unlock()
|
|
|
|
|
2020-01-23 07:00:04 +00:00
|
|
|
glog.V(3).Infof("%s AddPage [%d,%d)", pages.f.fullpath(), offset, offset+int64(len(data)))
|
2018-05-28 19:30:17 +00:00
|
|
|
|
2019-01-01 10:14:40 +00:00
|
|
|
if len(data) > int(pages.f.wfs.option.ChunkSizeLimit) {
|
2018-05-31 05:09:24 +00:00
|
|
|
// this is more than what buffer can hold.
|
2020-02-26 06:23:59 +00:00
|
|
|
return pages.flushAndSave(offset, data)
|
2018-05-28 19:30:17 +00:00
|
|
|
}
|
|
|
|
|
2020-01-26 21:01:11 +00:00
|
|
|
pages.intervals.AddInterval(data, offset)
|
2018-05-28 19:30:17 +00:00
|
|
|
|
2020-01-23 07:00:04 +00:00
|
|
|
var chunk *filer_pb.FileChunk
|
|
|
|
var hasSavedData bool
|
|
|
|
|
|
|
|
if pages.intervals.TotalSize() > pages.f.wfs.option.ChunkSizeLimit {
|
2020-02-26 05:50:12 +00:00
|
|
|
chunk, hasSavedData, err = pages.saveExistingLargestPageToStorage()
|
2020-01-23 07:00:04 +00:00
|
|
|
if hasSavedData {
|
|
|
|
chunks = append(chunks, chunk)
|
2018-09-10 09:39:41 +00:00
|
|
|
}
|
2018-09-07 20:11:43 +00:00
|
|
|
}
|
2018-09-10 09:21:57 +00:00
|
|
|
|
2018-05-28 19:30:17 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2020-02-26 06:23:59 +00:00
|
|
|
func (pages *ContinuousDirtyPages) flushAndSave(offset int64, data []byte) (chunks []*filer_pb.FileChunk, err error) {
|
2018-09-10 09:21:57 +00:00
|
|
|
|
|
|
|
var chunk *filer_pb.FileChunk
|
2020-01-23 07:00:04 +00:00
|
|
|
var newChunks []*filer_pb.FileChunk
|
2018-09-10 09:21:57 +00:00
|
|
|
|
|
|
|
// flush existing
|
2020-02-26 05:50:12 +00:00
|
|
|
if newChunks, err = pages.saveExistingPagesToStorage(); err == nil {
|
2020-01-23 07:00:04 +00:00
|
|
|
if newChunks != nil {
|
|
|
|
chunks = append(chunks, newChunks...)
|
2018-09-10 09:21:57 +00:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// flush the new page
|
2020-02-26 05:50:12 +00:00
|
|
|
if chunk, err = pages.saveToStorage(bytes.NewReader(data), offset, int64(len(data))); err == nil {
|
2018-09-10 09:21:57 +00:00
|
|
|
if chunk != nil {
|
2019-06-21 18:46:12 +00:00
|
|
|
glog.V(4).Infof("%s/%s flush big request [%d,%d) to %s", pages.f.dir.Path, pages.f.Name, chunk.Offset, chunk.Offset+int64(chunk.Size), chunk.FileId)
|
2018-09-10 09:21:57 +00:00
|
|
|
chunks = append(chunks, chunk)
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
glog.V(0).Infof("%s/%s failed to flush2 [%d,%d): %v", pages.f.dir.Path, pages.f.Name, chunk.Offset, chunk.Offset+int64(chunk.Size), err)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
func (pages *ContinuousDirtyPages) FlushToStorage() (chunks []*filer_pb.FileChunk, err error) {
|
2018-05-28 19:30:17 +00:00
|
|
|
|
2018-09-07 20:11:43 +00:00
|
|
|
pages.lock.Lock()
|
|
|
|
defer pages.lock.Unlock()
|
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
return pages.saveExistingPagesToStorage()
|
2020-01-23 07:00:04 +00:00
|
|
|
}
|
2018-05-28 19:30:17 +00:00
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
func (pages *ContinuousDirtyPages) saveExistingPagesToStorage() (chunks []*filer_pb.FileChunk, err error) {
|
2020-01-23 07:00:04 +00:00
|
|
|
|
|
|
|
var hasSavedData bool
|
|
|
|
var chunk *filer_pb.FileChunk
|
|
|
|
|
|
|
|
for {
|
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
chunk, hasSavedData, err = pages.saveExistingLargestPageToStorage()
|
2020-01-23 07:00:04 +00:00
|
|
|
if !hasSavedData {
|
|
|
|
return chunks, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if err == nil {
|
|
|
|
chunks = append(chunks, chunk)
|
|
|
|
} else {
|
|
|
|
return
|
2018-05-28 21:32:16 +00:00
|
|
|
}
|
2018-05-28 19:30:17 +00:00
|
|
|
}
|
2020-01-23 07:00:04 +00:00
|
|
|
|
2018-05-28 19:30:17 +00:00
|
|
|
}
|
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
func (pages *ContinuousDirtyPages) saveExistingLargestPageToStorage() (chunk *filer_pb.FileChunk, hasSavedData bool, err error) {
|
2018-09-07 20:11:43 +00:00
|
|
|
|
2020-01-23 07:00:04 +00:00
|
|
|
maxList := pages.intervals.RemoveLargestIntervalLinkedList()
|
|
|
|
if maxList == nil {
|
|
|
|
return nil, false, nil
|
2018-09-07 20:11:43 +00:00
|
|
|
}
|
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
chunk, err = pages.saveToStorage(maxList.ToReader(), maxList.Offset(), maxList.Size())
|
2020-01-23 07:00:04 +00:00
|
|
|
if err == nil {
|
|
|
|
hasSavedData = true
|
|
|
|
glog.V(3).Infof("%s saveToStorage [%d,%d) %s", pages.f.fullpath(), maxList.Offset(), maxList.Offset()+maxList.Size(), chunk.FileId)
|
|
|
|
} else {
|
|
|
|
glog.V(0).Infof("%s saveToStorage [%d,%d): %v", pages.f.fullpath(), maxList.Offset(), maxList.Offset()+maxList.Size(), err)
|
|
|
|
return
|
|
|
|
}
|
2020-01-21 04:21:01 +00:00
|
|
|
|
2020-01-23 07:00:04 +00:00
|
|
|
return
|
2018-05-31 05:02:21 +00:00
|
|
|
}
|
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
func (pages *ContinuousDirtyPages) saveToStorage(reader io.Reader, offset int64, size int64) (*filer_pb.FileChunk, error) {
|
2018-05-28 19:30:17 +00:00
|
|
|
|
|
|
|
var fileId, host string
|
2019-02-15 17:59:22 +00:00
|
|
|
var auth security.EncodedJwt
|
2018-05-28 19:30:17 +00:00
|
|
|
|
2020-02-25 06:28:45 +00:00
|
|
|
dir, _ := pages.f.fullpath().DirAndName()
|
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
if err := pages.f.wfs.WithFilerClient(func(client filer_pb.SeaweedFilerClient) error {
|
2018-05-28 19:30:17 +00:00
|
|
|
|
|
|
|
request := &filer_pb.AssignVolumeRequest{
|
|
|
|
Count: 1,
|
2018-07-22 08:14:36 +00:00
|
|
|
Replication: pages.f.wfs.option.Replication,
|
|
|
|
Collection: pages.f.wfs.option.Collection,
|
|
|
|
TtlSec: pages.f.wfs.option.TtlSec,
|
|
|
|
DataCenter: pages.f.wfs.option.DataCenter,
|
2020-02-25 06:28:45 +00:00
|
|
|
ParentPath: dir,
|
2018-05-28 19:30:17 +00:00
|
|
|
}
|
|
|
|
|
2020-02-26 05:50:12 +00:00
|
|
|
resp, err := client.AssignVolume(context.Background(), request)
|
2018-05-28 19:30:17 +00:00
|
|
|
if err != nil {
|
|
|
|
glog.V(0).Infof("assign volume failure %v: %v", request, err)
|
|
|
|
return err
|
|
|
|
}
|
2020-02-26 01:15:09 +00:00
|
|
|
if resp.Error != "" {
|
|
|
|
return fmt.Errorf("assign volume failure %v: %v", request, resp.Error)
|
|
|
|
}
|
2018-05-28 19:30:17 +00:00
|
|
|
|
2019-02-15 17:59:22 +00:00
|
|
|
fileId, host, auth = resp.FileId, resp.Url, security.EncodedJwt(resp.Auth)
|
2020-02-27 00:46:01 +00:00
|
|
|
host = pages.f.wfs.AdjustedUrl(host)
|
2020-02-25 06:28:45 +00:00
|
|
|
pages.collection, pages.replication = resp.Collection, resp.Replication
|
2018-05-28 19:30:17 +00:00
|
|
|
|
|
|
|
return nil
|
|
|
|
}); err != nil {
|
2018-06-06 06:37:41 +00:00
|
|
|
return nil, fmt.Errorf("filerGrpcAddress assign volume: %v", err)
|
2018-05-28 19:30:17 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fileUrl := fmt.Sprintf("http://%s/%s", host, fileId)
|
2020-03-06 08:49:47 +00:00
|
|
|
uploadResult, err := operation.Upload(fileUrl, pages.f.Name, pages.f.wfs.option.Cipher, reader, false, "", nil, auth)
|
2018-05-28 19:30:17 +00:00
|
|
|
if err != nil {
|
|
|
|
glog.V(0).Infof("upload data %v to %s: %v", pages.f.Name, fileUrl, err)
|
|
|
|
return nil, fmt.Errorf("upload data: %v", err)
|
|
|
|
}
|
|
|
|
if uploadResult.Error != "" {
|
|
|
|
glog.V(0).Infof("upload failure %v to %s: %v", pages.f.Name, fileUrl, err)
|
|
|
|
return nil, fmt.Errorf("upload result: %v", uploadResult.Error)
|
|
|
|
}
|
|
|
|
|
|
|
|
return &filer_pb.FileChunk{
|
2020-03-06 08:49:47 +00:00
|
|
|
FileId: fileId,
|
|
|
|
Offset: offset,
|
|
|
|
Size: uint64(size),
|
|
|
|
Mtime: time.Now().UnixNano(),
|
|
|
|
ETag: uploadResult.ETag,
|
|
|
|
CipherKey: uploadResult.CipherKey,
|
2020-03-09 04:39:33 +00:00
|
|
|
IsGzipped: uploadResult.Gzip > 0,
|
2018-05-28 19:30:17 +00:00
|
|
|
}, nil
|
|
|
|
|
|
|
|
}
|
2018-05-29 08:21:21 +00:00
|
|
|
|
|
|
|
// max returns the larger of x and y.
func max(x, y int64) int64 {
	if y >= x {
		return y
	}
	return x
}
|
2020-01-22 21:42:03 +00:00
|
|
|
// min returns the smaller of x and y.
func min(x, y int64) int64 {
	if y <= x {
		return y
	}
	return x
}
|
|
|
|
|
2020-02-26 06:23:59 +00:00
|
|
|
func (pages *ContinuousDirtyPages) ReadDirtyData(data []byte, startOffset int64) (offset int64, size int) {
|
2020-01-22 23:38:25 +00:00
|
|
|
|
|
|
|
pages.lock.Lock()
|
|
|
|
defer pages.lock.Unlock()
|
|
|
|
|
2020-01-23 07:00:04 +00:00
|
|
|
return pages.intervals.ReadData(data, startOffset)
|
2020-01-22 21:42:03 +00:00
|
|
|
|
|
|
|
}
|