2020-09-01 07:21:19 +00:00
|
|
|
package filer
|
2020-03-27 11:50:51 +00:00
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"fmt"
|
2020-11-01 10:36:43 +00:00
|
|
|
"io"
|
|
|
|
"math/rand"
|
|
|
|
"sync"
|
|
|
|
|
2022-07-29 07:17:28 +00:00
|
|
|
"github.com/seaweedfs/seaweedfs/weed/glog"
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/pb/filer_pb"
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/util"
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/util/chunk_cache"
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/wdclient"
|
2020-10-11 03:09:43 +00:00
|
|
|
)
|
|
|
|
|
2020-03-27 11:50:51 +00:00
|
|
|
type ChunkReadAt struct {
|
2022-02-26 10:16:47 +00:00
|
|
|
masterClient *wdclient.MasterClient
|
|
|
|
chunkViews []*ChunkView
|
|
|
|
readerLock sync.Mutex
|
|
|
|
fileSize int64
|
|
|
|
readerCache *ReaderCache
|
|
|
|
readerPattern *ReaderPattern
|
2022-02-27 07:20:45 +00:00
|
|
|
lastChunkFid string
|
2020-03-27 11:50:51 +00:00
|
|
|
}
|
|
|
|
|
2020-12-09 06:26:46 +00:00
|
|
|
var _ = io.ReaderAt(&ChunkReadAt{})
|
|
|
|
var _ = io.Closer(&ChunkReadAt{})
|
2020-03-27 11:50:51 +00:00
|
|
|
|
2021-01-06 12:21:34 +00:00
|
|
|
func LookupFn(filerClient filer_pb.FilerClient) wdclient.LookupFileIdFunctionType {
|
2020-10-04 03:16:42 +00:00
|
|
|
|
|
|
|
vidCache := make(map[string]*filer_pb.Locations)
|
2020-10-22 02:28:59 +00:00
|
|
|
var vicCacheLock sync.RWMutex
|
2020-10-08 05:49:04 +00:00
|
|
|
return func(fileId string) (targetUrls []string, err error) {
|
2020-10-04 03:16:42 +00:00
|
|
|
vid := VolumeId(fileId)
|
2020-10-22 02:28:59 +00:00
|
|
|
vicCacheLock.RLock()
|
2020-10-04 03:16:42 +00:00
|
|
|
locations, found := vidCache[vid]
|
2020-10-22 02:28:59 +00:00
|
|
|
vicCacheLock.RUnlock()
|
2020-10-04 03:16:42 +00:00
|
|
|
|
2020-11-01 08:58:48 +00:00
|
|
|
if !found {
|
2020-11-01 10:36:43 +00:00
|
|
|
util.Retry("lookup volume "+vid, func() error {
|
2021-12-26 08:15:03 +00:00
|
|
|
err = filerClient.WithFilerClient(false, func(client filer_pb.SeaweedFilerClient) error {
|
2020-11-01 08:58:48 +00:00
|
|
|
resp, err := client.LookupVolume(context.Background(), &filer_pb.LookupVolumeRequest{
|
|
|
|
VolumeIds: []string{vid},
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
locations = resp.LocationsMap[vid]
|
|
|
|
if locations == nil || len(locations.Locations) == 0 {
|
|
|
|
glog.V(0).Infof("failed to locate %s", fileId)
|
|
|
|
return fmt.Errorf("failed to locate %s", fileId)
|
|
|
|
}
|
|
|
|
vicCacheLock.Lock()
|
|
|
|
vidCache[vid] = locations
|
|
|
|
vicCacheLock.Unlock()
|
|
|
|
|
|
|
|
return nil
|
2020-10-04 03:16:42 +00:00
|
|
|
})
|
2020-11-01 08:58:48 +00:00
|
|
|
return err
|
2020-04-30 00:40:08 +00:00
|
|
|
})
|
2020-10-04 03:16:42 +00:00
|
|
|
}
|
2020-04-30 00:40:08 +00:00
|
|
|
|
2020-10-10 22:43:22 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2022-08-05 00:35:00 +00:00
|
|
|
fcDataCenter := filerClient.GetDataCenter()
|
|
|
|
var sameDcTargetUrls, otherTargetUrls []string
|
2020-10-08 05:49:04 +00:00
|
|
|
for _, loc := range locations.Locations {
|
2021-01-28 22:36:29 +00:00
|
|
|
volumeServerAddress := filerClient.AdjustedUrl(loc)
|
2020-10-08 05:49:04 +00:00
|
|
|
targetUrl := fmt.Sprintf("http://%s/%s", volumeServerAddress, fileId)
|
2022-08-05 00:35:00 +00:00
|
|
|
if fcDataCenter == "" || fcDataCenter != loc.DataCenter {
|
|
|
|
otherTargetUrls = append(otherTargetUrls, targetUrl)
|
|
|
|
} else {
|
|
|
|
sameDcTargetUrls = append(sameDcTargetUrls, targetUrl)
|
|
|
|
}
|
2020-10-08 05:49:04 +00:00
|
|
|
}
|
2022-08-05 00:35:00 +00:00
|
|
|
rand.Shuffle(len(sameDcTargetUrls), func(i, j int) {
|
|
|
|
sameDcTargetUrls[i], sameDcTargetUrls[j] = sameDcTargetUrls[j], sameDcTargetUrls[i]
|
|
|
|
})
|
|
|
|
rand.Shuffle(len(otherTargetUrls), func(i, j int) {
|
|
|
|
otherTargetUrls[i], otherTargetUrls[j] = otherTargetUrls[j], otherTargetUrls[i]
|
|
|
|
})
|
|
|
|
// Prefer same data center
|
|
|
|
targetUrls = append(sameDcTargetUrls, otherTargetUrls...)
|
2020-04-30 00:40:08 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-01-25 03:01:58 +00:00
|
|
|
func NewChunkReaderAtFromClient(lookupFn wdclient.LookupFileIdFunctionType, chunkViews []*ChunkView, chunkCache chunk_cache.ChunkCache, fileSize int64) *ChunkReadAt {
|
2020-03-27 11:50:51 +00:00
|
|
|
|
|
|
|
return &ChunkReadAt{
|
2021-12-20 06:43:14 +00:00
|
|
|
chunkViews: chunkViews,
|
|
|
|
fileSize: fileSize,
|
2022-02-27 07:20:45 +00:00
|
|
|
readerCache: newReaderCache(32, chunkCache, lookupFn),
|
2021-12-20 06:43:14 +00:00
|
|
|
readerPattern: NewReaderPattern(),
|
2020-03-27 11:50:51 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-12-09 06:26:46 +00:00
|
|
|
func (c *ChunkReadAt) Close() error {
|
2022-02-26 10:16:47 +00:00
|
|
|
c.readerCache.destroy()
|
2020-12-09 06:26:46 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-03-27 11:50:51 +00:00
|
|
|
func (c *ChunkReadAt) ReadAt(p []byte, offset int64) (n int, err error) {
|
|
|
|
|
2021-12-29 00:30:33 +00:00
|
|
|
c.readerPattern.MonitorReadAt(offset, len(p))
|
|
|
|
|
2020-03-27 11:50:51 +00:00
|
|
|
c.readerLock.Lock()
|
|
|
|
defer c.readerLock.Unlock()
|
|
|
|
|
2022-12-23 04:39:24 +00:00
|
|
|
// glog.V(4).Infof("ReadAt [%d,%d) of total file size %d bytes %d chunk views", offset, offset+int64(len(p)), c.fileSize, len(c.chunkViews))
|
|
|
|
n, _, err = c.doReadAt(p, offset)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *ChunkReadAt) ReadAtWithTime(p []byte, offset int64) (n int, ts int64, err error) {
|
|
|
|
|
|
|
|
c.readerPattern.MonitorReadAt(offset, len(p))
|
|
|
|
|
|
|
|
c.readerLock.Lock()
|
|
|
|
defer c.readerLock.Unlock()
|
|
|
|
|
2021-05-11 04:47:51 +00:00
|
|
|
// glog.V(4).Infof("ReadAt [%d,%d) of total file size %d bytes %d chunk views", offset, offset+int64(len(p)), c.fileSize, len(c.chunkViews))
|
2021-01-18 09:14:27 +00:00
|
|
|
return c.doReadAt(p, offset)
|
2020-03-27 11:50:51 +00:00
|
|
|
}
|
|
|
|
|
2022-12-23 04:39:24 +00:00
|
|
|
func (c *ChunkReadAt) doReadAt(p []byte, offset int64) (n int, ts int64, err error) {
|
2020-03-27 11:50:51 +00:00
|
|
|
|
2020-08-18 03:14:40 +00:00
|
|
|
startOffset, remaining := offset, int64(len(p))
|
2022-02-26 11:06:17 +00:00
|
|
|
var nextChunks []*ChunkView
|
2020-08-17 23:05:40 +00:00
|
|
|
for i, chunk := range c.chunkViews {
|
2020-08-18 03:14:40 +00:00
|
|
|
if remaining <= 0 {
|
|
|
|
break
|
|
|
|
}
|
2020-10-04 08:31:04 +00:00
|
|
|
if i+1 < len(c.chunkViews) {
|
2022-02-26 11:06:17 +00:00
|
|
|
nextChunks = c.chunkViews[i+1:]
|
2020-10-04 08:31:04 +00:00
|
|
|
}
|
2020-08-18 03:14:40 +00:00
|
|
|
if startOffset < chunk.LogicOffset {
|
2022-08-21 18:33:58 +00:00
|
|
|
gap := chunk.LogicOffset - startOffset
|
2022-01-13 14:20:33 +00:00
|
|
|
glog.V(4).Infof("zero [%d,%d)", startOffset, chunk.LogicOffset)
|
2022-08-21 18:49:29 +00:00
|
|
|
n += zero(p, startOffset-offset, gap)
|
2022-08-21 18:33:58 +00:00
|
|
|
startOffset, remaining = chunk.LogicOffset, remaining-gap
|
2020-08-18 03:14:40 +00:00
|
|
|
if remaining <= 0 {
|
|
|
|
break
|
|
|
|
}
|
2020-08-17 04:07:46 +00:00
|
|
|
}
|
2020-08-16 22:16:46 +00:00
|
|
|
// fmt.Printf(">>> doReadAt [%d,%d), chunk[%d,%d)\n", offset, offset+int64(len(p)), chunk.LogicOffset, chunk.LogicOffset+int64(chunk.Size))
|
2020-08-18 03:14:40 +00:00
|
|
|
chunkStart, chunkStop := max(chunk.LogicOffset, startOffset), min(chunk.LogicOffset+int64(chunk.Size), startOffset+remaining)
|
2020-08-17 04:07:46 +00:00
|
|
|
if chunkStart >= chunkStop {
|
|
|
|
continue
|
|
|
|
}
|
2021-05-11 04:47:51 +00:00
|
|
|
// glog.V(4).Infof("read [%d,%d), %d/%d chunk %s [%d,%d)", chunkStart, chunkStop, i, len(c.chunkViews), chunk.FileId, chunk.LogicOffset-chunk.Offset, chunk.LogicOffset-chunk.Offset+int64(chunk.Size))
|
2021-04-28 23:13:37 +00:00
|
|
|
bufferOffset := chunkStart - chunk.LogicOffset + chunk.Offset
|
2022-12-23 04:39:24 +00:00
|
|
|
ts = chunk.ModifiedTsNs
|
2022-02-26 11:06:17 +00:00
|
|
|
copied, err := c.readChunkSliceAt(p[startOffset-offset:chunkStop-chunkStart+startOffset-offset], chunk, nextChunks, uint64(bufferOffset))
|
2020-08-17 04:07:46 +00:00
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("fetching chunk %+v: %v\n", chunk, err)
|
2022-12-23 04:39:24 +00:00
|
|
|
return copied, ts, err
|
2020-03-27 11:50:51 +00:00
|
|
|
}
|
2021-04-28 23:13:37 +00:00
|
|
|
|
2020-08-17 04:07:46 +00:00
|
|
|
n += copied
|
2020-08-18 03:20:08 +00:00
|
|
|
startOffset, remaining = startOffset+int64(copied), remaining-int64(copied)
|
2020-03-27 11:50:51 +00:00
|
|
|
}
|
2020-08-16 07:49:08 +00:00
|
|
|
|
2021-05-11 04:47:51 +00:00
|
|
|
// glog.V(4).Infof("doReadAt [%d,%d), n:%v, err:%v", offset, offset+int64(len(p)), n, err)
|
2020-08-16 07:49:08 +00:00
|
|
|
|
2022-08-21 18:33:58 +00:00
|
|
|
// zero the remaining bytes if a gap exists at the end of the last chunk (or a fully sparse file)
|
|
|
|
if err == nil && remaining > 0 {
|
|
|
|
var delta int64
|
|
|
|
if c.fileSize > startOffset {
|
|
|
|
delta = min(remaining, c.fileSize-startOffset)
|
|
|
|
startOffset -= offset
|
|
|
|
} else {
|
|
|
|
delta = remaining
|
|
|
|
startOffset = max(startOffset-offset, startOffset-remaining-offset)
|
|
|
|
}
|
|
|
|
glog.V(4).Infof("zero2 [%d,%d) of file size %d bytes", startOffset, startOffset+delta, c.fileSize)
|
2022-08-21 18:49:29 +00:00
|
|
|
n += zero(p, startOffset, delta)
|
2020-03-27 11:50:51 +00:00
|
|
|
}
|
2020-08-18 03:14:40 +00:00
|
|
|
|
2020-10-14 19:18:24 +00:00
|
|
|
if err == nil && offset+int64(len(p)) >= c.fileSize {
|
2020-08-16 07:49:08 +00:00
|
|
|
err = io.EOF
|
|
|
|
}
|
2020-08-16 22:16:46 +00:00
|
|
|
// fmt.Printf("~~~ filled %d, err: %v\n\n", n, err)
|
2020-03-27 11:50:51 +00:00
|
|
|
|
|
|
|
return
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2022-02-26 11:06:17 +00:00
|
|
|
func (c *ChunkReadAt) readChunkSliceAt(buffer []byte, chunkView *ChunkView, nextChunkViews []*ChunkView, offset uint64) (n int, err error) {
|
2021-04-28 23:13:37 +00:00
|
|
|
|
2021-12-23 00:17:30 +00:00
|
|
|
if c.readerPattern.IsRandomMode() {
|
2022-07-07 18:50:28 +00:00
|
|
|
n, err := c.readerCache.chunkCache.ReadChunkAt(buffer, chunkView.FileId, offset)
|
|
|
|
if n > 0 {
|
|
|
|
return n, err
|
|
|
|
}
|
2022-03-13 09:38:52 +00:00
|
|
|
return fetchChunkRange(buffer, c.readerCache.lookupFileIdFn, chunkView.FileId, chunkView.CipherKey, chunkView.IsGzipped, int64(offset))
|
2021-04-28 23:13:37 +00:00
|
|
|
}
|
|
|
|
|
2022-02-26 10:16:47 +00:00
|
|
|
n, err = c.readerCache.ReadChunkAt(buffer, chunkView.FileId, chunkView.CipherKey, chunkView.IsGzipped, int64(offset), int(chunkView.ChunkSize), chunkView.LogicOffset == 0)
|
2022-02-27 11:57:24 +00:00
|
|
|
if c.lastChunkFid != chunkView.FileId {
|
2022-02-27 07:20:45 +00:00
|
|
|
if chunkView.Offset == 0 { // start of a new chunk
|
2022-02-27 11:57:24 +00:00
|
|
|
if c.lastChunkFid != "" {
|
|
|
|
c.readerCache.UnCache(c.lastChunkFid)
|
|
|
|
c.readerCache.MaybeCache(nextChunkViews)
|
|
|
|
} else {
|
|
|
|
if len(nextChunkViews) >= 1 {
|
|
|
|
c.readerCache.MaybeCache(nextChunkViews[:1]) // just read the next chunk if at the very beginning
|
|
|
|
}
|
|
|
|
}
|
2022-02-26 11:06:17 +00:00
|
|
|
}
|
2020-12-09 06:26:46 +00:00
|
|
|
}
|
2022-02-27 07:20:45 +00:00
|
|
|
c.lastChunkFid = chunkView.FileId
|
2020-08-16 22:16:46 +00:00
|
|
|
return
|
2020-03-29 07:54:39 +00:00
|
|
|
}
|
2022-08-21 18:33:58 +00:00
|
|
|
|
2022-08-21 18:49:29 +00:00
|
|
|
// zero sets buffer[start:start+length] to zero and returns the number of
// bytes it cleared.
//
// The range is clamped to the buffer: a negative start is treated as 0 and
// the end is capped at len(buffer). When the clamped range is empty (start at
// or beyond the end of the buffer, or a non-positive length) nothing is
// written and 0 is returned, never a negative count.
func zero(buffer []byte, start, length int64) int {
	end := start + length
	if limit := int64(len(buffer)); end > limit {
		end = limit
	}
	if start < 0 {
		start = 0
	}
	if end <= start {
		return 0
	}

	// zero the bytes
	region := buffer[start:end]
	for i := range region {
		region[i] = 0
	}
	return len(region)
}
|