2020-04-11 19:45:24 +00:00
|
|
|
package chunk_cache
|
2020-03-28 20:43:31 +00:00
|
|
|
|
|
|
|
import (
|
2021-04-28 23:13:37 +00:00
|
|
|
"errors"
|
2020-04-12 04:12:41 +00:00
|
|
|
"sync"
|
2020-03-28 20:43:31 +00:00
|
|
|
|
2020-04-12 04:12:41 +00:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/storage/needle"
|
2020-03-28 20:43:31 +00:00
|
|
|
)
|
|
|
|
|
2021-04-28 23:13:37 +00:00
|
|
|
// ErrorOutOfBounds is the error value describing an attempt to read outside
// the bounds of the available data.
// NOTE(review): it is not referenced in the code visible here; presumably it
// is returned by the slice-reading helpers of the cache layers — confirm.
var ErrorOutOfBounds = errors.New("attempt to read out of bounds")
|
|
|
|
|
2020-08-18 03:20:08 +00:00
|
|
|
// ChunkCache is the contract for a cache of file chunks keyed by file id.
type ChunkCache interface {
	// GetChunk looks up the chunk stored under fileId; minSize is the
	// smallest acceptable length of the returned data.
	GetChunk(fileId string, minSize uint64) (data []byte)

	// GetChunkSlice looks up a window of the chunk stored under fileId,
	// described by a byte offset and a length.
	GetChunkSlice(fileId string, offset, length uint64) []byte

	// SetChunk stores data under fileId.
	SetChunk(fileId string, data []byte)
}
|
|
|
|
|
2020-03-28 20:43:31 +00:00
|
|
|
// a global cache for recently accessed file chunks
|
2020-08-18 03:15:53 +00:00
|
|
|
type TieredChunkCache struct {
|
2020-04-14 05:19:27 +00:00
|
|
|
memCache *ChunkCacheInMemory
|
|
|
|
diskCaches []*OnDiskCacheLayer
|
2020-04-12 04:12:41 +00:00
|
|
|
sync.RWMutex
|
2020-09-27 17:41:29 +00:00
|
|
|
onDiskCacheSizeLimit0 uint64
|
|
|
|
onDiskCacheSizeLimit1 uint64
|
2020-09-27 18:58:48 +00:00
|
|
|
onDiskCacheSizeLimit2 uint64
|
2020-03-28 20:43:31 +00:00
|
|
|
}
|
|
|
|
|
2021-04-28 23:13:37 +00:00
|
|
|
// Compile-time check that *TieredChunkCache satisfies ChunkCache.
var _ ChunkCache = (*TieredChunkCache)(nil)
|
|
|
|
|
2020-09-27 17:41:29 +00:00
|
|
|
func NewTieredChunkCache(maxEntries int64, dir string, diskSizeInUnit int64, unitSize int64) *TieredChunkCache {
|
2020-04-12 04:12:41 +00:00
|
|
|
|
2020-08-18 03:15:53 +00:00
|
|
|
c := &TieredChunkCache{
|
2020-04-14 05:19:27 +00:00
|
|
|
memCache: NewChunkCacheInMemory(maxEntries),
|
2020-03-28 20:43:31 +00:00
|
|
|
}
|
2020-04-14 05:19:27 +00:00
|
|
|
c.diskCaches = make([]*OnDiskCacheLayer, 3)
|
2020-09-27 17:41:29 +00:00
|
|
|
c.onDiskCacheSizeLimit0 = uint64(unitSize)
|
|
|
|
c.onDiskCacheSizeLimit1 = 4 * c.onDiskCacheSizeLimit0
|
2020-09-27 18:58:48 +00:00
|
|
|
c.onDiskCacheSizeLimit2 = 2 * c.onDiskCacheSizeLimit1
|
2020-09-27 18:42:51 +00:00
|
|
|
c.diskCaches[0] = NewOnDiskCacheLayer(dir, "c0_2", diskSizeInUnit*unitSize/8, 2)
|
|
|
|
c.diskCaches[1] = NewOnDiskCacheLayer(dir, "c1_3", diskSizeInUnit*unitSize/4+diskSizeInUnit*unitSize/8, 3)
|
|
|
|
c.diskCaches[2] = NewOnDiskCacheLayer(dir, "c2_2", diskSizeInUnit*unitSize/2, 2)
|
2020-04-12 04:12:41 +00:00
|
|
|
|
|
|
|
return c
|
2020-03-28 20:43:31 +00:00
|
|
|
}
|
|
|
|
|
2020-08-18 03:15:53 +00:00
|
|
|
func (c *TieredChunkCache) GetChunk(fileId string, minSize uint64) (data []byte) {
|
2020-04-12 08:00:12 +00:00
|
|
|
if c == nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2020-04-12 04:12:41 +00:00
|
|
|
c.RLock()
|
|
|
|
defer c.RUnlock()
|
|
|
|
|
2020-08-17 23:05:13 +00:00
|
|
|
return c.doGetChunk(fileId, minSize)
|
2020-04-12 08:06:50 +00:00
|
|
|
}
|
|
|
|
|
2020-08-18 03:15:53 +00:00
|
|
|
func (c *TieredChunkCache) doGetChunk(fileId string, minSize uint64) (data []byte) {
|
2020-04-14 04:58:10 +00:00
|
|
|
|
2020-09-27 18:42:51 +00:00
|
|
|
if minSize <= c.onDiskCacheSizeLimit0 {
|
2020-06-27 19:51:04 +00:00
|
|
|
data = c.memCache.GetChunk(fileId)
|
2020-08-17 23:05:13 +00:00
|
|
|
if len(data) >= int(minSize) {
|
2020-06-27 19:51:04 +00:00
|
|
|
return data
|
|
|
|
}
|
2020-04-12 04:12:41 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fid, err := needle.ParseFileIdFromString(fileId)
|
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("failed to parse file id %s", fileId)
|
2020-03-28 20:43:31 +00:00
|
|
|
return nil
|
|
|
|
}
|
2020-04-14 04:58:10 +00:00
|
|
|
|
2020-09-27 18:42:51 +00:00
|
|
|
if minSize <= c.onDiskCacheSizeLimit0 {
|
2020-06-27 19:51:04 +00:00
|
|
|
data = c.diskCaches[0].getChunk(fid.Key)
|
2020-08-17 23:05:13 +00:00
|
|
|
if len(data) >= int(minSize) {
|
2020-06-27 19:51:04 +00:00
|
|
|
return data
|
|
|
|
}
|
|
|
|
}
|
2020-09-27 18:42:51 +00:00
|
|
|
if minSize <= c.onDiskCacheSizeLimit1 {
|
2020-06-27 19:51:04 +00:00
|
|
|
data = c.diskCaches[1].getChunk(fid.Key)
|
2020-08-17 23:05:13 +00:00
|
|
|
if len(data) >= int(minSize) {
|
2020-06-27 19:51:04 +00:00
|
|
|
return data
|
|
|
|
}
|
|
|
|
}
|
2020-10-03 21:12:38 +00:00
|
|
|
{
|
2020-06-27 19:51:04 +00:00
|
|
|
data = c.diskCaches[2].getChunk(fid.Key)
|
2020-08-17 23:05:13 +00:00
|
|
|
if len(data) >= int(minSize) {
|
2020-04-14 05:19:27 +00:00
|
|
|
return data
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
2020-04-14 04:58:10 +00:00
|
|
|
|
2020-03-28 20:43:31 +00:00
|
|
|
}
|
|
|
|
|
2021-04-28 23:13:37 +00:00
|
|
|
func (c *TieredChunkCache) GetChunkSlice(fileId string, offset, length uint64) []byte {
|
|
|
|
if c == nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
c.RLock()
|
|
|
|
defer c.RUnlock()
|
|
|
|
|
|
|
|
return c.doGetChunkSlice(fileId, offset, length)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *TieredChunkCache) doGetChunkSlice(fileId string, offset, length uint64) (data []byte) {
|
|
|
|
|
|
|
|
minSize := offset + length
|
|
|
|
if minSize <= c.onDiskCacheSizeLimit0 {
|
|
|
|
data, err := c.memCache.getChunkSlice(fileId, offset, length)
|
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("failed to read from memcache: %s", err)
|
|
|
|
}
|
|
|
|
if len(data) >= int(minSize) {
|
|
|
|
return data
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fid, err := needle.ParseFileIdFromString(fileId)
|
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("failed to parse file id %s", fileId)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
if minSize <= c.onDiskCacheSizeLimit0 {
|
|
|
|
data = c.diskCaches[0].getChunkSlice(fid.Key, offset, length)
|
|
|
|
if len(data) >= int(minSize) {
|
|
|
|
return data
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if minSize <= c.onDiskCacheSizeLimit1 {
|
|
|
|
data = c.diskCaches[1].getChunkSlice(fid.Key, offset, length)
|
|
|
|
if len(data) >= int(minSize) {
|
|
|
|
return data
|
|
|
|
}
|
|
|
|
}
|
|
|
|
{
|
|
|
|
data = c.diskCaches[2].getChunkSlice(fid.Key, offset, length)
|
|
|
|
if len(data) >= int(minSize) {
|
|
|
|
return data
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-08-18 03:15:53 +00:00
|
|
|
func (c *TieredChunkCache) SetChunk(fileId string, data []byte) {
|
2020-04-12 08:00:12 +00:00
|
|
|
if c == nil {
|
|
|
|
return
|
|
|
|
}
|
2020-04-12 04:12:41 +00:00
|
|
|
c.Lock()
|
|
|
|
defer c.Unlock()
|
|
|
|
|
2020-08-31 03:12:04 +00:00
|
|
|
glog.V(4).Infof("SetChunk %s size %d\n", fileId, len(data))
|
2020-06-26 17:01:55 +00:00
|
|
|
|
2020-04-12 10:34:36 +00:00
|
|
|
c.doSetChunk(fileId, data)
|
2020-04-12 08:06:50 +00:00
|
|
|
}
|
|
|
|
|
2020-08-18 03:15:53 +00:00
|
|
|
func (c *TieredChunkCache) doSetChunk(fileId string, data []byte) {
|
2020-04-12 08:06:50 +00:00
|
|
|
|
2020-09-27 18:42:51 +00:00
|
|
|
if len(data) <= int(c.onDiskCacheSizeLimit0) {
|
2020-04-14 04:58:10 +00:00
|
|
|
c.memCache.SetChunk(fileId, data)
|
2020-04-12 04:12:41 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fid, err := needle.ParseFileIdFromString(fileId)
|
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("failed to parse file id %s", fileId)
|
|
|
|
return
|
|
|
|
}
|
2020-04-14 04:58:10 +00:00
|
|
|
|
2020-09-27 18:42:51 +00:00
|
|
|
if len(data) <= int(c.onDiskCacheSizeLimit0) {
|
2020-04-14 05:19:27 +00:00
|
|
|
c.diskCaches[0].setChunk(fid.Key, data)
|
2020-09-27 18:42:51 +00:00
|
|
|
} else if len(data) <= int(c.onDiskCacheSizeLimit1) {
|
2020-04-14 05:19:27 +00:00
|
|
|
c.diskCaches[1].setChunk(fid.Key, data)
|
2020-10-03 21:12:38 +00:00
|
|
|
} else {
|
2020-04-14 05:19:27 +00:00
|
|
|
c.diskCaches[2].setChunk(fid.Key, data)
|
|
|
|
}
|
2020-04-12 04:12:41 +00:00
|
|
|
|
2020-03-28 20:43:31 +00:00
|
|
|
}
|
2020-04-12 04:12:41 +00:00
|
|
|
|
2020-08-18 03:15:53 +00:00
|
|
|
func (c *TieredChunkCache) Shutdown() {
|
2020-04-12 08:00:12 +00:00
|
|
|
if c == nil {
|
|
|
|
return
|
|
|
|
}
|
2020-04-12 04:12:41 +00:00
|
|
|
c.Lock()
|
|
|
|
defer c.Unlock()
|
2020-04-14 05:19:27 +00:00
|
|
|
for _, diskCache := range c.diskCaches {
|
|
|
|
diskCache.shutdown()
|
|
|
|
}
|
2020-04-13 04:00:55 +00:00
|
|
|
}
|
2021-04-28 23:13:37 +00:00
|
|
|
|
|
|
|
// min returns the smaller of x and y.
func min(x, y int) int {
	if y <= x {
		return y
	}
	return x
}
|