seaweedfs/weed/util/chunk_cache/chunk_cache.go

194 lines
4.3 KiB
Go
Raw Normal View History

2020-04-12 03:45:24 +08:00
package chunk_cache
import (
"errors"
2020-04-12 12:12:41 +08:00
"sync"
"github.com/seaweedfs/seaweedfs/weed/glog"
"github.com/seaweedfs/seaweedfs/weed/storage/needle"
)
// ErrorOutOfBounds is the package-level error value describing an attempt to
// read out of bounds.
var ErrorOutOfBounds = errors.New("attempt to read out of bounds")
2020-08-18 11:20:08 +08:00
// ChunkCache is the interface to a cache of file chunks addressed by file id.
type ChunkCache interface {
	// ReadChunkAt takes a destination buffer, a file id and an offset, and
	// reports how many bytes were read together with any error.
	ReadChunkAt(data []byte, fileId string, offset uint64) (n int, err error)

	// SetChunk hands the cache the data belonging to fileId.
	SetChunk(fileId string, data []byte)

	// IsInCache reports whether fileId is present in the cache. lockNeeded
	// tells the implementation whether it has to acquire its own lock; callers
	// that already hold the lock pass false.
	IsInCache(fileId string, lockNeeded bool) (answer bool)

	// GetMaxFilePartSizeInCache reports a size limit configured on the cache.
	// NOTE(review): presumably the largest file part worth caching; confirm
	// against callers.
	GetMaxFilePartSizeInCache() (answer uint64)
}
// a global cache for recently accessed file chunks
2020-08-18 11:15:53 +08:00
type TieredChunkCache struct {
memCache *ChunkCacheInMemory
diskCaches []*OnDiskCacheLayer
2020-04-12 12:12:41 +08:00
sync.RWMutex
2024-09-14 23:33:35 +08:00
onDiskCacheSizeLimit0 uint64
onDiskCacheSizeLimit1 uint64
onDiskCacheSizeLimit2 uint64
maxFilePartSizeInCache uint64
}
// Compile-time assertion that *TieredChunkCache satisfies ChunkCache.
var _ ChunkCache = &TieredChunkCache{}
func NewTieredChunkCache(maxEntries int64, dir string, diskSizeInUnit int64, unitSize int64) *TieredChunkCache {
2020-04-12 12:12:41 +08:00
2020-08-18 11:15:53 +08:00
c := &TieredChunkCache{
memCache: NewChunkCacheInMemory(maxEntries),
}
c.diskCaches = make([]*OnDiskCacheLayer, 3)
2020-09-28 01:41:29 +08:00
c.onDiskCacheSizeLimit0 = uint64(unitSize)
c.onDiskCacheSizeLimit1 = 4 * c.onDiskCacheSizeLimit0
2020-09-28 02:58:48 +08:00
c.onDiskCacheSizeLimit2 = 2 * c.onDiskCacheSizeLimit1
2020-09-28 02:42:51 +08:00
c.diskCaches[0] = NewOnDiskCacheLayer(dir, "c0_2", diskSizeInUnit*unitSize/8, 2)
c.diskCaches[1] = NewOnDiskCacheLayer(dir, "c1_3", diskSizeInUnit*unitSize/4+diskSizeInUnit*unitSize/8, 3)
c.diskCaches[2] = NewOnDiskCacheLayer(dir, "c2_2", diskSizeInUnit*unitSize/2, 2)
2024-09-14 23:33:35 +08:00
c.maxFilePartSizeInCache = uint64(unitSize*diskSizeInUnit) / 4
2020-04-12 12:12:41 +08:00
return c
}
func (c *TieredChunkCache) GetMaxFilePartSizeInCache() (answer uint64) {
2024-09-14 23:33:35 +08:00
if c == nil {
return 0
}
return c.maxFilePartSizeInCache
}
// IsInCache reports whether fileId is held by the in-memory cache or by any
// volume of any on-disk cache layer.
//
// When lockNeeded is true the read lock is taken for the duration of the
// lookup; callers that already hold the lock pass false. A nil receiver and an
// unparseable fileId both yield false.
func (c *TieredChunkCache) IsInCache(fileId string, lockNeeded bool) (answer bool) {
	if c == nil {
		return false
	}

	if lockNeeded {
		c.RLock()
		defer c.RUnlock()
	}

	// The memory cache is keyed by the raw file id string.
	if hit := c.memCache.cache.Get(fileId); hit != nil {
		glog.V(4).Infof("fileId %s is in memcache", fileId)
		return true
	}

	// The disk layers are keyed by the needle key parsed out of the file id.
	fid, parseErr := needle.ParseFileIdFromString(fileId)
	if parseErr != nil {
		glog.V(4).Infof("failed to parse file id %s", fileId)
		return false
	}

	for layerIdx, layer := range c.diskCaches {
		for volumeIdx, volume := range layer.diskCaches {
			if _, found := volume.nm.Get(fid.Key); found {
				glog.V(4).Infof("fileId %s is in diskCaches[%d].volume[%d]", fileId, layerIdx, volumeIdx)
				return true
			}
		}
	}

	return false
}
2022-02-26 13:55:04 +08:00
func (c *TieredChunkCache) ReadChunkAt(data []byte, fileId string, offset uint64) (n int, err error) {
if c == nil {
return 0, nil
}
c.RLock()
defer c.RUnlock()
minSize := offset + uint64(len(data))
if minSize <= c.onDiskCacheSizeLimit0 {
n, err = c.memCache.readChunkAt(data, fileId, offset)
if err != nil {
glog.Errorf("failed to read from memcache: %s", err)
}
if n == int(len(data)) {
2022-02-26 13:55:04 +08:00
return n, nil
}
}
fid, err := needle.ParseFileIdFromString(fileId)
if err != nil {
glog.Errorf("failed to parse file id %s", fileId)
return 0, nil
2022-02-26 13:55:04 +08:00
}
if minSize <= c.onDiskCacheSizeLimit0 {
n, err = c.diskCaches[0].readChunkAt(data, fid.Key, offset)
if n == int(len(data)) {
2022-02-26 13:55:04 +08:00
return
}
}
if minSize <= c.onDiskCacheSizeLimit1 {
n, err = c.diskCaches[1].readChunkAt(data, fid.Key, offset)
if n == int(len(data)) {
2022-02-26 13:55:04 +08:00
return
}
}
{
n, err = c.diskCaches[2].readChunkAt(data, fid.Key, offset)
if n == int(len(data)) {
2022-02-26 13:55:04 +08:00
return
}
}
return 0, nil
}
2020-08-18 11:15:53 +08:00
func (c *TieredChunkCache) SetChunk(fileId string, data []byte) {
2020-04-12 16:00:12 +08:00
if c == nil {
return
}
2020-04-12 12:12:41 +08:00
c.Lock()
defer c.Unlock()
2020-08-31 11:12:04 +08:00
glog.V(4).Infof("SetChunk %s size %d\n", fileId, len(data))
if c.IsInCache(fileId, false) {
glog.V(4).Infof("fileId %s is already in cache", fileId)
return
}
2020-06-27 01:01:55 +08:00
c.doSetChunk(fileId, data)
}
2020-08-18 11:15:53 +08:00
func (c *TieredChunkCache) doSetChunk(fileId string, data []byte) {
2020-09-28 02:42:51 +08:00
if len(data) <= int(c.onDiskCacheSizeLimit0) {
2020-04-14 12:58:10 +08:00
c.memCache.SetChunk(fileId, data)
2020-04-12 12:12:41 +08:00
}
fid, err := needle.ParseFileIdFromString(fileId)
if err != nil {
glog.Errorf("failed to parse file id %s", fileId)
return
}
2020-04-14 12:58:10 +08:00
2020-09-28 02:42:51 +08:00
if len(data) <= int(c.onDiskCacheSizeLimit0) {
c.diskCaches[0].setChunk(fid.Key, data)
2020-09-28 02:42:51 +08:00
} else if len(data) <= int(c.onDiskCacheSizeLimit1) {
c.diskCaches[1].setChunk(fid.Key, data)
} else {
c.diskCaches[2].setChunk(fid.Key, data)
}
2020-04-12 12:12:41 +08:00
}
2020-04-12 12:12:41 +08:00
2020-08-18 11:15:53 +08:00
func (c *TieredChunkCache) Shutdown() {
2020-04-12 16:00:12 +08:00
if c == nil {
return
}
2020-04-12 12:12:41 +08:00
c.Lock()
defer c.Unlock()
for _, diskCache := range c.diskCaches {
diskCache.shutdown()
}
2020-04-13 12:00:55 +08:00
}
// min returns the smaller of x and y.
func min(x, y int) int {
	smaller := y
	if x < y {
		smaller = x
	}
	return smaller
}