2018-05-29 03:30:17 +08:00
|
|
|
package filesys
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
2021-05-10 06:15:18 +08:00
|
|
|
"fmt"
|
2021-12-20 17:02:23 +08:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/filesys/page_writer"
|
2020-10-15 14:28:03 +08:00
|
|
|
"io"
|
|
|
|
"sync"
|
2020-10-16 02:08:45 +08:00
|
|
|
"time"
|
2020-10-21 17:16:21 +08:00
|
|
|
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/pb/filer_pb"
|
2018-05-29 03:30:17 +08:00
|
|
|
)
|
|
|
|
|
|
|
|
type ContinuousDirtyPages struct {
|
2021-12-20 17:02:23 +08:00
|
|
|
intervals *page_writer.ContinuousIntervals
|
2021-01-29 07:23:46 +08:00
|
|
|
f *File
|
|
|
|
writeWaitGroup sync.WaitGroup
|
|
|
|
chunkAddLock sync.Mutex
|
|
|
|
lastErr error
|
|
|
|
collection string
|
|
|
|
replication string
|
2018-05-29 03:30:17 +08:00
|
|
|
}
|
|
|
|
|
2021-12-20 17:11:43 +08:00
|
|
|
func newContinuousDirtyPages(file *File) *ContinuousDirtyPages {
|
2020-10-21 17:16:21 +08:00
|
|
|
dirtyPages := &ContinuousDirtyPages{
|
2021-12-20 17:02:23 +08:00
|
|
|
intervals: &page_writer.ContinuousIntervals{},
|
2021-01-29 07:23:46 +08:00
|
|
|
f: file,
|
2018-05-29 03:30:17 +08:00
|
|
|
}
|
2020-10-21 17:16:21 +08:00
|
|
|
return dirtyPages
|
2018-05-29 16:21:21 +08:00
|
|
|
}
|
2018-05-29 03:30:17 +08:00
|
|
|
|
2020-10-15 14:28:03 +08:00
|
|
|
func (pages *ContinuousDirtyPages) AddPage(offset int64, data []byte) {
|
2018-05-31 13:02:21 +08:00
|
|
|
|
2021-03-10 15:08:38 +08:00
|
|
|
glog.V(4).Infof("%s AddPage [%d,%d)", pages.f.fullpath(), offset, offset+int64(len(data)))
|
2018-05-29 03:30:17 +08:00
|
|
|
|
2019-01-01 18:14:40 +08:00
|
|
|
if len(data) > int(pages.f.wfs.option.ChunkSizeLimit) {
|
2018-05-31 13:09:24 +08:00
|
|
|
// this is more than what buffer can hold.
|
2020-10-15 14:28:03 +08:00
|
|
|
pages.flushAndSave(offset, data)
|
2018-05-29 03:30:17 +08:00
|
|
|
}
|
|
|
|
|
2020-01-27 05:01:11 +08:00
|
|
|
pages.intervals.AddInterval(data, offset)
|
2018-05-29 03:30:17 +08:00
|
|
|
|
2020-10-22 10:29:51 +08:00
|
|
|
if pages.intervals.TotalSize() >= pages.f.wfs.option.ChunkSizeLimit {
|
2020-10-15 14:28:03 +08:00
|
|
|
pages.saveExistingLargestPageToStorage()
|
2018-09-08 04:11:43 +08:00
|
|
|
}
|
2018-09-10 17:21:57 +08:00
|
|
|
|
2018-05-29 03:30:17 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2020-10-15 14:28:03 +08:00
|
|
|
func (pages *ContinuousDirtyPages) flushAndSave(offset int64, data []byte) {
|
2018-09-10 17:21:57 +08:00
|
|
|
|
|
|
|
// flush existing
|
2020-10-15 14:28:03 +08:00
|
|
|
pages.saveExistingPagesToStorage()
|
2018-09-10 17:21:57 +08:00
|
|
|
|
|
|
|
// flush the new page
|
2020-10-15 14:28:03 +08:00
|
|
|
pages.saveToStorage(bytes.NewReader(data), offset, int64(len(data)))
|
2018-09-10 17:21:57 +08:00
|
|
|
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2021-05-10 06:15:18 +08:00
|
|
|
func (pages *ContinuousDirtyPages) FlushData() error {
|
|
|
|
|
|
|
|
pages.saveExistingPagesToStorage()
|
|
|
|
pages.writeWaitGroup.Wait()
|
|
|
|
if pages.lastErr != nil {
|
|
|
|
return fmt.Errorf("flush data: %v", pages.lastErr)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-10-15 14:28:03 +08:00
|
|
|
func (pages *ContinuousDirtyPages) saveExistingPagesToStorage() {
|
|
|
|
for pages.saveExistingLargestPageToStorage() {
|
2018-05-29 03:30:17 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-10-15 14:28:03 +08:00
|
|
|
func (pages *ContinuousDirtyPages) saveExistingLargestPageToStorage() (hasSavedData bool) {
|
2018-09-08 04:11:43 +08:00
|
|
|
|
2020-01-23 15:00:04 +08:00
|
|
|
maxList := pages.intervals.RemoveLargestIntervalLinkedList()
|
|
|
|
if maxList == nil {
|
2020-10-15 14:28:03 +08:00
|
|
|
return false
|
2018-09-08 04:11:43 +08:00
|
|
|
}
|
|
|
|
|
2021-03-10 15:08:38 +08:00
|
|
|
entry := pages.f.getEntry()
|
|
|
|
if entry == nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
2021-03-16 17:59:26 +08:00
|
|
|
fileSize := int64(entry.Attributes.FileSize)
|
2020-10-15 14:28:03 +08:00
|
|
|
|
|
|
|
chunkSize := min(maxList.Size(), fileSize-maxList.Offset())
|
|
|
|
if chunkSize == 0 {
|
|
|
|
return false
|
2020-01-23 15:00:04 +08:00
|
|
|
}
|
2020-01-21 12:21:01 +08:00
|
|
|
|
2020-10-15 14:28:03 +08:00
|
|
|
pages.saveToStorage(maxList.ToReader(), maxList.Offset(), chunkSize)
|
|
|
|
|
|
|
|
return true
|
2018-05-31 13:02:21 +08:00
|
|
|
}
|
|
|
|
|
2020-10-15 14:28:03 +08:00
|
|
|
func (pages *ContinuousDirtyPages) saveToStorage(reader io.Reader, offset int64, size int64) {
|
2018-05-29 03:30:17 +08:00
|
|
|
|
2020-10-16 02:08:45 +08:00
|
|
|
mtime := time.Now().UnixNano()
|
2020-10-15 14:28:03 +08:00
|
|
|
pages.writeWaitGroup.Add(1)
|
2020-10-31 12:22:20 +08:00
|
|
|
writer := func() {
|
2020-10-15 14:28:03 +08:00
|
|
|
defer pages.writeWaitGroup.Done()
|
2020-02-25 14:28:45 +08:00
|
|
|
|
2020-10-15 14:28:03 +08:00
|
|
|
reader = io.LimitReader(reader, size)
|
2021-12-20 17:11:43 +08:00
|
|
|
chunk, collection, replication, err := pages.f.wfs.saveDataAsChunk(pages.f.fullpath())(reader, pages.f.Name, offset)
|
2020-10-15 14:28:03 +08:00
|
|
|
if err != nil {
|
|
|
|
glog.V(0).Infof("%s saveToStorage [%d,%d): %v", pages.f.fullpath(), offset, offset+size, err)
|
2021-01-28 20:46:37 +08:00
|
|
|
pages.lastErr = err
|
2020-10-15 14:28:03 +08:00
|
|
|
return
|
|
|
|
}
|
2020-10-16 02:08:45 +08:00
|
|
|
chunk.Mtime = mtime
|
2020-10-15 14:28:03 +08:00
|
|
|
pages.collection, pages.replication = collection, replication
|
2020-11-04 04:20:41 +08:00
|
|
|
pages.chunkAddLock.Lock()
|
|
|
|
defer pages.chunkAddLock.Unlock()
|
2020-10-15 14:28:03 +08:00
|
|
|
pages.f.addChunks([]*filer_pb.FileChunk{chunk})
|
2020-10-21 17:17:40 +08:00
|
|
|
glog.V(3).Infof("%s saveToStorage [%d,%d)", pages.f.fullpath(), offset, offset+size)
|
2020-10-31 12:22:20 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if pages.f.wfs.concurrentWriters != nil {
|
|
|
|
pages.f.wfs.concurrentWriters.Execute(writer)
|
|
|
|
} else {
|
|
|
|
go writer()
|
|
|
|
}
|
2018-05-29 03:30:17 +08:00
|
|
|
}
|
2018-05-29 16:21:21 +08:00
|
|
|
|
2020-08-18 02:12:10 +08:00
|
|
|
func (pages *ContinuousDirtyPages) ReadDirtyDataAt(data []byte, startOffset int64) (maxStop int64) {
|
|
|
|
return pages.intervals.ReadDataAt(data, startOffset)
|
2020-01-23 05:42:03 +08:00
|
|
|
}
|
2021-05-10 06:28:54 +08:00
|
|
|
|
|
|
|
func (pages *ContinuousDirtyPages) GetStorageOptions() (collection, replication string) {
|
|
|
|
return pages.collection, pages.replication
|
|
|
|
}
|
2021-12-24 09:17:32 +08:00
|
|
|
func (pages ContinuousDirtyPages) Destroy() {
|
|
|
|
}
|