seaweedfs/weed/filesys/filehandle.go

304 lines
8.1 KiB
Go
Raw Normal View History

2018-05-23 18:08:46 +08:00
package filesys
import (
2018-05-28 02:52:26 +08:00
"context"
2018-05-23 18:08:46 +08:00
"fmt"
2020-06-10 09:04:40 +08:00
"io"
"math"
2020-04-15 02:32:31 +08:00
"net/http"
2020-06-25 14:26:54 +08:00
"os"
"sync"
2019-05-03 15:24:35 +08:00
"time"
"github.com/seaweedfs/fuse"
"github.com/seaweedfs/fuse/fs"
2020-09-01 15:21:19 +08:00
"github.com/chrislusf/seaweedfs/weed/filer"
2018-05-23 18:08:46 +08:00
"github.com/chrislusf/seaweedfs/weed/glog"
2018-05-28 02:52:26 +08:00
"github.com/chrislusf/seaweedfs/weed/pb/filer_pb"
2018-05-23 18:08:46 +08:00
)
type FileHandle struct {
// cache file has been written to
dirtyPages *ContinuousDirtyPages
contentType string
handle uint64
sync.RWMutex
2018-06-06 17:09:57 +08:00
2018-05-25 15:57:25 +08:00
f *File
RequestId fuse.RequestID // unique ID for request
NodeId fuse.NodeID // file or directory the request is about
Uid uint32 // user ID of process making request
Gid uint32 // group ID of process making request
2018-05-23 18:08:46 +08:00
}
2018-06-06 17:09:57 +08:00
func newFileHandle(file *File, uid, gid uint32) *FileHandle {
fh := &FileHandle{
2018-06-06 17:09:57 +08:00
f: file,
dirtyPages: newDirtyPages(file),
Uid: uid,
Gid: gid,
}
if fh.f.entry != nil {
2020-09-01 15:21:19 +08:00
fh.f.entry.Attributes.FileSize = filer.FileSize(fh.f.entry)
}
return fh
2018-06-06 17:09:57 +08:00
}
2018-05-23 18:08:46 +08:00
var _ = fs.Handle(&FileHandle{})
2018-05-28 02:52:26 +08:00
// var _ = fs.HandleReadAller(&FileHandle{})
var _ = fs.HandleReader(&FileHandle{})
2018-05-23 18:08:46 +08:00
var _ = fs.HandleFlusher(&FileHandle{})
var _ = fs.HandleWriter(&FileHandle{})
var _ = fs.HandleReleaser(&FileHandle{})
func (fh *FileHandle) Read(ctx context.Context, req *fuse.ReadRequest, resp *fuse.ReadResponse) error {
2018-05-23 18:08:46 +08:00
2020-08-19 03:52:54 +08:00
glog.V(4).Infof("%s read fh %d: [%d,%d) size %d resp.Data cap=%d", fh.f.fullpath(), fh.handle, req.Offset, req.Offset+int64(req.Size), req.Size, cap(resp.Data))
fh.RLock()
defer fh.RUnlock()
if req.Size <= 0 {
return nil
}
2018-05-23 18:08:46 +08:00
2020-08-17 07:24:40 +08:00
buff := resp.Data[:cap(resp.Data)]
if req.Size > cap(resp.Data) {
// should not happen
buff = make([]byte, req.Size)
}
2020-02-26 14:23:59 +08:00
totalRead, err := fh.readFromChunks(buff, req.Offset)
2021-01-18 17:14:42 +08:00
if err == nil || err == io.EOF {
maxStop := fh.readFromDirtyPages(buff, req.Offset)
totalRead = max(maxStop-req.Offset, totalRead)
}
if err == io.EOF {
err = nil
}
if err != nil {
2020-08-31 12:01:44 +08:00
glog.Warningf("file handle read %s %d: %v", fh.f.fullpath(), totalRead, err)
2020-10-11 06:43:22 +08:00
return fuse.EIO
}
2020-08-18 07:04:56 +08:00
if totalRead > int64(len(buff)) {
glog.Warningf("%s FileHandle Read %d: [%d,%d) size %d totalRead %d", fh.f.fullpath(), fh.handle, req.Offset, req.Offset+int64(req.Size), req.Size, totalRead)
totalRead = min(int64(len(buff)), totalRead)
}
if err == nil {
resp.Data = buff[:totalRead]
}
2020-08-17 14:49:10 +08:00
return err
}
// readFromDirtyPages copies any unflushed data of this handle that overlaps
// buff (positioned at startOffset) into buff, by delegating to
// dirtyPages.ReadDirtyDataAt, and returns that call's result unchanged.
// Read subtracts its request offset from the returned maxStop to get a
// byte count.
func (fh *FileHandle) readFromDirtyPages(buff []byte, startOffset int64) (maxStop int64) {
	return fh.dirtyPages.ReadDirtyDataAt(buff, startOffset)
}
2020-02-26 14:23:59 +08:00
func (fh *FileHandle) readFromChunks(buff []byte, offset int64) (int64, error) {
2020-09-01 15:21:19 +08:00
fileSize := int64(filer.FileSize(fh.f.entry))
2020-08-16 15:49:08 +08:00
if fileSize == 0 {
2020-01-25 23:34:09 +08:00
glog.V(1).Infof("empty fh %v", fh.f.fullpath())
2020-08-16 15:49:08 +08:00
return 0, io.EOF
2018-05-23 18:08:46 +08:00
}
2020-11-30 20:34:04 +08:00
if offset+int64(len(buff)) <= int64(len(fh.f.entry.Content)) {
totalRead := copy(buff, fh.f.entry.Content[offset:])
glog.V(4).Infof("file handle read cached %s [%d,%d] %d", fh.f.fullpath(), offset, offset+int64(totalRead), totalRead)
return int64(totalRead), nil
}
var chunkResolveErr error
if fh.f.entryViewCache == nil {
2020-09-01 15:21:19 +08:00
fh.f.entryViewCache, chunkResolveErr = filer.NonOverlappingVisibleIntervals(filer.LookupFn(fh.f.wfs), fh.f.entry.Chunks)
if chunkResolveErr != nil {
return 0, fmt.Errorf("fail to resolve chunk manifest: %v", chunkResolveErr)
}
fh.f.reader = nil
}
if fh.f.reader == nil {
2020-09-01 15:21:19 +08:00
chunkViews := filer.ViewFromVisibleIntervals(fh.f.entryViewCache, 0, math.MaxInt64)
fh.f.reader = filer.NewChunkReaderAtFromClient(fh.f.wfs, chunkViews, fh.f.wfs.chunkCache, fileSize)
}
totalRead, err := fh.f.reader.ReadAt(buff, offset)
2020-10-25 11:12:04 +08:00
if err != nil && err != io.EOF {
2019-06-21 14:45:30 +08:00
glog.Errorf("file handle read %s: %v", fh.f.fullpath(), err)
}
2020-08-19 03:52:54 +08:00
glog.V(4).Infof("file handle read %s [%d,%d] %d : %v", fh.f.fullpath(), offset, offset+int64(totalRead), totalRead, err)
return int64(totalRead), err
2018-05-23 18:08:46 +08:00
}
// Write to the file handle
func (fh *FileHandle) Write(ctx context.Context, req *fuse.WriteRequest, resp *fuse.WriteResponse) error {
fh.Lock()
defer fh.Unlock()
2018-05-23 18:08:46 +08:00
// write the request to volume servers
2020-10-21 13:54:21 +08:00
data := req.Data
if len(data) <= 512 {
// fuse message cacheable size
data = make([]byte, len(req.Data))
copy(data, req.Data)
}
2020-11-30 20:34:04 +08:00
fh.f.entry.Content = nil
fh.f.entry.Attributes.FileSize = uint64(max(req.Offset+int64(len(data)), int64(fh.f.entry.Attributes.FileSize)))
2020-08-19 00:09:29 +08:00
glog.V(4).Infof("%v write [%d,%d) %d", fh.f.fullpath(), req.Offset, req.Offset+int64(len(req.Data)), len(req.Data))
2020-10-15 14:28:03 +08:00
fh.dirtyPages.AddPage(req.Offset, data)
2018-05-23 18:08:46 +08:00
resp.Size = len(data)
2018-05-23 18:08:46 +08:00
if req.Offset == 0 {
2019-03-28 05:25:18 +08:00
// detect mime type
2020-04-15 02:32:31 +08:00
fh.contentType = http.DetectContentType(data)
fh.f.dirtyMetadata = true
}
2020-10-15 14:28:03 +08:00
fh.f.dirtyMetadata = true
2018-05-23 18:08:46 +08:00
return nil
}
func (fh *FileHandle) Release(ctx context.Context, req *fuse.ReleaseRequest) error {
2020-08-16 10:55:28 +08:00
glog.V(4).Infof("Release %v fh %d", fh.f.fullpath(), fh.handle)
2018-06-06 17:09:57 +08:00
fh.Lock()
defer fh.Unlock()
fh.f.isOpen--
2018-12-28 19:27:48 +08:00
if fh.f.isOpen < 0 {
glog.V(0).Infof("Release reset %s open count %d => %d", fh.f.Name, fh.f.isOpen, 0)
fh.f.isOpen = 0
return nil
}
if fh.f.isOpen == 0 {
2020-10-16 02:01:43 +08:00
if err := fh.doFlush(ctx, req.Header); err != nil {
glog.Errorf("Release doFlush %s: %v", fh.f.Name, err)
}
// stop the goroutine
if !fh.dirtyPages.chunkSaveErrChanClosed {
fh.dirtyPages.chunkSaveErrChanClosed = true
close(fh.dirtyPages.chunkSaveErrChan)
}
fh.f.wfs.ReleaseHandle(fh.f.fullpath(), fuse.HandleID(fh.handle))
if closer, ok := fh.f.reader.(io.Closer); ok {
closer.Close()
}
2020-12-09 14:48:18 +08:00
fh.f.reader = nil
}
2018-05-23 18:08:46 +08:00
return nil
}
func (fh *FileHandle) Flush(ctx context.Context, req *fuse.FlushRequest) error {
fh.Lock()
defer fh.Unlock()
2020-08-19 16:27:10 +08:00
return fh.doFlush(ctx, req.Header)
}
func (fh *FileHandle) doFlush(ctx context.Context, header fuse.Header) error {
2020-10-15 14:28:03 +08:00
// flush works at fh level
2018-05-23 18:08:46 +08:00
// send the data to the OS
2020-08-30 02:56:22 +08:00
glog.V(4).Infof("doFlush %s fh %d", fh.f.fullpath(), fh.handle)
2018-05-23 18:08:46 +08:00
2020-10-15 14:28:03 +08:00
fh.dirtyPages.saveExistingPagesToStorage()
2019-01-06 07:16:39 +08:00
2020-10-15 14:28:03 +08:00
fh.dirtyPages.writeWaitGroup.Wait()
2020-10-21 17:16:21 +08:00
if fh.dirtyPages.lastErr != nil {
return fh.dirtyPages.lastErr
}
if !fh.f.dirtyMetadata {
2018-05-23 18:08:46 +08:00
return nil
}
2020-10-21 17:16:21 +08:00
err := fh.f.wfs.WithFilerClient(func(client filer_pb.SeaweedFilerClient) error {
2018-05-23 18:08:46 +08:00
if fh.f.entry.Attributes != nil {
fh.f.entry.Attributes.Mime = fh.contentType
if fh.f.entry.Attributes.Uid == 0 {
2020-08-19 16:27:10 +08:00
fh.f.entry.Attributes.Uid = header.Uid
}
if fh.f.entry.Attributes.Gid == 0 {
2020-08-19 16:27:10 +08:00
fh.f.entry.Attributes.Gid = header.Gid
}
if fh.f.entry.Attributes.Crtime == 0 {
fh.f.entry.Attributes.Crtime = time.Now().Unix()
}
fh.f.entry.Attributes.Mtime = time.Now().Unix()
2020-06-25 14:26:54 +08:00
fh.f.entry.Attributes.FileMode = uint32(os.FileMode(fh.f.entry.Attributes.FileMode) &^ fh.f.wfs.option.Umask)
fh.f.entry.Attributes.Collection = fh.dirtyPages.collection
fh.f.entry.Attributes.Replication = fh.dirtyPages.replication
}
request := &filer_pb.CreateEntryRequest{
Directory: fh.f.dir.FullPath(),
Entry: fh.f.entry,
Signatures: []int32{fh.f.wfs.signature},
2018-05-23 18:08:46 +08:00
}
2020-08-14 15:22:21 +08:00
glog.V(4).Infof("%s set chunks: %v", fh.f.fullpath(), len(fh.f.entry.Chunks))
2019-06-22 03:14:40 +08:00
for i, chunk := range fh.f.entry.Chunks {
2020-08-16 10:55:28 +08:00
glog.V(4).Infof("%s chunks %d: %v [%d,%d)", fh.f.fullpath(), i, chunk.GetFileIdString(), chunk.Offset, chunk.Offset+int64(chunk.Size))
2019-06-22 03:14:40 +08:00
}
2019-01-01 18:33:57 +08:00
2020-09-01 15:21:19 +08:00
manifestChunks, nonManifestChunks := filer.SeparateManifestChunks(fh.f.entry.Chunks)
2020-08-24 07:59:01 +08:00
2020-09-01 15:21:19 +08:00
chunks, _ := filer.CompactFileChunks(filer.LookupFn(fh.f.wfs), nonManifestChunks)
chunks, manifestErr := filer.MaybeManifestize(fh.f.wfs.saveDataAsChunk(fh.f.fullpath()), chunks)
if manifestErr != nil {
// not good, but should be ok
glog.V(0).Infof("MaybeManifestize: %v", manifestErr)
}
fh.f.entry.Chunks = append(chunks, manifestChunks...)
fh.f.wfs.mapPbIdFromLocalToFiler(request.Entry)
defer fh.f.wfs.mapPbIdFromFilerToLocal(request.Entry)
if err := filer_pb.CreateEntry(client, request); err != nil {
glog.Errorf("fh flush create %s: %v", fh.f.fullpath(), err)
return fmt.Errorf("fh flush create %s: %v", fh.f.fullpath(), err)
2018-05-23 18:08:46 +08:00
}
2020-09-01 15:21:19 +08:00
fh.f.wfs.metaCache.InsertEntry(context.Background(), filer.FromPbEntry(request.Directory, request.Entry))
2018-05-23 18:08:46 +08:00
return nil
})
if err == nil {
fh.f.dirtyMetadata = false
}
2020-01-24 17:41:31 +08:00
if err != nil {
glog.Errorf("%v fh %d flush: %v", fh.f.fullpath(), fh.handle, err)
return fuse.EIO
}
return nil
2018-05-23 18:08:46 +08:00
}