2021-03-31 12:07:34 +08:00
|
|
|
package weed_server
|
|
|
|
|
|
|
|
import (
|
2021-04-29 01:28:05 +08:00
|
|
|
"bytes"
|
2021-03-31 12:07:34 +08:00
|
|
|
"crypto/md5"
|
2022-02-22 00:15:00 +08:00
|
|
|
"fmt"
|
2021-03-31 12:07:34 +08:00
|
|
|
"hash"
|
|
|
|
"io"
|
|
|
|
"net/http"
|
2021-06-07 11:23:36 +08:00
|
|
|
"sort"
|
2022-02-22 00:15:00 +08:00
|
|
|
"strconv"
|
2021-03-31 12:07:34 +08:00
|
|
|
"strings"
|
2021-06-07 04:42:36 +08:00
|
|
|
"sync"
|
2021-06-07 14:05:17 +08:00
|
|
|
"sync/atomic"
|
2021-03-31 12:07:34 +08:00
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/filer"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/operation"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/pb/filer_pb"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/security"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/stats"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/util"
|
|
|
|
)
|
|
|
|
|
2021-06-07 04:42:36 +08:00
|
|
|
// bufPool recycles *bytes.Buffer values so that chunk uploads do not allocate
// a fresh buffer per chunk. Buffers taken from the pool may still hold data
// from a previous use; callers are expected to Reset them before reading into
// them.
var bufPool = sync.Pool{
	New: func() interface{} {
		return &bytes.Buffer{}
	},
}
|
|
|
|
|
2021-07-16 02:56:28 +08:00
|
|
|
func (fs *FilerServer) uploadReaderToChunks(w http.ResponseWriter, r *http.Request, reader io.Reader, chunkSize int32, fileName, contentType string, contentLength int64, so *operation.StorageOption) (fileChunks []*filer_pb.FileChunk, md5Hash hash.Hash, chunkOffset int64, uploadErr error, smallContent []byte) {
|
2022-02-22 00:15:00 +08:00
|
|
|
query := r.URL.Query()
|
|
|
|
|
2022-03-07 16:04:59 +08:00
|
|
|
isAppend := isAppend(r)
|
2022-02-22 00:15:00 +08:00
|
|
|
if query.Has("offset") {
|
|
|
|
offset := query.Get("offset")
|
|
|
|
offsetInt, err := strconv.ParseInt(offset, 10, 64)
|
|
|
|
if err != nil || offsetInt < 0 {
|
|
|
|
err = fmt.Errorf("invalid 'offset': '%s'", offset)
|
|
|
|
return nil, nil, 0, err, nil
|
|
|
|
}
|
2022-03-07 16:04:59 +08:00
|
|
|
if isAppend && offsetInt > 0 {
|
2022-02-22 00:15:00 +08:00
|
|
|
err = fmt.Errorf("cannot set offset when op=append")
|
|
|
|
return nil, nil, 0, err, nil
|
|
|
|
}
|
|
|
|
chunkOffset = offsetInt
|
|
|
|
}
|
2021-03-31 12:07:34 +08:00
|
|
|
|
2021-07-16 02:56:28 +08:00
|
|
|
md5Hash = md5.New()
|
2021-10-14 12:27:58 +08:00
|
|
|
var partReader = io.NopCloser(io.TeeReader(reader, md5Hash))
|
2021-03-31 12:07:34 +08:00
|
|
|
|
2021-06-07 11:23:36 +08:00
|
|
|
var wg sync.WaitGroup
|
2021-06-07 14:05:17 +08:00
|
|
|
var bytesBufferCounter int64
|
|
|
|
bytesBufferLimitCond := sync.NewCond(new(sync.Mutex))
|
2021-06-08 03:04:50 +08:00
|
|
|
var fileChunksLock sync.Mutex
|
2021-04-10 04:05:15 +08:00
|
|
|
for {
|
2021-06-07 11:23:36 +08:00
|
|
|
|
2021-06-07 14:05:17 +08:00
|
|
|
// need to throttle used byte buffer
|
|
|
|
bytesBufferLimitCond.L.Lock()
|
|
|
|
for atomic.LoadInt64(&bytesBufferCounter) >= 4 {
|
|
|
|
glog.V(4).Infof("waiting for byte buffer %d", bytesBufferCounter)
|
|
|
|
bytesBufferLimitCond.Wait()
|
|
|
|
}
|
|
|
|
atomic.AddInt64(&bytesBufferCounter, 1)
|
|
|
|
bytesBufferLimitCond.L.Unlock()
|
|
|
|
|
2021-06-07 11:23:36 +08:00
|
|
|
bytesBuffer := bufPool.Get().(*bytes.Buffer)
|
2021-06-07 14:05:17 +08:00
|
|
|
glog.V(4).Infof("received byte buffer %d", bytesBufferCounter)
|
2021-06-07 11:23:36 +08:00
|
|
|
|
2021-04-10 04:05:15 +08:00
|
|
|
limitedReader := io.LimitReader(partReader, int64(chunkSize))
|
2021-03-31 12:07:34 +08:00
|
|
|
|
2021-06-07 04:42:36 +08:00
|
|
|
bytesBuffer.Reset()
|
|
|
|
|
|
|
|
dataSize, err := bytesBuffer.ReadFrom(limitedReader)
|
|
|
|
|
2021-10-14 12:27:58 +08:00
|
|
|
// data, err := io.ReadAll(limitedReader)
|
2021-06-07 11:23:36 +08:00
|
|
|
if err != nil || dataSize == 0 {
|
2021-06-07 14:05:17 +08:00
|
|
|
bufPool.Put(bytesBuffer)
|
|
|
|
atomic.AddInt64(&bytesBufferCounter, -1)
|
|
|
|
bytesBufferLimitCond.Signal()
|
2022-03-10 11:40:39 +08:00
|
|
|
uploadErr = err
|
2021-07-16 02:56:28 +08:00
|
|
|
break
|
2021-03-31 12:07:34 +08:00
|
|
|
}
|
2022-03-07 16:04:59 +08:00
|
|
|
if chunkOffset == 0 && !isAppend {
|
2021-07-09 17:33:14 +08:00
|
|
|
if dataSize < fs.option.SaveToFilerLimit || strings.HasPrefix(r.URL.Path, filer.DirectoryEtcRoot) {
|
2021-06-07 04:42:36 +08:00
|
|
|
chunkOffset += dataSize
|
|
|
|
smallContent = make([]byte, dataSize)
|
2021-06-07 11:57:03 +08:00
|
|
|
bytesBuffer.Read(smallContent)
|
2021-06-07 14:05:17 +08:00
|
|
|
bufPool.Put(bytesBuffer)
|
|
|
|
atomic.AddInt64(&bytesBufferCounter, -1)
|
|
|
|
bytesBufferLimitCond.Signal()
|
2021-04-10 04:05:15 +08:00
|
|
|
break
|
2021-04-01 17:21:40 +08:00
|
|
|
}
|
2021-04-10 04:05:15 +08:00
|
|
|
}
|
2021-03-31 12:07:34 +08:00
|
|
|
|
2021-06-07 11:23:36 +08:00
|
|
|
wg.Add(1)
|
|
|
|
go func(offset int64) {
|
2021-06-07 14:05:17 +08:00
|
|
|
defer func() {
|
|
|
|
bufPool.Put(bytesBuffer)
|
|
|
|
atomic.AddInt64(&bytesBufferCounter, -1)
|
|
|
|
bytesBufferLimitCond.Signal()
|
|
|
|
wg.Done()
|
|
|
|
}()
|
2021-03-31 12:07:34 +08:00
|
|
|
|
2021-06-07 13:16:32 +08:00
|
|
|
chunk, toChunkErr := fs.dataToChunk(fileName, contentType, bytesBuffer.Bytes(), offset, so)
|
2021-06-07 11:23:36 +08:00
|
|
|
if toChunkErr != nil {
|
|
|
|
uploadErr = toChunkErr
|
|
|
|
}
|
|
|
|
if chunk != nil {
|
2021-06-08 03:04:50 +08:00
|
|
|
fileChunksLock.Lock()
|
2021-06-07 11:23:36 +08:00
|
|
|
fileChunks = append(fileChunks, chunk)
|
2021-06-08 03:04:50 +08:00
|
|
|
fileChunksLock.Unlock()
|
2021-06-07 11:23:36 +08:00
|
|
|
glog.V(4).Infof("uploaded %s chunk %d to %s [%d,%d)", fileName, len(fileChunks), chunk.FileId, offset, offset+int64(chunk.Size))
|
|
|
|
}
|
|
|
|
}(chunkOffset)
|
2021-03-31 12:07:34 +08:00
|
|
|
|
2021-04-10 04:05:15 +08:00
|
|
|
// reset variables for the next chunk
|
2021-06-07 11:23:36 +08:00
|
|
|
chunkOffset = chunkOffset + dataSize
|
2021-03-31 12:07:34 +08:00
|
|
|
|
2021-04-10 04:05:15 +08:00
|
|
|
// if last chunk was not at full chunk size, but already exhausted the reader
|
2021-06-07 11:23:36 +08:00
|
|
|
if dataSize < int64(chunkSize) {
|
2021-04-10 04:05:15 +08:00
|
|
|
break
|
2021-04-01 17:21:40 +08:00
|
|
|
}
|
|
|
|
}
|
2021-04-10 04:05:15 +08:00
|
|
|
|
2021-06-07 11:23:36 +08:00
|
|
|
wg.Wait()
|
|
|
|
|
|
|
|
if uploadErr != nil {
|
2022-03-10 11:40:39 +08:00
|
|
|
fs.filer.DeleteChunks(fileChunks)
|
2021-06-07 11:23:36 +08:00
|
|
|
return nil, md5Hash, 0, uploadErr, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
sort.Slice(fileChunks, func(i, j int) bool {
|
|
|
|
return fileChunks[i].Offset < fileChunks[j].Offset
|
|
|
|
})
|
|
|
|
|
2021-04-10 04:05:15 +08:00
|
|
|
return fileChunks, md5Hash, chunkOffset, nil, smallContent
|
2021-03-31 12:07:34 +08:00
|
|
|
}
|
|
|
|
|
2021-06-07 09:43:04 +08:00
|
|
|
func (fs *FilerServer) doUpload(urlLocation string, limitedReader io.Reader, fileName string, contentType string, pairMap map[string]string, auth security.EncodedJwt) (*operation.UploadResult, error, []byte) {
|
2021-03-31 12:07:34 +08:00
|
|
|
|
|
|
|
stats.FilerRequestCounter.WithLabelValues("chunkUpload").Inc()
|
|
|
|
start := time.Now()
|
|
|
|
defer func() {
|
|
|
|
stats.FilerRequestHistogram.WithLabelValues("chunkUpload").Observe(time.Since(start).Seconds())
|
|
|
|
}()
|
|
|
|
|
2021-09-07 07:20:49 +08:00
|
|
|
uploadOption := &operation.UploadOption{
|
|
|
|
UploadUrl: urlLocation,
|
|
|
|
Filename: fileName,
|
|
|
|
Cipher: fs.option.Cipher,
|
|
|
|
IsInputCompressed: false,
|
|
|
|
MimeType: contentType,
|
|
|
|
PairMap: pairMap,
|
|
|
|
Jwt: auth,
|
|
|
|
}
|
|
|
|
uploadResult, err, data := operation.Upload(limitedReader, uploadOption)
|
2021-03-31 12:07:34 +08:00
|
|
|
if uploadResult != nil && uploadResult.RetryCount > 0 {
|
|
|
|
stats.FilerRequestCounter.WithLabelValues("chunkUploadRetry").Add(float64(uploadResult.RetryCount))
|
|
|
|
}
|
|
|
|
return uploadResult, err, data
|
|
|
|
}
|
2021-06-07 09:43:04 +08:00
|
|
|
|
2021-06-07 13:16:32 +08:00
|
|
|
func (fs *FilerServer) dataToChunk(fileName, contentType string, data []byte, chunkOffset int64, so *operation.StorageOption) (*filer_pb.FileChunk, error) {
|
2021-06-07 09:43:04 +08:00
|
|
|
dataReader := util.NewBytesReader(data)
|
|
|
|
|
|
|
|
// retry to assign a different file id
|
|
|
|
var fileId, urlLocation string
|
|
|
|
var auth security.EncodedJwt
|
|
|
|
var uploadErr error
|
|
|
|
var uploadResult *operation.UploadResult
|
|
|
|
for i := 0; i < 3; i++ {
|
|
|
|
// assign one file id for one chunk
|
|
|
|
fileId, urlLocation, auth, uploadErr = fs.assignNewFileInfo(so)
|
|
|
|
if uploadErr != nil {
|
|
|
|
glog.V(4).Infof("retry later due to assign error: %v", uploadErr)
|
|
|
|
time.Sleep(time.Duration(i+1) * 251 * time.Millisecond)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
// upload the chunk to the volume server
|
|
|
|
uploadResult, uploadErr, _ = fs.doUpload(urlLocation, dataReader, fileName, contentType, nil, auth)
|
|
|
|
if uploadErr != nil {
|
|
|
|
glog.V(4).Infof("retry later due to upload error: %v", uploadErr)
|
|
|
|
time.Sleep(time.Duration(i+1) * 251 * time.Millisecond)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
break
|
|
|
|
}
|
|
|
|
if uploadErr != nil {
|
|
|
|
glog.Errorf("upload error: %v", uploadErr)
|
|
|
|
return nil, uploadErr
|
|
|
|
}
|
|
|
|
|
|
|
|
// if last chunk exhausted the reader exactly at the border
|
|
|
|
if uploadResult.Size == 0 {
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
return uploadResult.ToPbFileChunk(fileId, chunkOffset), nil
|
|
|
|
}
|