seaweedfs/weed/storage/disk_location.go

456 lines
11 KiB
Go
Raw Normal View History

2016-04-27 11:10:26 +08:00
package storage
import (
2020-06-06 06:27:10 +08:00
"fmt"
"os"
"path/filepath"
2022-07-12 16:19:33 +08:00
"runtime"
"strconv"
2020-06-06 06:27:10 +08:00
"strings"
"sync"
"time"
2016-04-27 11:10:26 +08:00
2022-05-16 10:41:18 +08:00
"github.com/google/uuid"
"github.com/seaweedfs/seaweedfs/weed/glog"
"github.com/seaweedfs/seaweedfs/weed/stats"
"github.com/seaweedfs/seaweedfs/weed/storage/erasure_coding"
"github.com/seaweedfs/seaweedfs/weed/storage/needle"
"github.com/seaweedfs/seaweedfs/weed/storage/types"
"github.com/seaweedfs/seaweedfs/weed/util"
2016-04-27 11:10:26 +08:00
)
type DiskLocation struct {
Directory string
DirectoryUuid string
IdxDirectory string
2021-02-16 18:47:02 +08:00
DiskType types.DiskType
MaxVolumeCount int32
OriginalMaxVolumeCount int32
2021-04-27 10:37:24 +08:00
MinFreeSpace util.MinFreeSpace
volumes map[needle.VolumeId]*Volume
volumesLock sync.RWMutex
// erasure coding
2019-05-28 12:40:51 +08:00
ecVolumes map[needle.VolumeId]*erasure_coding.EcVolume
ecVolumesLock sync.RWMutex
2020-07-04 07:34:31 +08:00
isDiskSpaceLow bool
closeCh chan struct{}
2016-04-27 11:10:26 +08:00
}
func GenerateDirUuid(dir string) (dirUuidString string, err error) {
glog.V(1).Infof("Getting uuid of volume directory:%s", dir)
dirUuidString = ""
fileName := dir + "/vol_dir.uuid"
2022-05-16 10:41:18 +08:00
if !util.FileExists(fileName) {
dirUuid, _ := uuid.NewRandom()
dirUuidString = dirUuid.String()
writeErr := util.WriteFile(fileName, []byte(dirUuidString), 0644)
2022-05-16 10:41:18 +08:00
if writeErr != nil {
return "", fmt.Errorf("failed to write uuid to %s : %v", fileName, writeErr)
2022-05-16 10:41:18 +08:00
}
} else {
uuidData, readErr := os.ReadFile(fileName)
if readErr != nil {
return "", fmt.Errorf("failed to read uuid from %s : %v", fileName, readErr)
2022-05-16 10:41:18 +08:00
}
dirUuidString = string(uuidData)
2022-05-16 10:41:18 +08:00
}
return dirUuidString, nil
2022-05-16 10:41:18 +08:00
}
func NewDiskLocation(dir string, maxVolumeCount int32, minFreeSpace util.MinFreeSpace, idxDir string, diskType types.DiskType) *DiskLocation {
dir = util.ResolvePath(dir)
if idxDir == "" {
idxDir = dir
} else {
idxDir = util.ResolvePath(idxDir)
}
dirUuid, err := GenerateDirUuid(dir)
if err != nil {
glog.Fatalf("cannot generate uuid of dir %s: %v", dir, err)
}
location := &DiskLocation{
2020-11-27 07:08:05 +08:00
Directory: dir,
DirectoryUuid: dirUuid,
2020-11-27 07:08:05 +08:00
IdxDirectory: idxDir,
2020-12-17 01:14:05 +08:00
DiskType: diskType,
2020-11-27 07:08:05 +08:00
MaxVolumeCount: maxVolumeCount,
OriginalMaxVolumeCount: maxVolumeCount,
MinFreeSpace: minFreeSpace,
}
2019-04-19 12:43:36 +08:00
location.volumes = make(map[needle.VolumeId]*Volume)
2019-05-28 12:40:51 +08:00
location.ecVolumes = make(map[needle.VolumeId]*erasure_coding.EcVolume)
location.closeCh = make(chan struct{})
go func() {
location.CheckDiskSpace()
for {
select {
case <-location.closeCh:
return
case <-time.After(time.Minute):
location.CheckDiskSpace()
}
}
}()
2016-04-27 11:45:35 +08:00
return location
2016-04-27 11:10:26 +08:00
}
2020-11-27 09:21:55 +08:00
func volumeIdFromFileName(filename string) (needle.VolumeId, string, error) {
if isValidVolume(filename) {
base := filename[:len(filename)-4]
collection, volumeId, err := parseCollectionVolumeId(base)
return volumeId, collection, err
}
2020-11-27 07:19:43 +08:00
return 0, "", fmt.Errorf("file is not a volume: %s", filename)
}
// parseCollectionVolumeId splits base at its last underscore into a
// collection name and a volume id. When there is no underscore, or the only
// underscore is the first character, the collection is empty and the whole
// of base is parsed as the id.
func parseCollectionVolumeId(base string) (collection string, vid needle.VolumeId, err error) {
	idPart := base
	if sep := strings.LastIndex(base, "_"); sep > 0 {
		collection = base[:sep]
		idPart = base[sep+1:]
	}
	vid, err = needle.NewVolumeId(idPart)
	return collection, vid, err
}
// isValidVolume reports whether basename ends with one of the extensions
// that mark a volume file: ".idx" or ".vif".
func isValidVolume(basename string) bool {
	for _, ext := range [...]string{".idx", ".vif"} {
		if strings.HasSuffix(basename, ext) {
			return true
		}
	}
	return false
}
// getValidVolumeName returns basename without its volume extension, or the
// empty string when basename is not accepted by isValidVolume.
func getValidVolumeName(basename string) string {
	if !isValidVolume(basename) {
		return ""
	}
	// Both accepted extensions (".idx", ".vif") are four bytes long.
	const extLen = 4
	return basename[:len(basename)-extLen]
}
func (l *DiskLocation) loadExistingVolume(dirEntry os.DirEntry, needleMapKind NeedleMapKind, skipIfEcVolumesExists bool, ldbTimeout int64) bool {
basename := dirEntry.Name()
if dirEntry.IsDir() {
2020-11-27 07:08:05 +08:00
return false
}
volumeName := getValidVolumeName(basename)
if volumeName == "" {
2020-11-27 07:08:05 +08:00
return false
}
2020-11-27 09:21:55 +08:00
// skip if ec volumes exists
if skipIfEcVolumesExists {
if util.FileExists(l.Directory + "/" + volumeName + ".ecx") {
return false
}
}
2020-11-27 09:21:55 +08:00
// check for incomplete volume
2020-11-27 07:19:43 +08:00
noteFile := l.Directory + "/" + volumeName + ".note"
2020-11-27 07:08:05 +08:00
if util.FileExists(noteFile) {
note, _ := os.ReadFile(noteFile)
2020-11-27 07:19:43 +08:00
glog.Warningf("volume %s was not completed: %s", volumeName, string(note))
removeVolumeFiles(l.Directory + "/" + volumeName)
removeVolumeFiles(l.IdxDirectory + "/" + volumeName)
2020-11-27 07:08:05 +08:00
return false
}
2020-11-27 09:21:55 +08:00
// parse out collection, volume id
vid, collection, err := volumeIdFromFileName(basename)
2020-11-27 07:08:05 +08:00
if err != nil {
2020-11-27 07:19:43 +08:00
glog.Warningf("get volume id failed, %s, err : %s", volumeName, err)
2020-11-27 07:08:05 +08:00
return false
}
2020-02-13 15:19:00 +08:00
2020-11-27 09:21:55 +08:00
// avoid loading one volume more than once
l.volumesLock.RLock()
_, found := l.volumes[vid]
l.volumesLock.RUnlock()
if found {
2020-11-27 07:08:05 +08:00
glog.V(1).Infof("loaded volume, %v", vid)
return true
}
2020-02-13 15:19:00 +08:00
2020-11-27 09:21:55 +08:00
// load the volume
v, e := NewVolume(l.Directory, l.IdxDirectory, collection, vid, needleMapKind, nil, nil, 0, 0, ldbTimeout)
2020-11-27 07:08:05 +08:00
if e != nil {
2020-11-27 07:19:43 +08:00
glog.V(0).Infof("new volume %s error %s", volumeName, e)
2020-11-27 07:08:05 +08:00
return false
}
2020-12-17 01:14:05 +08:00
2020-11-27 07:08:05 +08:00
l.SetVolume(vid, v)
2023-10-03 23:15:18 +08:00
stats.VolumeServerVolumeCounter.WithLabelValues(v.Collection, "volume", v.DiskType().ReadableString()).Inc()
2020-07-04 07:34:31 +08:00
2020-11-27 07:08:05 +08:00
size, _, _ := v.FileStat()
2021-04-16 02:29:58 +08:00
glog.V(0).Infof("data file %s, replication=%s v=%d size=%d ttl=%s",
2020-11-27 07:19:43 +08:00
l.Directory+"/"+volumeName+".dat", v.ReplicaPlacement, v.Version(), size, v.Ttl.String())
2020-11-27 07:08:05 +08:00
return true
2016-11-13 13:24:52 +08:00
}
2016-04-27 11:45:35 +08:00
func (l *DiskLocation) concurrentLoadingVolumes(needleMapKind NeedleMapKind, concurrency int, ldbTimeout int64) {
2016-11-13 13:24:52 +08:00
task_queue := make(chan os.DirEntry, 10*concurrency)
2016-11-11 11:53:22 +08:00
go func() {
foundVolumeNames := make(map[string]bool)
if dirEntries, err := os.ReadDir(l.Directory); err == nil {
for _, entry := range dirEntries {
volumeName := getValidVolumeName(entry.Name())
if volumeName == "" {
continue
}
if _, found := foundVolumeNames[volumeName]; !found {
foundVolumeNames[volumeName] = true
task_queue <- entry
}
2016-11-11 11:53:22 +08:00
}
}
close(task_queue)
}()
var wg sync.WaitGroup
for workerNum := 0; workerNum < concurrency; workerNum++ {
wg.Add(1)
go func() {
defer wg.Done()
2020-11-27 07:08:05 +08:00
for fi := range task_queue {
_ = l.loadExistingVolume(fi, needleMapKind, true, ldbTimeout)
2016-04-27 11:10:26 +08:00
}
2016-11-11 11:53:22 +08:00
}()
2016-04-27 11:10:26 +08:00
}
2016-11-11 11:53:22 +08:00
wg.Wait()
2016-11-13 13:24:52 +08:00
}
func (l *DiskLocation) loadExistingVolumes(needleMapKind NeedleMapKind, ldbTimeout int64) {
2016-11-13 13:24:52 +08:00
2022-07-12 16:19:33 +08:00
workerNum := runtime.NumCPU()
val, ok := os.LookupEnv("GOMAXPROCS")
if ok {
num, err := strconv.Atoi(val)
if err != nil || num < 1 {
num = 10
glog.Warningf("failed to set worker number from GOMAXPROCS , set to default:10")
}
workerNum = num
} else {
if workerNum <= 10 {
workerNum = 10
}
2022-07-12 16:19:33 +08:00
}
l.concurrentLoadingVolumes(needleMapKind, workerNum, ldbTimeout)
glog.V(0).Infof("Store started on dir: %s with %d volumes max %d", l.Directory, len(l.volumes), l.MaxVolumeCount)
l.loadAllEcShards()
2019-05-28 12:40:51 +08:00
glog.V(0).Infof("Store started on dir: %s with %d ec shards", l.Directory, len(l.ecVolumes))
2016-11-13 13:24:52 +08:00
2016-04-27 11:10:26 +08:00
}
2016-04-27 11:45:35 +08:00
func (l *DiskLocation) DeleteCollectionFromDiskLocation(collection string) (e error) {
2019-12-03 12:49:50 +08:00
l.volumesLock.Lock()
delVolsMap := l.unmountVolumeByCollection(collection)
2019-12-03 12:49:50 +08:00
l.volumesLock.Unlock()
2019-05-31 00:47:54 +08:00
l.ecVolumesLock.Lock()
delEcVolsMap := l.unmountEcVolumeByCollection(collection)
l.ecVolumesLock.Unlock()
errChain := make(chan error, 2)
var wg sync.WaitGroup
wg.Add(2)
go func() {
for _, v := range delVolsMap {
if err := v.Destroy(false); err != nil {
errChain <- err
2016-04-27 11:45:35 +08:00
}
}
wg.Done()
}()
go func() {
for _, v := range delEcVolsMap {
v.Destroy()
}
wg.Done()
}()
go func() {
wg.Wait()
close(errChain)
}()
errBuilder := strings.Builder{}
for err := range errChain {
errBuilder.WriteString(err.Error())
errBuilder.WriteString("; ")
2016-04-27 11:45:35 +08:00
}
if errBuilder.Len() > 0 {
e = fmt.Errorf(errBuilder.String())
}
2016-04-27 11:45:35 +08:00
return
}
func (l *DiskLocation) deleteVolumeById(vid needle.VolumeId, onlyEmpty bool) (found bool, e error) {
2016-04-27 11:45:35 +08:00
v, ok := l.volumes[vid]
if !ok {
return
}
e = v.Destroy(onlyEmpty)
2016-04-27 11:45:35 +08:00
if e != nil {
return
}
found = true
2016-04-27 11:45:35 +08:00
delete(l.volumes, vid)
return
}
// LoadVolume looks for a file of volume vid in Directory and, when one is
// found, loads the volume. It reports whether the volume is loaded afterwards.
// Unlike the startup scan, it does not skip volumes that have a ".ecx" file.
func (l *DiskLocation) LoadVolume(vid needle.VolumeId, needleMapKind NeedleMapKind) bool {
	entry, found := l.LocateVolume(vid)
	if !found {
		return false
	}
	return l.loadExistingVolume(entry, needleMapKind, false, 0)
}
// ErrVolumeNotFound is returned by DeleteVolume and UnloadVolume when the
// requested volume is not registered on the disk location.
var (
	ErrVolumeNotFound = fmt.Errorf("volume not found")
)
func (l *DiskLocation) DeleteVolume(vid needle.VolumeId, onlyEmpty bool) error {
2019-12-03 12:49:50 +08:00
l.volumesLock.Lock()
defer l.volumesLock.Unlock()
2017-01-21 02:18:43 +08:00
_, ok := l.volumes[vid]
if !ok {
return ErrVolumeNotFound
}
_, err := l.deleteVolumeById(vid, onlyEmpty)
return err
}
2019-04-19 12:43:36 +08:00
func (l *DiskLocation) UnloadVolume(vid needle.VolumeId) error {
2019-12-03 12:49:50 +08:00
l.volumesLock.Lock()
defer l.volumesLock.Unlock()
2017-01-21 02:18:43 +08:00
v, ok := l.volumes[vid]
if !ok {
return ErrVolumeNotFound
}
v.Close()
delete(l.volumes, vid)
return nil
}
// unmountVolumeByCollection removes from the volumes map every volume of
// collectionName that is neither compacting nor committing a compaction, and
// returns the removed volumes keyed by id. It does no locking of its own;
// DeleteCollectionFromDiskLocation calls it while holding volumesLock.
func (l *DiskLocation) unmountVolumeByCollection(collectionName string) map[needle.VolumeId]*Volume {
	removed := make(map[needle.VolumeId]*Volume)
	for vid, volume := range l.volumes {
		if volume.Collection != collectionName || volume.isCompacting || volume.isCommitCompacting {
			continue
		}
		removed[vid] = volume
		// Deleting the current key while ranging over a map is safe in Go.
		delete(l.volumes, vid)
	}
	return removed
}
2019-04-19 12:43:36 +08:00
func (l *DiskLocation) SetVolume(vid needle.VolumeId, volume *Volume) {
2019-12-03 12:49:50 +08:00
l.volumesLock.Lock()
defer l.volumesLock.Unlock()
l.volumes[vid] = volume
2020-07-04 07:34:31 +08:00
volume.location = l
}
2019-04-19 12:43:36 +08:00
func (l *DiskLocation) FindVolume(vid needle.VolumeId) (*Volume, bool) {
2019-12-03 12:49:50 +08:00
l.volumesLock.RLock()
defer l.volumesLock.RUnlock()
v, ok := l.volumes[vid]
return v, ok
}
func (l *DiskLocation) VolumesLen() int {
2019-12-03 12:49:50 +08:00
l.volumesLock.RLock()
defer l.volumesLock.RUnlock()
return len(l.volumes)
}
2022-02-17 01:11:34 +08:00
func (l *DiskLocation) SetStopping() {
l.volumesLock.Lock()
for _, v := range l.volumes {
v.SyncToDisk()
2022-02-17 01:11:34 +08:00
}
l.volumesLock.Unlock()
return
}
func (l *DiskLocation) Close() {
2019-12-03 12:49:50 +08:00
l.volumesLock.Lock()
for _, v := range l.volumes {
v.Close()
}
2019-12-03 12:49:50 +08:00
l.volumesLock.Unlock()
2019-05-28 12:40:51 +08:00
l.ecVolumesLock.Lock()
2019-06-06 14:20:26 +08:00
for _, ecVolume := range l.ecVolumes {
ecVolume.Close()
}
2019-05-28 12:40:51 +08:00
l.ecVolumesLock.Unlock()
close(l.closeCh)
return
}
// LocateVolume scans Directory for a volume file whose name encodes vid and
// returns the first matching directory entry. It returns (nil, false) when
// the directory cannot be read or no entry matches.
func (l *DiskLocation) LocateVolume(vid needle.VolumeId) (os.DirEntry, bool) {
	dirEntries, err := os.ReadDir(l.Directory)
	if err != nil {
		return nil, false
	}
	for _, entry := range dirEntries {
		// Entries that are not volume files yield an error and are skipped.
		if volId, _, parseErr := volumeIdFromFileName(entry.Name()); parseErr == nil && volId == vid {
			return entry, true
		}
	}
	return nil, false
}
// UnUsedSpace sums, over every volume that is not read-only, the difference
// between volumeSizeLimit and the volume's combined data and index file size.
// The volumes map is read under a read lock on volumesLock.
//
// NOTE(review): the subtraction is unsigned, so a volume whose files exceed
// volumeSizeLimit wraps around instead of contributing zero — confirm that
// callers expect this before changing it.
func (l *DiskLocation) UnUsedSpace(volumeSizeLimit uint64) (unUsedSpace uint64) {
	l.volumesLock.RLock()
	defer l.volumesLock.RUnlock()

	for _, vol := range l.volumes {
		if !vol.IsReadOnly() {
			datSize, idxSize, _ := vol.FileStat()
			unUsedSpace += volumeSizeLimit - (datSize + idxSize)
		}
	}
	return unUsedSpace
}
func (l *DiskLocation) CheckDiskSpace() {
if dir, e := filepath.Abs(l.Directory); e == nil {
s := stats.NewDiskStatus(dir)
stats.VolumeServerResourceGauge.WithLabelValues(l.Directory, "all").Set(float64(s.All))
stats.VolumeServerResourceGauge.WithLabelValues(l.Directory, "used").Set(float64(s.Used))
stats.VolumeServerResourceGauge.WithLabelValues(l.Directory, "free").Set(float64(s.Free))
isLow, desc := l.MinFreeSpace.IsLow(s.Free, s.PercentFree)
if isLow != l.isDiskSpaceLow {
l.isDiskSpaceLow = !l.isDiskSpaceLow
}
logLevel := glog.Level(4)
if l.isDiskSpaceLow {
logLevel = glog.Level(0)
}
glog.V(logLevel).Infof("dir %s %s", dir, desc)
}
2020-06-06 06:27:10 +08:00
}