2012-11-07 17:51:43 +08:00
|
|
|
package topology
|
|
|
|
|
|
|
|
import (
|
2018-10-15 14:12:43 +08:00
|
|
|
"context"
|
2021-09-13 13:47:52 +08:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/pb"
|
2021-10-24 16:55:34 +08:00
|
|
|
"io"
|
2019-07-22 12:49:10 +08:00
|
|
|
"sync/atomic"
|
2012-11-07 17:51:43 +08:00
|
|
|
"time"
|
2014-10-27 02:34:55 +08:00
|
|
|
|
2019-04-19 12:43:36 +08:00
|
|
|
"google.golang.org/grpc"
|
|
|
|
|
2020-03-14 06:41:24 +08:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/storage/needle"
|
|
|
|
|
2016-06-03 09:09:14 +08:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
2018-10-15 14:12:43 +08:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/operation"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/pb/volume_server_pb"
|
2012-11-07 17:51:43 +08:00
|
|
|
)
|
|
|
|
|
2021-02-23 04:52:37 +08:00
|
|
|
func (t *Topology) batchVacuumVolumeCheck(grpcDialOption grpc.DialOption, vid needle.VolumeId,
|
2019-12-01 23:29:41 +08:00
|
|
|
locationlist *VolumeLocationList, garbageThreshold float64) (*VolumeLocationList, bool) {
|
|
|
|
ch := make(chan int, locationlist.Length())
|
|
|
|
errCount := int32(0)
|
2012-11-24 09:03:27 +08:00
|
|
|
for index, dn := range locationlist.list {
|
2021-09-13 13:47:52 +08:00
|
|
|
go func(index int, url pb.ServerAddress, vid needle.VolumeId) {
|
2021-12-26 16:15:03 +08:00
|
|
|
err := operation.WithVolumeServerClient(true, url, grpcDialOption, func(volumeServerClient volume_server_pb.VolumeServerClient) error {
|
2020-02-26 13:50:12 +08:00
|
|
|
resp, err := volumeServerClient.VacuumVolumeCheck(context.Background(), &volume_server_pb.VacuumVolumeCheckRequest{
|
2019-03-24 02:33:34 +08:00
|
|
|
VolumeId: uint32(vid),
|
2018-10-15 14:12:43 +08:00
|
|
|
})
|
|
|
|
if err != nil {
|
2019-12-01 23:29:41 +08:00
|
|
|
atomic.AddInt32(&errCount, 1)
|
|
|
|
ch <- -1
|
2018-10-15 14:12:43 +08:00
|
|
|
return err
|
|
|
|
}
|
2019-12-01 23:29:41 +08:00
|
|
|
if resp.GarbageRatio >= garbageThreshold {
|
|
|
|
ch <- index
|
|
|
|
} else {
|
|
|
|
ch <- -1
|
|
|
|
}
|
2018-10-15 14:12:43 +08:00
|
|
|
return nil
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
glog.V(0).Infof("Checking vacuuming %d on %s: %v", vid, url, err)
|
2012-11-24 09:03:27 +08:00
|
|
|
}
|
2021-09-13 13:47:52 +08:00
|
|
|
}(index, dn.ServerAddress(), vid)
|
2012-11-24 09:03:27 +08:00
|
|
|
}
|
2019-12-01 23:29:41 +08:00
|
|
|
vacuumLocationList := NewVolumeLocationList()
|
2020-10-20 05:24:57 +08:00
|
|
|
|
2021-02-23 04:52:37 +08:00
|
|
|
waitTimeout := time.NewTimer(time.Minute * time.Duration(t.volumeSizeLimit/1024/1024/1000+1))
|
2020-10-20 05:24:57 +08:00
|
|
|
defer waitTimeout.Stop()
|
|
|
|
|
2019-11-20 08:24:58 +08:00
|
|
|
for range locationlist.list {
|
2012-11-24 09:03:27 +08:00
|
|
|
select {
|
2019-12-01 23:29:41 +08:00
|
|
|
case index := <-ch:
|
|
|
|
if index != -1 {
|
|
|
|
vacuumLocationList.list = append(vacuumLocationList.list, locationlist.list[index])
|
|
|
|
}
|
2020-10-20 05:24:57 +08:00
|
|
|
case <-waitTimeout.C:
|
2019-12-01 23:29:41 +08:00
|
|
|
return vacuumLocationList, false
|
2012-11-24 09:03:27 +08:00
|
|
|
}
|
|
|
|
}
|
2019-12-01 23:29:41 +08:00
|
|
|
return vacuumLocationList, errCount == 0 && len(vacuumLocationList.list) > 0
|
2012-11-24 09:03:27 +08:00
|
|
|
}
|
2021-02-23 04:52:37 +08:00
|
|
|
func (t *Topology) batchVacuumVolumeCompact(grpcDialOption grpc.DialOption, vl *VolumeLayout, vid needle.VolumeId,
|
2019-12-01 23:29:41 +08:00
|
|
|
locationlist *VolumeLocationList, preallocate int64) bool {
|
2019-07-22 04:49:09 +08:00
|
|
|
vl.accessLock.Lock()
|
2012-11-24 09:03:27 +08:00
|
|
|
vl.removeFromWritable(vid)
|
2019-07-22 04:49:09 +08:00
|
|
|
vl.accessLock.Unlock()
|
|
|
|
|
2012-11-24 09:03:27 +08:00
|
|
|
ch := make(chan bool, locationlist.Length())
|
|
|
|
for index, dn := range locationlist.list {
|
2021-09-13 13:47:52 +08:00
|
|
|
go func(index int, url pb.ServerAddress, vid needle.VolumeId) {
|
2013-08-09 14:57:22 +08:00
|
|
|
glog.V(0).Infoln(index, "Start vacuuming", vid, "on", url)
|
2021-12-26 16:15:03 +08:00
|
|
|
err := operation.WithVolumeServerClient(true, url, grpcDialOption, func(volumeServerClient volume_server_pb.VolumeServerClient) error {
|
2021-10-24 16:55:34 +08:00
|
|
|
stream, err := volumeServerClient.VacuumVolumeCompact(context.Background(), &volume_server_pb.VacuumVolumeCompactRequest{
|
2020-03-14 07:17:44 +08:00
|
|
|
VolumeId: uint32(vid),
|
|
|
|
Preallocate: preallocate,
|
2018-10-15 14:12:43 +08:00
|
|
|
})
|
2021-10-24 16:55:34 +08:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
for {
|
|
|
|
resp, recvErr := stream.Recv()
|
|
|
|
if recvErr != nil {
|
|
|
|
if recvErr == io.EOF {
|
|
|
|
break
|
|
|
|
} else {
|
|
|
|
return recvErr
|
|
|
|
}
|
|
|
|
}
|
|
|
|
glog.V(0).Infof("%d vacuum %d on %s processed %d bytes", index, vid, url, resp.ProcessedBytes)
|
|
|
|
}
|
|
|
|
return nil
|
2018-10-15 14:12:43 +08:00
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("Error when vacuuming %d on %s: %v", vid, url, err)
|
2012-11-24 09:03:27 +08:00
|
|
|
ch <- false
|
|
|
|
} else {
|
2018-10-15 14:12:43 +08:00
|
|
|
glog.V(0).Infof("Complete vacuuming %d on %s", vid, url)
|
2012-11-24 09:03:27 +08:00
|
|
|
ch <- true
|
|
|
|
}
|
2021-09-13 13:47:52 +08:00
|
|
|
}(index, dn.ServerAddress(), vid)
|
2012-11-24 09:03:27 +08:00
|
|
|
}
|
|
|
|
isVacuumSuccess := true
|
2020-10-20 05:24:57 +08:00
|
|
|
|
2021-02-23 04:52:37 +08:00
|
|
|
waitTimeout := time.NewTimer(3 * time.Minute * time.Duration(t.volumeSizeLimit/1024/1024/1000+1))
|
2020-10-20 05:24:57 +08:00
|
|
|
defer waitTimeout.Stop()
|
|
|
|
|
2019-11-20 08:24:58 +08:00
|
|
|
for range locationlist.list {
|
2012-11-24 09:03:27 +08:00
|
|
|
select {
|
2017-08-30 14:11:08 +08:00
|
|
|
case canCommit := <-ch:
|
|
|
|
isVacuumSuccess = isVacuumSuccess && canCommit
|
2020-10-20 05:24:57 +08:00
|
|
|
case <-waitTimeout.C:
|
2019-11-20 08:24:58 +08:00
|
|
|
return false
|
2012-11-24 09:03:27 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return isVacuumSuccess
|
|
|
|
}
|
2021-02-23 04:52:37 +08:00
|
|
|
func (t *Topology) batchVacuumVolumeCommit(grpcDialOption grpc.DialOption, vl *VolumeLayout, vid needle.VolumeId, locationlist *VolumeLocationList) bool {
|
2012-11-24 09:03:27 +08:00
|
|
|
isCommitSuccess := true
|
2020-03-18 00:43:57 +08:00
|
|
|
isReadOnly := false
|
2012-11-24 09:03:27 +08:00
|
|
|
for _, dn := range locationlist.list {
|
2019-02-06 21:59:15 +08:00
|
|
|
glog.V(0).Infoln("Start Committing vacuum", vid, "on", dn.Url())
|
2021-12-26 16:15:03 +08:00
|
|
|
err := operation.WithVolumeServerClient(true, dn.ServerAddress(), grpcDialOption, func(volumeServerClient volume_server_pb.VolumeServerClient) error {
|
2020-03-18 00:43:57 +08:00
|
|
|
resp, err := volumeServerClient.VacuumVolumeCommit(context.Background(), &volume_server_pb.VacuumVolumeCommitRequest{
|
2019-03-24 02:33:34 +08:00
|
|
|
VolumeId: uint32(vid),
|
2018-10-15 14:12:43 +08:00
|
|
|
})
|
2020-12-02 16:09:19 +08:00
|
|
|
if resp != nil && resp.IsReadOnly {
|
2020-03-18 00:43:57 +08:00
|
|
|
isReadOnly = true
|
|
|
|
}
|
2018-10-15 14:12:43 +08:00
|
|
|
return err
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("Error when committing vacuum %d on %s: %v", vid, dn.Url(), err)
|
2012-11-24 09:03:27 +08:00
|
|
|
isCommitSuccess = false
|
|
|
|
} else {
|
2019-02-06 21:59:15 +08:00
|
|
|
glog.V(0).Infof("Complete Committing vacuum %d on %s", vid, dn.Url())
|
2012-11-24 09:03:27 +08:00
|
|
|
}
|
2020-03-14 06:41:24 +08:00
|
|
|
}
|
|
|
|
if isCommitSuccess {
|
|
|
|
for _, dn := range locationlist.list {
|
2020-03-18 00:43:57 +08:00
|
|
|
vl.SetVolumeAvailable(dn, vid, isReadOnly)
|
2013-10-16 23:10:48 +08:00
|
|
|
}
|
2012-11-24 09:03:27 +08:00
|
|
|
}
|
|
|
|
return isCommitSuccess
|
|
|
|
}
|
2021-02-23 04:52:37 +08:00
|
|
|
func (t *Topology) batchVacuumVolumeCleanup(grpcDialOption grpc.DialOption, vl *VolumeLayout, vid needle.VolumeId, locationlist *VolumeLocationList) {
|
2017-08-30 14:59:53 +08:00
|
|
|
for _, dn := range locationlist.list {
|
|
|
|
glog.V(0).Infoln("Start cleaning up", vid, "on", dn.Url())
|
2021-12-26 16:15:03 +08:00
|
|
|
err := operation.WithVolumeServerClient(true, dn.ServerAddress(), grpcDialOption, func(volumeServerClient volume_server_pb.VolumeServerClient) error {
|
2020-02-26 13:50:12 +08:00
|
|
|
_, err := volumeServerClient.VacuumVolumeCleanup(context.Background(), &volume_server_pb.VacuumVolumeCleanupRequest{
|
2019-03-24 02:33:34 +08:00
|
|
|
VolumeId: uint32(vid),
|
2018-10-15 14:12:43 +08:00
|
|
|
})
|
|
|
|
return err
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
glog.Errorf("Error when cleaning up vacuum %d on %s: %v", vid, dn.Url(), err)
|
2017-08-30 14:59:53 +08:00
|
|
|
} else {
|
2018-10-15 14:12:43 +08:00
|
|
|
glog.V(0).Infof("Complete cleaning up vacuum %d on %s", vid, dn.Url())
|
2017-08-30 14:59:53 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-11-29 15:18:02 +08:00
|
|
|
func (t *Topology) Vacuum(grpcDialOption grpc.DialOption, garbageThreshold float64, preallocate int64) {
|
2019-07-22 12:49:10 +08:00
|
|
|
|
|
|
|
// if there is vacuum going on, return immediately
|
|
|
|
swapped := atomic.CompareAndSwapInt64(&t.vacuumLockCounter, 0, 1)
|
|
|
|
if !swapped {
|
2020-11-29 15:18:02 +08:00
|
|
|
return
|
2019-07-22 12:49:10 +08:00
|
|
|
}
|
|
|
|
defer atomic.StoreInt64(&t.vacuumLockCounter, 0)
|
|
|
|
|
|
|
|
// now only one vacuum process going on
|
|
|
|
|
2018-12-31 16:06:52 +08:00
|
|
|
glog.V(1).Infof("Start vacuum on demand with threshold: %f", garbageThreshold)
|
2016-05-31 03:30:26 +08:00
|
|
|
for _, col := range t.collectionMap.Items() {
|
2014-12-09 12:29:25 +08:00
|
|
|
c := col.(*Collection)
|
2016-05-31 03:30:26 +08:00
|
|
|
for _, vl := range c.storageType2VolumeLayout.Items() {
|
2013-11-12 18:21:22 +08:00
|
|
|
if vl != nil {
|
2014-12-09 12:29:25 +08:00
|
|
|
volumeLayout := vl.(*VolumeLayout)
|
2021-02-23 04:52:37 +08:00
|
|
|
t.vacuumOneVolumeLayout(grpcDialOption, volumeLayout, c, garbageThreshold, preallocate)
|
2018-10-19 11:34:43 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-02-23 04:52:37 +08:00
|
|
|
func (t *Topology) vacuumOneVolumeLayout(grpcDialOption grpc.DialOption, volumeLayout *VolumeLayout, c *Collection, garbageThreshold float64, preallocate int64) {
|
2017-05-23 08:05:27 +08:00
|
|
|
|
2018-10-19 11:34:43 +08:00
|
|
|
volumeLayout.accessLock.RLock()
|
2019-04-19 12:43:36 +08:00
|
|
|
tmpMap := make(map[needle.VolumeId]*VolumeLocationList)
|
2019-01-17 09:17:19 +08:00
|
|
|
for vid, locationList := range volumeLayout.vid2location {
|
2020-09-23 20:56:51 +08:00
|
|
|
tmpMap[vid] = locationList.Copy()
|
2018-10-19 11:34:43 +08:00
|
|
|
}
|
|
|
|
volumeLayout.accessLock.RUnlock()
|
2017-05-23 08:05:27 +08:00
|
|
|
|
2019-01-17 09:17:19 +08:00
|
|
|
for vid, locationList := range tmpMap {
|
2017-05-23 08:05:27 +08:00
|
|
|
|
2018-10-19 11:34:43 +08:00
|
|
|
volumeLayout.accessLock.RLock()
|
2020-09-22 21:31:14 +08:00
|
|
|
isReadOnly := volumeLayout.readonlyVolumes.IsTrue(vid)
|
2018-10-19 11:34:43 +08:00
|
|
|
volumeLayout.accessLock.RUnlock()
|
|
|
|
|
2020-09-22 21:31:14 +08:00
|
|
|
if isReadOnly {
|
2018-10-19 11:34:43 +08:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2018-12-31 16:06:52 +08:00
|
|
|
glog.V(2).Infof("check vacuum on collection:%s volume:%d", c.Name, vid)
|
2021-02-23 04:52:37 +08:00
|
|
|
if vacuumLocationList, needVacuum := t.batchVacuumVolumeCheck(grpcDialOption, vid, locationList, garbageThreshold); needVacuum {
|
|
|
|
if t.batchVacuumVolumeCompact(grpcDialOption, volumeLayout, vid, vacuumLocationList, preallocate) {
|
|
|
|
t.batchVacuumVolumeCommit(grpcDialOption, volumeLayout, vid, vacuumLocationList)
|
2018-10-24 15:00:01 +08:00
|
|
|
} else {
|
2021-02-23 04:52:37 +08:00
|
|
|
t.batchVacuumVolumeCleanup(grpcDialOption, volumeLayout, vid, vacuumLocationList)
|
2012-11-07 17:51:43 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|