2012-08-24 13:33:37 +08:00
|
|
|
package topology
|
|
|
|
|
|
|
|
import (
|
2014-10-27 02:34:55 +08:00
|
|
|
"errors"
|
|
|
|
"io/ioutil"
|
|
|
|
"math/rand"
|
|
|
|
|
2015-04-17 03:18:06 +08:00
|
|
|
"github.com/chrislusf/seaweedfs/go/glog"
|
|
|
|
"github.com/chrislusf/seaweedfs/go/operation"
|
|
|
|
"github.com/chrislusf/seaweedfs/go/sequence"
|
|
|
|
"github.com/chrislusf/seaweedfs/go/storage"
|
|
|
|
"github.com/chrislusf/seaweedfs/go/util"
|
2014-03-16 14:03:49 +08:00
|
|
|
"github.com/goraft/raft"
|
2012-08-24 13:33:37 +08:00
|
|
|
)
|
|
|
|
|
|
|
|
type Topology struct {
|
2012-09-03 05:33:48 +08:00
|
|
|
NodeImpl
|
2012-09-10 15:18:07 +08:00
|
|
|
|
2014-12-09 12:29:25 +08:00
|
|
|
collectionMap *util.ConcurrentReadMap
|
2012-09-10 15:18:07 +08:00
|
|
|
|
|
|
|
pulse int64
|
|
|
|
|
|
|
|
volumeSizeLimit uint64
|
|
|
|
|
2014-04-17 14:43:27 +08:00
|
|
|
Sequence sequence.Sequencer
|
2012-09-19 05:05:12 +08:00
|
|
|
|
|
|
|
chanDeadDataNodes chan *DataNode
|
|
|
|
chanRecoveredDataNodes chan *DataNode
|
2012-12-04 12:28:12 +08:00
|
|
|
chanFullVolumes chan storage.VolumeInfo
|
2012-09-24 17:01:53 +08:00
|
|
|
|
2012-09-23 11:46:31 +08:00
|
|
|
configuration *Configuration
|
2014-03-16 14:03:49 +08:00
|
|
|
|
|
|
|
RaftServer raft.Server
|
2012-08-31 16:35:11 +08:00
|
|
|
}
|
2012-08-28 16:04:39 +08:00
|
|
|
|
2013-11-10 17:31:50 +08:00
|
|
|
func NewTopology(id string, confFile string, seq sequence.Sequencer, volumeSizeLimit uint64, pulse int) (*Topology, error) {
|
2012-09-03 05:33:48 +08:00
|
|
|
t := &Topology{}
|
|
|
|
t.id = NodeId(id)
|
|
|
|
t.nodeType = "Topology"
|
2012-09-19 16:45:30 +08:00
|
|
|
t.NodeImpl.value = t
|
2012-09-03 05:33:48 +08:00
|
|
|
t.children = make(map[NodeId]Node)
|
2014-12-09 12:29:25 +08:00
|
|
|
t.collectionMap = util.NewConcurrentReadMap()
|
2012-09-10 15:18:07 +08:00
|
|
|
t.pulse = int64(pulse)
|
|
|
|
t.volumeSizeLimit = volumeSizeLimit
|
2012-09-19 16:45:30 +08:00
|
|
|
|
2014-04-17 14:43:27 +08:00
|
|
|
t.Sequence = seq
|
2012-09-19 16:45:30 +08:00
|
|
|
|
2012-09-19 05:05:12 +08:00
|
|
|
t.chanDeadDataNodes = make(chan *DataNode)
|
|
|
|
t.chanRecoveredDataNodes = make(chan *DataNode)
|
2012-12-04 12:28:12 +08:00
|
|
|
t.chanFullVolumes = make(chan storage.VolumeInfo)
|
2012-09-19 16:45:30 +08:00
|
|
|
|
2013-02-27 14:54:22 +08:00
|
|
|
err := t.loadConfiguration(confFile)
|
2012-09-24 17:01:53 +08:00
|
|
|
|
2013-02-27 14:54:22 +08:00
|
|
|
return t, err
|
2012-09-03 05:33:48 +08:00
|
|
|
}
|
2012-09-17 08:31:15 +08:00
|
|
|
|
2014-03-16 14:03:49 +08:00
|
|
|
func (t *Topology) IsLeader() bool {
|
2014-04-12 07:23:58 +08:00
|
|
|
if leader, e := t.Leader(); e == nil {
|
|
|
|
return leader == t.RaftServer.Name()
|
|
|
|
}
|
|
|
|
return false
|
2014-03-16 14:03:49 +08:00
|
|
|
}
|
|
|
|
|
2014-04-12 07:23:58 +08:00
|
|
|
func (t *Topology) Leader() (string, error) {
|
2014-03-16 14:03:49 +08:00
|
|
|
l := ""
|
|
|
|
if t.RaftServer != nil {
|
|
|
|
l = t.RaftServer.Leader()
|
2014-04-12 07:23:58 +08:00
|
|
|
} else {
|
|
|
|
return "", errors.New("Raft Server not ready yet!")
|
2014-03-16 14:03:49 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if l == "" {
|
|
|
|
// We are a single node cluster, we are the leader
|
2014-04-12 07:23:58 +08:00
|
|
|
return t.RaftServer.Name(), errors.New("Raft Server not initialized!")
|
2014-03-16 14:03:49 +08:00
|
|
|
}
|
|
|
|
|
2014-04-12 07:23:58 +08:00
|
|
|
return l, nil
|
2014-03-16 14:03:49 +08:00
|
|
|
}
|
|
|
|
|
2012-09-24 17:01:53 +08:00
|
|
|
func (t *Topology) loadConfiguration(configurationFile string) error {
|
|
|
|
b, e := ioutil.ReadFile(configurationFile)
|
|
|
|
if e == nil {
|
|
|
|
t.configuration, e = NewConfiguration(b)
|
2013-03-20 01:33:33 +08:00
|
|
|
return e
|
2012-09-24 17:01:53 +08:00
|
|
|
}
|
2015-03-10 15:20:31 +08:00
|
|
|
glog.V(0).Infoln("Using default configurations.")
|
2013-03-20 01:33:33 +08:00
|
|
|
return nil
|
2012-09-23 11:46:31 +08:00
|
|
|
}
|
|
|
|
|
2013-11-12 18:21:22 +08:00
|
|
|
func (t *Topology) Lookup(collection string, vid storage.VolumeId) []*DataNode {
|
|
|
|
//maybe an issue if lots of collections?
|
|
|
|
if collection == "" {
|
2014-12-09 12:29:25 +08:00
|
|
|
for _, c := range t.collectionMap.Items {
|
|
|
|
if list := c.(*Collection).Lookup(vid); list != nil {
|
2012-09-24 17:01:53 +08:00
|
|
|
return list
|
|
|
|
}
|
|
|
|
}
|
2013-11-12 18:21:22 +08:00
|
|
|
} else {
|
2014-12-09 12:29:25 +08:00
|
|
|
if c, ok := t.collectionMap.Items[collection]; ok {
|
|
|
|
return c.(*Collection).Lookup(vid)
|
2013-11-12 18:21:22 +08:00
|
|
|
}
|
2012-09-24 17:01:53 +08:00
|
|
|
}
|
|
|
|
return nil
|
2012-09-24 06:45:26 +08:00
|
|
|
}
|
|
|
|
|
2012-09-03 16:50:04 +08:00
|
|
|
func (t *Topology) NextVolumeId() storage.VolumeId {
|
2012-09-03 05:33:48 +08:00
|
|
|
vid := t.GetMaxVolumeId()
|
2014-03-16 14:03:49 +08:00
|
|
|
next := vid.Next()
|
|
|
|
go t.RaftServer.Do(NewMaxVolumeIdCommand(next))
|
|
|
|
return next
|
2012-08-28 16:04:39 +08:00
|
|
|
}
|
2012-09-10 15:18:07 +08:00
|
|
|
|
2014-10-26 14:45:31 +08:00
|
|
|
func (t *Topology) HasWritableVolume(option *VolumeGrowOption) bool {
|
2014-09-21 03:38:59 +08:00
|
|
|
vl := t.GetVolumeLayout(option.Collection, option.ReplicaPlacement, option.Ttl)
|
2014-04-13 16:29:52 +08:00
|
|
|
return vl.GetActiveVolumeCount(option) > 0
|
|
|
|
}
|
|
|
|
|
2015-04-07 05:17:36 +08:00
|
|
|
func (t *Topology) PickForWrite(count uint64, option *VolumeGrowOption) (string, uint64, *DataNode, error) {
|
2014-09-21 03:38:59 +08:00
|
|
|
vid, count, datanodes, err := t.GetVolumeLayout(option.Collection, option.ReplicaPlacement, option.Ttl).PickForWrite(count, option)
|
2013-03-20 20:12:55 +08:00
|
|
|
if err != nil || datanodes.Length() == 0 {
|
2015-01-13 18:46:56 +08:00
|
|
|
return "", 0, nil, errors.New("No writable volumes available!")
|
2012-09-17 08:31:15 +08:00
|
|
|
}
|
2014-04-17 14:43:27 +08:00
|
|
|
fileId, count := t.Sequence.NextFileId(count)
|
2013-04-16 15:10:21 +08:00
|
|
|
return storage.NewFileId(*vid, fileId, rand.Uint32()).String(), count, datanodes.Head(), nil
|
2012-09-17 08:31:15 +08:00
|
|
|
}
|
|
|
|
|
2014-09-21 03:38:59 +08:00
|
|
|
func (t *Topology) GetVolumeLayout(collectionName string, rp *storage.ReplicaPlacement, ttl *storage.TTL) *VolumeLayout {
|
2014-12-09 12:29:25 +08:00
|
|
|
return t.collectionMap.Get(collectionName, func() interface{} {
|
|
|
|
return NewCollection(collectionName, t.volumeSizeLimit)
|
|
|
|
}).(*Collection).GetOrCreateVolumeLayout(rp, ttl)
|
2012-09-14 16:17:13 +08:00
|
|
|
}
|
|
|
|
|
2014-12-09 12:29:25 +08:00
|
|
|
func (t *Topology) GetCollection(collectionName string) (*Collection, bool) {
|
|
|
|
c, hasCollection := t.collectionMap.Items[collectionName]
|
|
|
|
return c.(*Collection), hasCollection
|
2014-03-11 02:43:54 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
func (t *Topology) DeleteCollection(collectionName string) {
|
2014-12-09 12:29:25 +08:00
|
|
|
delete(t.collectionMap.Items, collectionName)
|
2014-03-11 02:43:54 +08:00
|
|
|
}
|
|
|
|
|
2014-03-19 19:48:13 +08:00
|
|
|
func (t *Topology) RegisterVolumeLayout(v storage.VolumeInfo, dn *DataNode) {
|
2014-09-21 03:38:59 +08:00
|
|
|
t.GetVolumeLayout(v.Collection, v.ReplicaPlacement, v.Ttl).RegisterVolume(&v, dn)
|
|
|
|
}
|
|
|
|
func (t *Topology) UnRegisterVolumeLayout(v storage.VolumeInfo, dn *DataNode) {
|
|
|
|
glog.Infof("removing volume info:%+v", v)
|
|
|
|
t.GetVolumeLayout(v.Collection, v.ReplicaPlacement, v.Ttl).UnRegisterVolume(&v, dn)
|
2012-09-17 08:31:15 +08:00
|
|
|
}
|
|
|
|
|
2014-09-21 03:38:59 +08:00
|
|
|
func (t *Topology) ProcessJoinMessage(joinMessage *operation.JoinMessage) {
|
2014-04-21 17:11:10 +08:00
|
|
|
t.Sequence.SetMax(*joinMessage.MaxFileKey)
|
|
|
|
dcName, rackName := t.configuration.Locate(*joinMessage.Ip, *joinMessage.DataCenter, *joinMessage.Rack)
|
2012-09-23 11:46:31 +08:00
|
|
|
dc := t.GetOrCreateDataCenter(dcName)
|
|
|
|
rack := dc.GetOrCreateRack(rackName)
|
2014-04-21 17:11:10 +08:00
|
|
|
dn := rack.FindDataNode(*joinMessage.Ip, int(*joinMessage.Port))
|
|
|
|
if *joinMessage.IsInit && dn != nil {
|
2012-12-23 08:26:02 +08:00
|
|
|
t.UnRegisterDataNode(dn)
|
|
|
|
}
|
2015-01-19 09:03:38 +08:00
|
|
|
dn = rack.GetOrCreateDataNode(*joinMessage.Ip,
|
2015-03-09 16:10:01 +08:00
|
|
|
int(*joinMessage.Port), *joinMessage.PublicUrl,
|
2015-01-19 09:03:38 +08:00
|
|
|
int(*joinMessage.MaxVolumeCount))
|
2014-04-21 17:11:10 +08:00
|
|
|
var volumeInfos []storage.VolumeInfo
|
|
|
|
for _, v := range joinMessage.Volumes {
|
|
|
|
if vi, err := storage.NewVolumeInfo(v); err == nil {
|
|
|
|
volumeInfos = append(volumeInfos, vi)
|
|
|
|
} else {
|
|
|
|
glog.V(0).Infoln("Fail to convert joined volume information:", err.Error())
|
|
|
|
}
|
|
|
|
}
|
2014-09-21 03:38:59 +08:00
|
|
|
deletedVolumes := dn.UpdateVolumes(volumeInfos)
|
2012-09-17 08:31:15 +08:00
|
|
|
for _, v := range volumeInfos {
|
2014-03-19 19:48:13 +08:00
|
|
|
t.RegisterVolumeLayout(v, dn)
|
2012-09-17 08:31:15 +08:00
|
|
|
}
|
2014-09-21 03:38:59 +08:00
|
|
|
for _, v := range deletedVolumes {
|
|
|
|
t.UnRegisterVolumeLayout(v, dn)
|
|
|
|
}
|
2012-09-14 16:17:13 +08:00
|
|
|
}
|
|
|
|
|
2012-09-23 11:46:31 +08:00
|
|
|
func (t *Topology) GetOrCreateDataCenter(dcName string) *DataCenter {
|
2012-09-17 08:31:15 +08:00
|
|
|
for _, c := range t.Children() {
|
|
|
|
dc := c.(*DataCenter)
|
2012-09-23 11:46:31 +08:00
|
|
|
if string(dc.Id()) == dcName {
|
2012-09-17 08:31:15 +08:00
|
|
|
return dc
|
|
|
|
}
|
|
|
|
}
|
2012-09-23 11:46:31 +08:00
|
|
|
dc := NewDataCenter(dcName)
|
2012-09-17 08:31:15 +08:00
|
|
|
t.LinkChildNode(dc)
|
|
|
|
return dc
|
|
|
|
}
|