Add boltdb for volume needle map
boltdb is fairly slow to write: recreating the index for 1,553,934 files
takes about 6 minutes. Boltdb loads 1,553,934 x 16 = 24,862,944 bytes from
disk and generates a boltdb file as large as 134,217,728 bytes in those 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index is
created and the server is restarted. The benchmark tool is then used to read
lots of files. There are 7 volumes in the benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
package storage
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
"os"
|
|
|
|
|
|
|
|
"github.com/boltdb/bolt"
|
2016-04-10 15:24:22 +08:00
|
|
|
|
2016-06-03 09:09:14 +08:00
|
|
|
"github.com/chrislusf/seaweedfs/weed/glog"
|
|
|
|
"github.com/chrislusf/seaweedfs/weed/util"
|
Add boltdb for volume needle map
boltdb is fairly slow to write, about 6 minutes for recreating index
for 1553934 files. Boltdb loads 1,553,934 x 16 = 24,862,944bytes from
disk, and generate the boltdb as large as 134,217,728 bytes in 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index are
created. And the server is restarted. Using the benchmark tool to read
lots of files. There are 7 volumes in benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
)
|
|
|
|
|
|
|
|
type BoltDbNeedleMap struct {
|
|
|
|
dbFileName string
|
|
|
|
db *bolt.DB
|
2015-05-26 15:58:41 +08:00
|
|
|
baseNeedleMapper
|
Add boltdb for volume needle map
boltdb is fairly slow to write, about 6 minutes for recreating index
for 1553934 files. Boltdb loads 1,553,934 x 16 = 24,862,944bytes from
disk, and generate the boltdb as large as 134,217,728 bytes in 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index are
created. And the server is restarted. Using the benchmark tool to read
lots of files. There are 7 volumes in benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// boltdbBucket is the name of the BoltDB bucket that the read, write and
// delete helpers in this file operate on.
var boltdbBucket = []byte("weed")
|
|
|
|
|
|
|
|
func NewBoltDbNeedleMap(dbFileName string, indexFile *os.File) (m *BoltDbNeedleMap, err error) {
|
2015-05-26 15:58:41 +08:00
|
|
|
m = &BoltDbNeedleMap{dbFileName: dbFileName}
|
|
|
|
m.indexFile = indexFile
|
Add boltdb for volume needle map
boltdb is fairly slow to write, about 6 minutes for recreating index
for 1553934 files. Boltdb loads 1,553,934 x 16 = 24,862,944bytes from
disk, and generate the boltdb as large as 134,217,728 bytes in 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index are
created. And the server is restarted. Using the benchmark tool to read
lots of files. There are 7 volumes in benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
if !isBoltDbFresh(dbFileName, indexFile) {
|
|
|
|
glog.V(1).Infof("Start to Generate %s from %s", dbFileName, indexFile.Name())
|
|
|
|
generateBoltDbFile(dbFileName, indexFile)
|
|
|
|
glog.V(1).Infof("Finished Generating %s from %s", dbFileName, indexFile.Name())
|
|
|
|
}
|
|
|
|
glog.V(1).Infof("Opening %s...", dbFileName)
|
|
|
|
if m.db, err = bolt.Open(dbFileName, 0644, nil); err != nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
glog.V(1).Infof("Loading %s...", indexFile.Name())
|
|
|
|
nm, indexLoadError := LoadNeedleMap(indexFile)
|
|
|
|
if indexLoadError != nil {
|
|
|
|
return nil, indexLoadError
|
|
|
|
}
|
|
|
|
m.mapMetric = nm.mapMetric
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
func isBoltDbFresh(dbFileName string, indexFile *os.File) bool {
|
|
|
|
// normally we always write to index file first
|
|
|
|
dbLogFile, err := os.Open(dbFileName)
|
|
|
|
if err != nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
defer dbLogFile.Close()
|
|
|
|
dbStat, dbStatErr := dbLogFile.Stat()
|
|
|
|
indexStat, indexStatErr := indexFile.Stat()
|
|
|
|
if dbStatErr != nil || indexStatErr != nil {
|
|
|
|
glog.V(0).Infof("Can not stat file: %v and %v", dbStatErr, indexStatErr)
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
return dbStat.ModTime().After(indexStat.ModTime())
|
|
|
|
}
|
|
|
|
|
|
|
|
func generateBoltDbFile(dbFileName string, indexFile *os.File) error {
|
|
|
|
db, err := bolt.Open(dbFileName, 0644, nil)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer db.Close()
|
|
|
|
return WalkIndexFile(indexFile, func(key uint64, offset, size uint32) error {
|
|
|
|
if offset > 0 {
|
|
|
|
boltDbWrite(db, key, offset, size)
|
|
|
|
} else {
|
|
|
|
boltDbDelete(db, key)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *BoltDbNeedleMap) Get(key uint64) (element *NeedleValue, ok bool) {
|
|
|
|
bytes := make([]byte, 8)
|
|
|
|
var data []byte
|
2016-04-10 15:24:22 +08:00
|
|
|
util.Uint64toBytes(bytes, key)
|
Add boltdb for volume needle map
boltdb is fairly slow to write, about 6 minutes for recreating index
for 1553934 files. Boltdb loads 1,553,934 x 16 = 24,862,944bytes from
disk, and generate the boltdb as large as 134,217,728 bytes in 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index are
created. And the server is restarted. Using the benchmark tool to read
lots of files. There are 7 volumes in benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
err := m.db.View(func(tx *bolt.Tx) error {
|
|
|
|
bucket := tx.Bucket(boltdbBucket)
|
|
|
|
if bucket == nil {
|
|
|
|
return fmt.Errorf("Bucket %q not found!", boltdbBucket)
|
|
|
|
}
|
|
|
|
|
|
|
|
data = bucket.Get(bytes)
|
|
|
|
return nil
|
|
|
|
})
|
|
|
|
|
|
|
|
if err != nil || len(data) != 8 {
|
|
|
|
return nil, false
|
|
|
|
}
|
2016-04-10 15:24:22 +08:00
|
|
|
offset := util.BytesToUint32(data[0:4])
|
|
|
|
size := util.BytesToUint32(data[4:8])
|
Add boltdb for volume needle map
boltdb is fairly slow to write, about 6 minutes for recreating index
for 1553934 files. Boltdb loads 1,553,934 x 16 = 24,862,944bytes from
disk, and generate the boltdb as large as 134,217,728 bytes in 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index are
created. And the server is restarted. Using the benchmark tool to read
lots of files. There are 7 volumes in benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
return &NeedleValue{Key: Key(key), Offset: offset, Size: size}, true
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *BoltDbNeedleMap) Put(key uint64, offset uint32, size uint32) error {
|
|
|
|
var oldSize uint32
|
|
|
|
if oldNeedle, ok := m.Get(key); ok {
|
|
|
|
oldSize = oldNeedle.Size
|
|
|
|
}
|
|
|
|
m.logPut(key, oldSize, size)
|
|
|
|
// write to index file first
|
2015-05-26 15:58:41 +08:00
|
|
|
if err := m.appendToIndexFile(key, offset, size); err != nil {
|
Add boltdb for volume needle map
boltdb is fairly slow to write, about 6 minutes for recreating index
for 1553934 files. Boltdb loads 1,553,934 x 16 = 24,862,944bytes from
disk, and generate the boltdb as large as 134,217,728 bytes in 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index are
created. And the server is restarted. Using the benchmark tool to read
lots of files. There are 7 volumes in benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
return fmt.Errorf("cannot write to indexfile %s: %v", m.indexFile.Name(), err)
|
|
|
|
}
|
|
|
|
return boltDbWrite(m.db, key, offset, size)
|
|
|
|
}
|
|
|
|
|
|
|
|
func boltDbWrite(db *bolt.DB,
|
|
|
|
key uint64, offset uint32, size uint32) error {
|
|
|
|
bytes := make([]byte, 16)
|
2016-04-10 15:24:22 +08:00
|
|
|
util.Uint64toBytes(bytes[0:8], key)
|
|
|
|
util.Uint32toBytes(bytes[8:12], offset)
|
|
|
|
util.Uint32toBytes(bytes[12:16], size)
|
Add boltdb for volume needle map
boltdb is fairly slow to write, about 6 minutes for recreating index
for 1553934 files. Boltdb loads 1,553,934 x 16 = 24,862,944bytes from
disk, and generate the boltdb as large as 134,217,728 bytes in 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index are
created. And the server is restarted. Using the benchmark tool to read
lots of files. There are 7 volumes in benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
return db.Update(func(tx *bolt.Tx) error {
|
|
|
|
bucket, err := tx.CreateBucketIfNotExists(boltdbBucket)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
err = bucket.Put(bytes[0:8], bytes[8:16])
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
|
|
|
}
|
|
|
|
func boltDbDelete(db *bolt.DB, key uint64) error {
|
|
|
|
bytes := make([]byte, 8)
|
2016-04-10 15:24:22 +08:00
|
|
|
util.Uint64toBytes(bytes, key)
|
Add boltdb for volume needle map
boltdb is fairly slow to write, about 6 minutes for recreating index
for 1553934 files. Boltdb loads 1,553,934 x 16 = 24,862,944bytes from
disk, and generate the boltdb as large as 134,217,728 bytes in 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index are
created. And the server is restarted. Using the benchmark tool to read
lots of files. There are 7 volumes in benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
return db.Update(func(tx *bolt.Tx) error {
|
|
|
|
bucket, err := tx.CreateBucketIfNotExists(boltdbBucket)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
err = bucket.Delete(bytes)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *BoltDbNeedleMap) Delete(key uint64) error {
|
|
|
|
if oldNeedle, ok := m.Get(key); ok {
|
|
|
|
m.logDelete(oldNeedle.Size)
|
|
|
|
}
|
|
|
|
// write to index file first
|
2015-05-26 15:58:41 +08:00
|
|
|
if err := m.appendToIndexFile(key, 0, 0); err != nil {
|
Add boltdb for volume needle map
boltdb is fairly slow to write, about 6 minutes for recreating index
for 1553934 files. Boltdb loads 1,553,934 x 16 = 24,862,944bytes from
disk, and generate the boltdb as large as 134,217,728 bytes in 6
minutes.
To compare, for leveldb, it recreates index in leveldb as large as
27,188,148 bytes in 8 seconds.
For in memory version, it loads the index in
To test the memory consumption, the leveldb or boltdb index are
created. And the server is restarted. Using the benchmark tool to read
lots of files. There are 7 volumes in benchmark collection, each with
about 1553K files.
For leveldb, the memory starts at 142,884KB, and stays at 179,340KB.
For boltdb, the memory starts at 73,756KB, and stays at 144,564KB.
For in-memory, the memory starts at 368,152KB, and stays at 448,032KB.
2015-03-30 02:04:32 +08:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
return boltDbDelete(m.db, key)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *BoltDbNeedleMap) Close() {
|
|
|
|
m.db.Close()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *BoltDbNeedleMap) Destroy() error {
|
|
|
|
m.Close()
|
|
|
|
os.Remove(m.indexFile.Name())
|
|
|
|
return os.Remove(m.dbFileName)
|
|
|
|
}
|