mirror of
https://github.com/seaweedfs/seaweedfs.git
synced 2025-01-22 09:25:48 +08:00
198 lines
5.5 KiB
Go
198 lines
5.5 KiB
Go
package main
|
|
|
|
import (
|
|
"archive/tar"
|
|
"bytes"
|
|
"fmt"
|
|
"os"
|
|
"path"
|
|
"strconv"
|
|
"strings"
|
|
"text/template"
|
|
"time"
|
|
|
|
"github.com/chrislusf/seaweedfs/go/glog"
|
|
"github.com/chrislusf/seaweedfs/go/storage"
|
|
)
|
|
|
|
func init() {
|
|
cmdExport.Run = runExport // break init cycle
|
|
}
|
|
|
|
const (
|
|
defaultFnFormat = `{{.Mime}}/{{.Id}}:{{.Name}}`
|
|
timeFormat = "2006-01-02T15:04:05"
|
|
)
|
|
|
|
var cmdExport = &Command{
|
|
UsageLine: "export -dir=/tmp -volumeId=234 -o=/dir/name.tar -fileNameFormat={{.Name}} -newer='" + timeFormat + "'",
|
|
Short: "list or export files from one volume data file",
|
|
Long: `List all files in a volume, or Export all files in a volume to a tar file if the output is specified.
|
|
|
|
The format of file name in the tar file can be customized. Default is {{.Mime}}/{{.Id}}:{{.Name}}. Also available is {{.Key}}.
|
|
|
|
`,
|
|
}
|
|
|
|
var (
|
|
exportVolumePath = cmdExport.Flag.String("dir", ".", "input data directory to store volume data files")
|
|
exportCollection = cmdExport.Flag.String("collection", "", "the volume collection name")
|
|
exportVolumeId = cmdExport.Flag.Int("volumeId", -1, "a volume id. The volume .dat and .idx files should already exist in the dir.")
|
|
dest = cmdExport.Flag.String("o", "", "output tar file name, must ends with .tar, or just a \"-\" for stdout")
|
|
format = cmdExport.Flag.String("fileNameFormat", defaultFnFormat, "filename format, default to {{.Mime}}/{{.Id}}:{{.Name}}")
|
|
newer = cmdExport.Flag.String("newer", "", "export only files newer than this time, default is all files. Must be specified in RFC3339 without timezone")
|
|
tarFh *tar.Writer
|
|
tarHeader tar.Header
|
|
fnTmpl *template.Template
|
|
fnTmplBuf = bytes.NewBuffer(nil)
|
|
newerThan time.Time
|
|
newerThanUnix int64 = -1
|
|
localLocation, _ = time.LoadLocation("Local")
|
|
)
|
|
|
|
func runExport(cmd *Command, args []string) bool {
|
|
|
|
var err error
|
|
|
|
if *newer != "" {
|
|
if newerThan, err = time.ParseInLocation(timeFormat, *newer, localLocation); err != nil {
|
|
fmt.Println("cannot parse 'newer' argument: " + err.Error())
|
|
return false
|
|
}
|
|
newerThanUnix = newerThan.Unix()
|
|
}
|
|
|
|
if *exportVolumeId == -1 {
|
|
return false
|
|
}
|
|
|
|
if *dest != "" {
|
|
if *dest != "-" && !strings.HasSuffix(*dest, ".tar") {
|
|
fmt.Println("the output file", *dest, "should be '-' or end with .tar")
|
|
return false
|
|
}
|
|
|
|
if fnTmpl, err = template.New("name").Parse(*format); err != nil {
|
|
fmt.Println("cannot parse format " + *format + ": " + err.Error())
|
|
return false
|
|
}
|
|
|
|
var fh *os.File
|
|
if *dest == "-" {
|
|
fh = os.Stdout
|
|
} else {
|
|
if fh, err = os.Create(*dest); err != nil {
|
|
glog.Fatalf("cannot open output tar %s: %s", *dest, err)
|
|
}
|
|
}
|
|
defer fh.Close()
|
|
tarFh = tar.NewWriter(fh)
|
|
defer tarFh.Close()
|
|
t := time.Now()
|
|
tarHeader = tar.Header{Mode: 0644,
|
|
ModTime: t, Uid: os.Getuid(), Gid: os.Getgid(),
|
|
Typeflag: tar.TypeReg,
|
|
AccessTime: t, ChangeTime: t}
|
|
}
|
|
|
|
fileName := strconv.Itoa(*exportVolumeId)
|
|
if *exportCollection != "" {
|
|
fileName = *exportCollection + "_" + fileName
|
|
}
|
|
vid := storage.VolumeId(*exportVolumeId)
|
|
indexFile, err := os.OpenFile(path.Join(*exportVolumePath, fileName+".idx"), os.O_RDONLY, 0644)
|
|
if err != nil {
|
|
glog.Fatalf("Create Volume Index [ERROR] %s\n", err)
|
|
}
|
|
defer indexFile.Close()
|
|
|
|
nm, err := storage.LoadNeedleMap(indexFile)
|
|
if err != nil {
|
|
glog.Fatalf("cannot load needle map from %s: %s", indexFile.Name(), err)
|
|
}
|
|
|
|
var version storage.Version
|
|
|
|
err = storage.ScanVolumeFile(*exportVolumePath, *exportCollection, vid,
|
|
storage.NeedleMapInMemory,
|
|
func(superBlock storage.SuperBlock) error {
|
|
version = superBlock.Version()
|
|
return nil
|
|
}, true, func(n *storage.Needle, offset int64) error {
|
|
nv, ok := nm.Get(n.Id)
|
|
glog.V(3).Infof("key %d offset %d size %d disk_size %d gzip %v ok %v nv %+v",
|
|
n.Id, offset, n.Size, n.DiskSize(), n.IsGzipped(), ok, nv)
|
|
if ok && nv.Size > 0 && int64(nv.Offset)*8 == offset {
|
|
if newerThanUnix >= 0 && n.HasLastModifiedDate() && n.LastModified < uint64(newerThanUnix) {
|
|
glog.V(3).Infof("Skipping this file, as it's old enough: LastModified %d vs %d",
|
|
n.LastModified, newerThanUnix)
|
|
return nil
|
|
}
|
|
return walker(vid, n, version)
|
|
}
|
|
if !ok {
|
|
glog.V(2).Infof("This seems deleted %d size %d", n.Id, n.Size)
|
|
} else {
|
|
glog.V(2).Infof("Skipping later-updated Id %d size %d", n.Id, n.Size)
|
|
}
|
|
return nil
|
|
})
|
|
if err != nil {
|
|
glog.Fatalf("Export Volume File [ERROR] %s\n", err)
|
|
}
|
|
return true
|
|
}
|
|
|
|
type nameParams struct {
|
|
Name string
|
|
Id uint64
|
|
Mime string
|
|
Key string
|
|
}
|
|
|
|
func walker(vid storage.VolumeId, n *storage.Needle, version storage.Version) (err error) {
|
|
key := storage.NewFileIdFromNeedle(vid, n).String()
|
|
if tarFh != nil {
|
|
fnTmplBuf.Reset()
|
|
if err = fnTmpl.Execute(fnTmplBuf,
|
|
nameParams{Name: string(n.Name),
|
|
Id: n.Id,
|
|
Mime: string(n.Mime),
|
|
Key: key,
|
|
},
|
|
); err != nil {
|
|
return err
|
|
}
|
|
nm := fnTmplBuf.String()
|
|
|
|
if n.IsGzipped() && path.Ext(nm) != ".gz" {
|
|
nm = nm + ".gz"
|
|
}
|
|
|
|
tarHeader.Name, tarHeader.Size = nm, int64(len(n.Data))
|
|
if n.HasLastModifiedDate() {
|
|
tarHeader.ModTime = time.Unix(int64(n.LastModified), 0)
|
|
} else {
|
|
tarHeader.ModTime = time.Unix(0, 0)
|
|
}
|
|
tarHeader.ChangeTime = tarHeader.ModTime
|
|
if err = tarFh.WriteHeader(&tarHeader); err != nil {
|
|
return err
|
|
}
|
|
_, err = tarFh.Write(n.Data)
|
|
} else {
|
|
size := n.DataSize
|
|
if version == storage.Version1 {
|
|
size = n.Size
|
|
}
|
|
fmt.Printf("key=%s Name=%s Size=%d gzip=%t mime=%s\n",
|
|
key,
|
|
n.Name,
|
|
size,
|
|
n.IsGzipped(),
|
|
n.Mime,
|
|
)
|
|
}
|
|
return
|
|
}
|