2019-04-19 12:43:36 +08:00
|
|
|
package util
|
2012-07-30 16:36:25 +08:00
|
|
|
|
|
|
|
import (
|
2012-12-23 05:15:09 +08:00
|
|
|
"bytes"
|
2020-06-20 23:01:00 +08:00
|
|
|
"fmt"
|
2012-12-23 05:15:09 +08:00
|
|
|
"strings"
|
2014-10-27 02:34:55 +08:00
|
|
|
|
2022-07-29 15:17:28 +08:00
|
|
|
"github.com/seaweedfs/seaweedfs/weed/glog"
|
2020-11-22 05:06:35 +08:00
|
|
|
// "github.com/klauspost/compress/zstd"
|
2012-07-30 16:36:25 +08:00
|
|
|
)
|
|
|
|
|
2020-09-12 19:08:03 +08:00
|
|
|
var (
|
2020-09-04 02:00:20 +08:00
|
|
|
UnsupportedCompression = fmt.Errorf("unsupported compression")
|
|
|
|
)
|
|
|
|
|
2020-09-12 19:08:03 +08:00
|
|
|
func MaybeGzipData(input []byte) []byte {
|
2020-09-04 02:00:20 +08:00
|
|
|
if IsGzippedContent(input) {
|
|
|
|
return input
|
|
|
|
}
|
|
|
|
gzipped, err := GzipData(input)
|
|
|
|
if err != nil {
|
|
|
|
return input
|
|
|
|
}
|
2020-09-12 19:08:03 +08:00
|
|
|
if len(gzipped)*10 > len(input)*9 {
|
2020-09-04 02:00:20 +08:00
|
|
|
return input
|
|
|
|
}
|
|
|
|
return gzipped
|
|
|
|
}
|
|
|
|
|
2020-09-12 19:08:03 +08:00
|
|
|
func MaybeDecompressData(input []byte) []byte {
|
2020-09-04 02:00:20 +08:00
|
|
|
uncompressed, err := DecompressData(input)
|
|
|
|
if err != nil {
|
|
|
|
if err != UnsupportedCompression {
|
|
|
|
glog.Errorf("decompressed data: %v", err)
|
|
|
|
}
|
|
|
|
return input
|
|
|
|
}
|
|
|
|
return uncompressed
|
|
|
|
}
|
|
|
|
|
2019-04-19 12:43:36 +08:00
|
|
|
func GzipData(input []byte) ([]byte, error) {
|
2021-08-20 18:36:51 +08:00
|
|
|
w := new(bytes.Buffer)
|
|
|
|
_, err := GzipStream(w, bytes.NewReader(input))
|
|
|
|
if err != nil {
|
2019-04-19 12:43:36 +08:00
|
|
|
return nil, err
|
|
|
|
}
|
2021-08-20 18:36:51 +08:00
|
|
|
return w.Bytes(), nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func ungzipData(input []byte) ([]byte, error) {
|
|
|
|
w := new(bytes.Buffer)
|
|
|
|
_, err := GunzipStream(w, bytes.NewReader(input))
|
|
|
|
if err != nil {
|
2019-04-19 12:43:36 +08:00
|
|
|
return nil, err
|
|
|
|
}
|
2021-08-20 18:36:51 +08:00
|
|
|
return w.Bytes(), nil
|
2019-04-19 12:43:36 +08:00
|
|
|
}
|
2020-06-25 02:39:09 +08:00
|
|
|
|
2020-06-20 23:16:16 +08:00
|
|
|
func DecompressData(input []byte) ([]byte, error) {
|
2020-06-20 13:45:27 +08:00
|
|
|
if IsGzippedContent(input) {
|
|
|
|
return ungzipData(input)
|
|
|
|
}
|
2020-11-22 05:06:35 +08:00
|
|
|
/*
|
2020-11-27 03:22:30 +08:00
|
|
|
if IsZstdContent(input) {
|
|
|
|
return unzstdData(input)
|
|
|
|
}
|
2020-11-22 05:06:35 +08:00
|
|
|
*/
|
2020-09-04 02:00:20 +08:00
|
|
|
return input, UnsupportedCompression
|
2020-06-20 13:45:27 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
func IsGzippedContent(data []byte) bool {
|
|
|
|
if len(data) < 2 {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
return data[0] == 31 && data[1] == 139
|
|
|
|
}
|
|
|
|
|
2020-11-22 05:06:35 +08:00
|
|
|
/*
|
|
|
|
var zstdEncoder, _ = zstd.NewWriter(nil)
|
|
|
|
|
|
|
|
func ZstdData(input []byte) ([]byte, error) {
|
|
|
|
return zstdEncoder.EncodeAll(input, nil), nil
|
|
|
|
}
|
|
|
|
|
|
|
|
var decoder, _ = zstd.NewReader(nil)
|
|
|
|
|
|
|
|
func unzstdData(input []byte) ([]byte, error) {
|
|
|
|
return decoder.DecodeAll(input, nil)
|
|
|
|
}
|
|
|
|
|
2020-06-24 00:12:02 +08:00
|
|
|
func IsZstdContent(data []byte) bool {
|
|
|
|
if len(data) < 4 {
|
|
|
|
return false
|
|
|
|
}
|
2020-06-25 02:39:09 +08:00
|
|
|
return data[3] == 0xFD && data[2] == 0x2F && data[1] == 0xB5 && data[0] == 0x28
|
2020-06-24 00:12:02 +08:00
|
|
|
}
|
2020-11-22 05:06:35 +08:00
|
|
|
*/
|
2020-06-24 00:12:02 +08:00
|
|
|
|
2019-04-07 05:14:28 +08:00
|
|
|
/*
|
2020-06-24 00:12:02 +08:00
|
|
|
* Default not to compressed since compression can be done on client side.
|
|
|
|
*/func IsCompressableFileType(ext, mtype string) (shouldBeCompressed, iAmSure bool) {
|
2019-04-07 05:14:28 +08:00
|
|
|
|
2018-12-23 07:05:31 +08:00
|
|
|
// text
|
2013-01-17 16:56:56 +08:00
|
|
|
if strings.HasPrefix(mtype, "text/") {
|
2019-04-07 05:14:28 +08:00
|
|
|
return true, true
|
2013-01-17 16:15:09 +08:00
|
|
|
}
|
2018-12-23 07:05:31 +08:00
|
|
|
|
|
|
|
// images
|
|
|
|
switch ext {
|
2020-01-30 12:51:58 +08:00
|
|
|
case ".svg", ".bmp", ".wav":
|
2019-04-07 05:14:28 +08:00
|
|
|
return true, true
|
2018-12-23 07:05:31 +08:00
|
|
|
}
|
|
|
|
if strings.HasPrefix(mtype, "image/") {
|
2019-04-07 05:14:28 +08:00
|
|
|
return false, true
|
2018-12-23 07:05:31 +08:00
|
|
|
}
|
|
|
|
|
2019-02-06 21:59:15 +08:00
|
|
|
// by file name extension
|
2013-01-17 16:56:56 +08:00
|
|
|
switch ext {
|
2021-04-28 16:51:49 +08:00
|
|
|
case ".zip", ".rar", ".gz", ".bz2", ".xz", ".zst", ".br":
|
2019-04-07 05:14:28 +08:00
|
|
|
return false, true
|
2014-07-09 00:32:55 +08:00
|
|
|
case ".pdf", ".txt", ".html", ".htm", ".css", ".js", ".json":
|
2019-04-07 05:14:28 +08:00
|
|
|
return true, true
|
2018-12-23 07:05:31 +08:00
|
|
|
case ".php", ".java", ".go", ".rb", ".c", ".cpp", ".h", ".hpp":
|
2019-04-07 05:14:28 +08:00
|
|
|
return true, true
|
2018-12-28 04:17:05 +08:00
|
|
|
case ".png", ".jpg", ".jpeg":
|
2019-04-07 05:14:28 +08:00
|
|
|
return false, true
|
2012-12-23 05:15:09 +08:00
|
|
|
}
|
2018-12-23 07:05:31 +08:00
|
|
|
|
|
|
|
// by mime type
|
2012-12-23 05:15:09 +08:00
|
|
|
if strings.HasPrefix(mtype, "application/") {
|
2020-06-24 00:12:02 +08:00
|
|
|
if strings.HasSuffix(mtype, "zstd") {
|
|
|
|
return false, true
|
|
|
|
}
|
2013-01-17 16:15:09 +08:00
|
|
|
if strings.HasSuffix(mtype, "xml") {
|
2019-04-07 05:14:28 +08:00
|
|
|
return true, true
|
2013-01-17 16:15:09 +08:00
|
|
|
}
|
|
|
|
if strings.HasSuffix(mtype, "script") {
|
2019-04-07 05:14:28 +08:00
|
|
|
return true, true
|
2012-12-23 05:15:09 +08:00
|
|
|
}
|
2021-04-29 04:36:53 +08:00
|
|
|
if strings.HasSuffix(mtype, "vnd.rar") {
|
2021-04-28 16:54:19 +08:00
|
|
|
return false, true
|
|
|
|
}
|
2020-01-30 12:51:58 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if strings.HasPrefix(mtype, "audio/") {
|
|
|
|
switch strings.TrimPrefix(mtype, "audio/") {
|
|
|
|
case "wave", "wav", "x-wav", "x-pn-wav":
|
|
|
|
return true, true
|
|
|
|
}
|
2012-12-23 05:15:09 +08:00
|
|
|
}
|
2018-12-23 07:05:31 +08:00
|
|
|
|
2019-04-07 05:14:28 +08:00
|
|
|
return false, false
|
2012-07-30 16:36:25 +08:00
|
|
|
}
|