2016-11-18 00:47:31 +00:00
|
|
|
package mtree
|
|
|
|
|
|
|
|
import (
|
|
|
|
"archive/tar"
|
|
|
|
"crypto/md5"
|
|
|
|
"crypto/sha1"
|
|
|
|
"crypto/sha256"
|
|
|
|
"crypto/sha512"
|
|
|
|
"fmt"
|
|
|
|
"hash"
|
|
|
|
"io"
|
|
|
|
"os"
|
|
|
|
|
2017-02-15 16:10:30 +00:00
|
|
|
"github.com/vbatts/go-mtree/pkg/govis"
|
2016-11-18 00:47:31 +00:00
|
|
|
"golang.org/x/crypto/ripemd160"
|
|
|
|
)
|
|
|
|
|
|
|
|
// KeywordFunc is the type of a function called on each file to be included in
|
|
|
|
// a DirectoryHierarchy, that will produce the string output of the keyword to
|
|
|
|
// be included for the file entry. Otherwise, empty string.
|
|
|
|
// io.Reader `r` is to the file stream for the file payload. While this
|
|
|
|
// function takes an io.Reader, the caller needs to reset it to the beginning
|
|
|
|
// for each new KeywordFunc
|
|
|
|
type KeywordFunc func(path string, info os.FileInfo, r io.Reader) (KeyVal, error)
|
|
|
|
|
|
|
|
var (
|
|
|
|
// KeywordFuncs is the map of all keywords (and the functions to produce them)
|
|
|
|
KeywordFuncs = map[Keyword]KeywordFunc{
|
|
|
|
"size": sizeKeywordFunc, // The size, in bytes, of the file
|
|
|
|
"type": typeKeywordFunc, // The type of the file
|
|
|
|
"time": timeKeywordFunc, // The last modification time of the file
|
|
|
|
"link": linkKeywordFunc, // The target of the symbolic link when type=link
|
|
|
|
"uid": uidKeywordFunc, // The file owner as a numeric value
|
|
|
|
"gid": gidKeywordFunc, // The file group as a numeric value
|
|
|
|
"nlink": nlinkKeywordFunc, // The number of hard links the file is expected to have
|
|
|
|
"uname": unameKeywordFunc, // The file owner as a symbolic name
|
|
|
|
"mode": modeKeywordFunc, // The current file's permissions as a numeric (octal) or symbolic value
|
|
|
|
"cksum": cksumKeywordFunc, // The checksum of the file using the default algorithm specified by the cksum(1) utility
|
|
|
|
"md5": hasherKeywordFunc("md5digest", md5.New), // The MD5 message digest of the file
|
|
|
|
"md5digest": hasherKeywordFunc("md5digest", md5.New), // A synonym for `md5`
|
|
|
|
"rmd160": hasherKeywordFunc("ripemd160digest", ripemd160.New), // The RIPEMD160 message digest of the file
|
|
|
|
"rmd160digest": hasherKeywordFunc("ripemd160digest", ripemd160.New), // A synonym for `rmd160`
|
|
|
|
"ripemd160digest": hasherKeywordFunc("ripemd160digest", ripemd160.New), // A synonym for `rmd160`
|
|
|
|
"sha1": hasherKeywordFunc("sha1digest", sha1.New), // The SHA1 message digest of the file
|
|
|
|
"sha1digest": hasherKeywordFunc("sha1digest", sha1.New), // A synonym for `sha1`
|
|
|
|
"sha256": hasherKeywordFunc("sha256digest", sha256.New), // The SHA256 message digest of the file
|
|
|
|
"sha256digest": hasherKeywordFunc("sha256digest", sha256.New), // A synonym for `sha256`
|
|
|
|
"sha384": hasherKeywordFunc("sha384digest", sha512.New384), // The SHA384 message digest of the file
|
|
|
|
"sha384digest": hasherKeywordFunc("sha384digest", sha512.New384), // A synonym for `sha384`
|
|
|
|
"sha512": hasherKeywordFunc("sha512digest", sha512.New), // The SHA512 message digest of the file
|
|
|
|
"sha512digest": hasherKeywordFunc("sha512digest", sha512.New), // A synonym for `sha512`
|
|
|
|
|
|
|
|
"flags": flagsKeywordFunc, // NOTE: this is a noop, but here to support the presence of the "flags" keyword.
|
|
|
|
|
|
|
|
// This is not an upstreamed keyword, but used to vary from "time", as tar
|
|
|
|
// archives do not store nanosecond precision. So comparing on "time" will
|
|
|
|
// be only seconds level accurate.
|
|
|
|
"tar_time": tartimeKeywordFunc, // The last modification time of the file, from a tar archive mtime
|
|
|
|
|
|
|
|
// This is not an upstreamed keyword, but a needed attribute for file validation.
|
|
|
|
// The pattern for this keyword key is prefixed by "xattr." followed by the extended attribute "namespace.key".
|
|
|
|
// The keyword value is the SHA1 digest of the extended attribute's value.
|
|
|
|
// In this way, the order of the keys does not matter, and the contents of the value is not revealed.
|
|
|
|
"xattr": xattrKeywordFunc,
|
|
|
|
"xattrs": xattrKeywordFunc,
|
|
|
|
}
|
|
|
|
)
|
|
|
|
var (
|
|
|
|
modeKeywordFunc = func(path string, info os.FileInfo, r io.Reader) (KeyVal, error) {
|
|
|
|
permissions := info.Mode().Perm()
|
|
|
|
if os.ModeSetuid&info.Mode() > 0 {
|
|
|
|
permissions |= (1 << 11)
|
|
|
|
}
|
|
|
|
if os.ModeSetgid&info.Mode() > 0 {
|
|
|
|
permissions |= (1 << 10)
|
|
|
|
}
|
|
|
|
if os.ModeSticky&info.Mode() > 0 {
|
|
|
|
permissions |= (1 << 9)
|
|
|
|
}
|
|
|
|
return KeyVal(fmt.Sprintf("mode=%#o", permissions)), nil
|
|
|
|
}
|
|
|
|
sizeKeywordFunc = func(path string, info os.FileInfo, r io.Reader) (KeyVal, error) {
|
|
|
|
if sys, ok := info.Sys().(*tar.Header); ok {
|
|
|
|
if sys.Typeflag == tar.TypeSymlink {
|
|
|
|
return KeyVal(fmt.Sprintf("size=%d", len(sys.Linkname))), nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return KeyVal(fmt.Sprintf("size=%d", info.Size())), nil
|
|
|
|
}
|
|
|
|
cksumKeywordFunc = func(path string, info os.FileInfo, r io.Reader) (KeyVal, error) {
|
|
|
|
if !info.Mode().IsRegular() {
|
|
|
|
return emptyKV, nil
|
|
|
|
}
|
|
|
|
sum, _, err := cksum(r)
|
|
|
|
if err != nil {
|
|
|
|
return emptyKV, err
|
|
|
|
}
|
|
|
|
return KeyVal(fmt.Sprintf("cksum=%d", sum)), nil
|
|
|
|
}
|
|
|
|
hasherKeywordFunc = func(name string, newHash func() hash.Hash) KeywordFunc {
|
|
|
|
return func(path string, info os.FileInfo, r io.Reader) (KeyVal, error) {
|
|
|
|
if !info.Mode().IsRegular() {
|
|
|
|
return emptyKV, nil
|
|
|
|
}
|
|
|
|
h := newHash()
|
|
|
|
if _, err := io.Copy(h, r); err != nil {
|
|
|
|
return emptyKV, err
|
|
|
|
}
|
|
|
|
return KeyVal(fmt.Sprintf("%s=%x", KeywordSynonym(name), h.Sum(nil))), nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
tartimeKeywordFunc = func(path string, info os.FileInfo, r io.Reader) (KeyVal, error) {
|
|
|
|
return KeyVal(fmt.Sprintf("tar_time=%d.%9.9d", info.ModTime().Unix(), 0)), nil
|
|
|
|
}
|
|
|
|
timeKeywordFunc = func(path string, info os.FileInfo, r io.Reader) (KeyVal, error) {
|
|
|
|
tSec := info.ModTime().Unix()
|
|
|
|
tNano := info.ModTime().Nanosecond()
|
|
|
|
return KeyVal(fmt.Sprintf("time=%d.%9.9d", tSec, tNano)), nil
|
|
|
|
}
|
|
|
|
linkKeywordFunc = func(path string, info os.FileInfo, r io.Reader) (KeyVal, error) {
|
|
|
|
if sys, ok := info.Sys().(*tar.Header); ok {
|
|
|
|
if sys.Linkname != "" {
|
2017-02-15 16:10:30 +00:00
|
|
|
linkname, err := govis.Vis(sys.Linkname, DefaultVisFlags)
|
2016-11-18 00:47:31 +00:00
|
|
|
if err != nil {
|
|
|
|
return emptyKV, err
|
|
|
|
}
|
|
|
|
return KeyVal(fmt.Sprintf("link=%s", linkname)), nil
|
|
|
|
}
|
|
|
|
return emptyKV, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
if info.Mode()&os.ModeSymlink != 0 {
|
|
|
|
str, err := os.Readlink(path)
|
|
|
|
if err != nil {
|
|
|
|
return emptyKV, err
|
|
|
|
}
|
2017-02-15 16:10:30 +00:00
|
|
|
linkname, err := govis.Vis(str, DefaultVisFlags)
|
2016-11-18 00:47:31 +00:00
|
|
|
if err != nil {
|
|
|
|
return emptyKV, err
|
|
|
|
}
|
|
|
|
return KeyVal(fmt.Sprintf("link=%s", linkname)), nil
|
|
|
|
}
|
|
|
|
return emptyKV, nil
|
|
|
|
}
|
|
|
|
typeKeywordFunc = func(path string, info os.FileInfo, r io.Reader) (KeyVal, error) {
|
|
|
|
if info.Mode().IsDir() {
|
|
|
|
return "type=dir", nil
|
|
|
|
}
|
|
|
|
if info.Mode().IsRegular() {
|
|
|
|
return "type=file", nil
|
|
|
|
}
|
|
|
|
if info.Mode()&os.ModeSocket != 0 {
|
|
|
|
return "type=socket", nil
|
|
|
|
}
|
|
|
|
if info.Mode()&os.ModeSymlink != 0 {
|
|
|
|
return "type=link", nil
|
|
|
|
}
|
|
|
|
if info.Mode()&os.ModeNamedPipe != 0 {
|
|
|
|
return "type=fifo", nil
|
|
|
|
}
|
|
|
|
if info.Mode()&os.ModeDevice != 0 {
|
|
|
|
if info.Mode()&os.ModeCharDevice != 0 {
|
|
|
|
return "type=char", nil
|
|
|
|
}
|
|
|
|
return "type=device", nil
|
|
|
|
}
|
|
|
|
return emptyKV, nil
|
|
|
|
}
|
|
|
|
)
|