2021-08-09 21:35:18 +00:00
|
|
|
package shell
|
|
|
|
|
|
|
|
import (
	"context"
	"flag"
	"fmt"
	"io"
	"path/filepath"
	"strings"
	"time"

	"github.com/seaweedfs/seaweedfs/weed/filer"
	"github.com/seaweedfs/seaweedfs/weed/pb/filer_pb"
	"github.com/seaweedfs/seaweedfs/weed/util"
)
|
|
|
|
|
|
|
|
func init() {
|
|
|
|
Commands = append(Commands, &commandRemoteUncache{})
|
|
|
|
}
|
|
|
|
|
|
|
|
// commandRemoteUncache implements the "remote.uncache" shell command.
// It carries no state; all inputs arrive through the arguments of Do.
type commandRemoteUncache struct{}
|
|
|
|
|
|
|
|
func (c *commandRemoteUncache) Name() string {
|
|
|
|
return "remote.uncache"
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *commandRemoteUncache) Help() string {
|
|
|
|
return `keep the metadata but remote cache the file content for mounted directories or files
|
|
|
|
|
2021-08-14 22:11:52 +00:00
|
|
|
This is designed to run regularly. So you can add it to some cronjob.
|
|
|
|
If a file is not synchronized with the remote copy, the file will be skipped to avoid loss of data.
|
|
|
|
|
2021-08-14 22:55:53 +00:00
|
|
|
remote.uncache -dir=/xxx
|
|
|
|
remote.uncache -dir=/xxx/some/sub/dir
|
|
|
|
remote.uncache -dir=/xxx/some/sub/dir -include=*.pdf
|
|
|
|
remote.uncache -dir=/xxx/some/sub/dir -exclude=*.txt
|
2021-08-21 09:17:10 +00:00
|
|
|
remote.uncache -minSize=1024000 # uncache files larger than 100K
|
|
|
|
remote.uncache -minAge=3600 # uncache files older than 1 hour
|
2021-08-09 21:35:18 +00:00
|
|
|
|
|
|
|
`
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *commandRemoteUncache) Do(args []string, commandEnv *CommandEnv, writer io.Writer) (err error) {
|
|
|
|
|
2021-11-29 07:10:32 +00:00
|
|
|
remoteUncacheCommand := flag.NewFlagSet(c.Name(), flag.ContinueOnError)
|
2021-08-09 21:35:18 +00:00
|
|
|
|
2021-11-29 07:10:32 +00:00
|
|
|
dir := remoteUncacheCommand.String("dir", "", "a directory in filer")
|
|
|
|
fileFiler := newFileFilter(remoteUncacheCommand)
|
2021-08-09 21:35:18 +00:00
|
|
|
|
2021-11-29 07:10:32 +00:00
|
|
|
if err = remoteUncacheCommand.Parse(args); err != nil {
|
2021-08-09 21:35:18 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
mappings, listErr := filer.ReadMountMappings(commandEnv.option.GrpcDialOption, commandEnv.option.FilerAddress)
|
|
|
|
if listErr != nil {
|
|
|
|
return listErr
|
|
|
|
}
|
2021-09-05 21:47:06 +00:00
|
|
|
if *dir != "" {
|
|
|
|
var localMountedDir string
|
|
|
|
for k := range mappings.Mappings {
|
|
|
|
if strings.HasPrefix(*dir, k) {
|
|
|
|
localMountedDir = k
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if localMountedDir == "" {
|
|
|
|
jsonPrintln(writer, mappings)
|
|
|
|
fmt.Fprintf(writer, "%s is not mounted\n", *dir)
|
|
|
|
return nil
|
|
|
|
}
|
2021-08-09 21:35:18 +00:00
|
|
|
|
2021-09-05 21:47:06 +00:00
|
|
|
// pull content from remote
|
|
|
|
if err = c.uncacheContentData(commandEnv, writer, util.FullPath(*dir), fileFiler); err != nil {
|
|
|
|
return fmt.Errorf("uncache content data: %v", err)
|
2021-08-09 21:35:18 +00:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-09-05 21:47:06 +00:00
|
|
|
for key, _ := range mappings.Mappings {
|
|
|
|
if err := c.uncacheContentData(commandEnv, writer, util.FullPath(key), fileFiler); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2021-08-09 21:35:18 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-08-14 22:11:52 +00:00
|
|
|
func (c *commandRemoteUncache) uncacheContentData(commandEnv *CommandEnv, writer io.Writer, dirToCache util.FullPath, fileFilter *FileFilter) error {
|
2021-08-09 21:35:18 +00:00
|
|
|
|
|
|
|
return recursivelyTraverseDirectory(commandEnv, dirToCache, func(dir util.FullPath, entry *filer_pb.Entry) bool {
|
2021-08-26 22:18:34 +00:00
|
|
|
|
2021-08-09 21:35:18 +00:00
|
|
|
if !mayHaveCachedToLocal(entry) {
|
|
|
|
return true // true means recursive traversal should continue
|
|
|
|
}
|
2021-08-14 22:11:52 +00:00
|
|
|
|
2021-09-04 20:58:14 +00:00
|
|
|
if !fileFilter.matches(entry) {
|
2021-08-14 22:11:52 +00:00
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
2021-08-15 04:46:34 +00:00
|
|
|
if entry.RemoteEntry.LastLocalSyncTsNs/1e9 < entry.Attributes.Mtime {
|
2021-08-14 22:11:52 +00:00
|
|
|
return true // should not uncache an entry that is not synchronized with remote
|
|
|
|
}
|
|
|
|
|
2021-08-15 04:46:34 +00:00
|
|
|
entry.RemoteEntry.LastLocalSyncTsNs = 0
|
2021-08-09 22:24:21 +00:00
|
|
|
entry.Chunks = nil
|
2021-08-09 21:35:18 +00:00
|
|
|
|
2021-08-26 22:18:34 +00:00
|
|
|
fmt.Fprintf(writer, "Uncache %+v ... ", dir.Child(entry.Name))
|
2021-08-09 21:35:18 +00:00
|
|
|
|
2021-12-26 08:15:03 +00:00
|
|
|
err := commandEnv.WithFilerClient(false, func(client filer_pb.SeaweedFilerClient) error {
|
2021-08-09 21:35:18 +00:00
|
|
|
_, updateErr := client.UpdateEntry(context.Background(), &filer_pb.UpdateEntryRequest{
|
2021-08-09 21:37:34 +00:00
|
|
|
Directory: string(dir),
|
|
|
|
Entry: entry,
|
2021-08-09 21:35:18 +00:00
|
|
|
})
|
|
|
|
return updateErr
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
fmt.Fprintf(writer, "uncache %+v: %v\n", dir.Child(entry.Name), err)
|
|
|
|
return false
|
|
|
|
}
|
2021-08-26 22:18:34 +00:00
|
|
|
fmt.Fprintf(writer, "Done\n")
|
2021-08-09 21:35:18 +00:00
|
|
|
|
|
|
|
return true
|
|
|
|
})
|
|
|
|
}
|
2021-08-14 22:11:52 +00:00
|
|
|
|
|
|
|
// FileFilter holds the optional criteria used to select entries by name,
// size and age. Every field is a pointer because it is bound to a command
// line flag by newFileFilter and only carries a value after flag parsing.
type FileFilter struct {
	// file name patterns; an empty string disables the check
	include, exclude *string
	// size bounds in bytes; -1 disables the check
	minSize, maxSize *int64
	// age bounds in seconds; -1 disables the check
	minAge, maxAge *int64
}
|
|
|
|
|
|
|
|
func newFileFilter(remoteMountCommand *flag.FlagSet) (ff *FileFilter) {
|
|
|
|
ff = &FileFilter{}
|
|
|
|
ff.include = remoteMountCommand.String("include", "", "pattens of file names, e.g., *.pdf, *.html, ab?d.txt")
|
|
|
|
ff.exclude = remoteMountCommand.String("exclude", "", "pattens of file names, e.g., *.pdf, *.html, ab?d.txt")
|
|
|
|
ff.minSize = remoteMountCommand.Int64("minSize", -1, "minimum file size in bytes")
|
|
|
|
ff.maxSize = remoteMountCommand.Int64("maxSize", -1, "maximum file size in bytes")
|
|
|
|
ff.minAge = remoteMountCommand.Int64("minAge", -1, "minimum file age in seconds")
|
|
|
|
ff.maxAge = remoteMountCommand.Int64("maxAge", -1, "maximum file age in seconds")
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
func (ff *FileFilter) matches(entry *filer_pb.Entry) bool {
|
|
|
|
if *ff.include != "" {
|
|
|
|
if ok, _ := filepath.Match(*ff.include, entry.Name); !ok {
|
2021-09-04 20:45:39 +00:00
|
|
|
return false
|
2021-08-14 22:11:52 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
if *ff.exclude != "" {
|
|
|
|
if ok, _ := filepath.Match(*ff.exclude, entry.Name); ok {
|
2021-09-04 20:45:39 +00:00
|
|
|
return false
|
2021-08-14 22:11:52 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
if *ff.minSize != -1 {
|
|
|
|
if int64(entry.Attributes.FileSize) < *ff.minSize {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if *ff.maxSize != -1 {
|
|
|
|
if int64(entry.Attributes.FileSize) > *ff.maxSize {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if *ff.minAge != -1 {
|
|
|
|
if entry.Attributes.Crtime < *ff.minAge {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if *ff.maxAge != -1 {
|
|
|
|
if entry.Attributes.Crtime > *ff.maxAge {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
2021-09-04 20:45:39 +00:00
|
|
|
return true
|
2021-08-14 22:11:52 +00:00
|
|
|
}
|