2021-08-13 17:20:17 +01:00
|
|
|
package aghos
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
"io"
|
2021-10-14 17:39:21 +01:00
|
|
|
"io/fs"
|
2021-08-13 17:20:17 +01:00
|
|
|
|
2024-04-03 11:44:51 +01:00
|
|
|
"github.com/AdguardTeam/golibs/container"
|
2021-08-13 17:20:17 +01:00
|
|
|
"github.com/AdguardTeam/golibs/errors"
|
|
|
|
)
|
|
|
|
|
|
|
|
// FileWalker is the signature of a function called for files in the file tree.
|
|
|
|
// As opposed to filepath.Walk it only walk the files (not directories) matching
|
|
|
|
// the provided pattern and those returned by function itself. All patterns
|
2021-12-01 13:26:46 +00:00
|
|
|
// should be valid for fs.Glob. If FileWalker returns false for cont then
|
|
|
|
// walking terminates. Prefer using bufio.Scanner to read the r since the input
|
|
|
|
// is not limited.
|
2021-08-13 17:20:17 +01:00
|
|
|
//
|
2021-12-01 13:26:46 +00:00
|
|
|
// TODO(e.burkov, a.garipov): Move into another package like aghfs.
|
2021-08-13 17:20:17 +01:00
|
|
|
//
|
|
|
|
// TODO(e.burkov): Think about passing filename or any additional data.
|
|
|
|
type FileWalker func(r io.Reader) (patterns []string, cont bool, err error)
|
|
|
|
|
2021-10-14 17:39:21 +01:00
|
|
|
// checkFile tries to open and process a single file located on sourcePath in
|
|
|
|
// the specified fsys. The path is skipped if it's a directory.
|
|
|
|
func checkFile(
|
|
|
|
fsys fs.FS,
|
|
|
|
c FileWalker,
|
|
|
|
sourcePath string,
|
|
|
|
) (patterns []string, cont bool, err error) {
|
|
|
|
var f fs.File
|
|
|
|
f, err = fsys.Open(sourcePath)
|
2021-08-13 17:20:17 +01:00
|
|
|
if err != nil {
|
2021-10-14 17:39:21 +01:00
|
|
|
if errors.Is(err, fs.ErrNotExist) {
|
|
|
|
// Ignore non-existing files since this may only happen when the
|
|
|
|
// file was removed after filepath.Glob matched it.
|
2021-08-13 17:20:17 +01:00
|
|
|
return nil, true, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil, false, err
|
|
|
|
}
|
|
|
|
defer func() { err = errors.WithDeferred(err, f.Close()) }()
|
|
|
|
|
2021-10-14 17:39:21 +01:00
|
|
|
var fi fs.FileInfo
|
|
|
|
if fi, err = f.Stat(); err != nil {
|
|
|
|
return nil, true, err
|
2021-12-01 13:26:46 +00:00
|
|
|
} else if fi.IsDir() {
|
2021-10-14 17:39:21 +01:00
|
|
|
// Skip the directories.
|
|
|
|
return nil, true, nil
|
|
|
|
}
|
|
|
|
|
2021-12-01 13:26:46 +00:00
|
|
|
return c(f)
|
2021-08-13 17:20:17 +01:00
|
|
|
}
|
|
|
|
|
2021-10-14 17:39:21 +01:00
|
|
|
// handlePatterns parses the patterns in fsys and ignores duplicates using
|
|
|
|
// srcSet. srcSet must be non-nil.
|
|
|
|
func handlePatterns(
|
|
|
|
fsys fs.FS,
|
2024-04-03 11:44:51 +01:00
|
|
|
srcSet *container.MapSet[string],
|
2021-10-14 17:39:21 +01:00
|
|
|
patterns ...string,
|
|
|
|
) (sub []string, err error) {
|
2021-08-13 17:20:17 +01:00
|
|
|
sub = make([]string, 0, len(patterns))
|
|
|
|
for _, p := range patterns {
|
|
|
|
var matches []string
|
2021-10-14 17:39:21 +01:00
|
|
|
matches, err = fs.Glob(fsys, p)
|
2021-08-13 17:20:17 +01:00
|
|
|
if err != nil {
|
|
|
|
// Enrich error with the pattern because filepath.Glob
|
|
|
|
// doesn't do it.
|
|
|
|
return nil, fmt.Errorf("invalid pattern %q: %w", p, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, m := range matches {
|
|
|
|
if srcSet.Has(m) {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
srcSet.Add(m)
|
|
|
|
sub = append(sub, m)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return sub, nil
|
|
|
|
}
|
|
|
|
|
2021-10-14 17:39:21 +01:00
|
|
|
// Walk starts walking the files in fsys defined by patterns from initial.
|
|
|
|
// It only returns true if fw signed to stop walking.
|
|
|
|
func (fw FileWalker) Walk(fsys fs.FS, initial ...string) (ok bool, err error) {
|
|
|
|
// The slice of sources keeps the order in which the files are walked since
|
|
|
|
// srcSet.Values() returns strings in undefined order.
|
2024-04-03 11:44:51 +01:00
|
|
|
srcSet := container.NewMapSet[string]()
|
2021-08-13 17:20:17 +01:00
|
|
|
var src []string
|
2021-10-14 17:39:21 +01:00
|
|
|
src, err = handlePatterns(fsys, srcSet, initial...)
|
2021-08-13 17:20:17 +01:00
|
|
|
if err != nil {
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
|
|
|
var filename string
|
|
|
|
defer func() { err = errors.Annotate(err, "checking %q: %w", filename) }()
|
|
|
|
|
2024-04-04 13:52:39 +01:00
|
|
|
// TODO(e.burkov): Redo this loop, as it modifies the very same slice it
|
|
|
|
// iterates over.
|
2021-08-13 17:20:17 +01:00
|
|
|
for i := 0; i < len(src); i++ {
|
|
|
|
var patterns []string
|
|
|
|
var cont bool
|
|
|
|
filename = src[i]
|
2021-10-14 17:39:21 +01:00
|
|
|
patterns, cont, err = checkFile(fsys, fw, src[i])
|
2021-08-13 17:20:17 +01:00
|
|
|
if err != nil {
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if !cont {
|
|
|
|
return true, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
var subsrc []string
|
2021-10-14 17:39:21 +01:00
|
|
|
subsrc, err = handlePatterns(fsys, srcSet, patterns...)
|
2021-08-13 17:20:17 +01:00
|
|
|
if err != nil {
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
|
|
|
|
src = append(src, subsrc...)
|
|
|
|
}
|
|
|
|
|
|
|
|
return false, nil
|
|
|
|
}
|