blob: 53dcabedab2e0cdd7759e675aec9014a4a43b2eb [file] [log] [blame] [edit]
/* Copyright 2018 The Bazel Authors. All rights reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package walk
import (
"bufio"
"errors"
"flag"
"fmt"
"io/fs"
"log"
"os"
"path"
"path/filepath"
"strings"
"github.com/bazelbuild/bazel-gazelle/config"
"github.com/bazelbuild/bazel-gazelle/rule"
bzl "github.com/bazelbuild/buildtools/build"
"github.com/bmatcuk/doublestar/v4"
gzflag "github.com/bazelbuild/bazel-gazelle/flag"
)
// generationModeType represents one of the generation modes. Values of this
// type are compared against the argument of the generation_mode directive.
type generationModeType string
// Generation modes. The string values are the accepted directive arguments.
const (
// generationModeUpdate ("update_only"): update and maintain existing BUILD files.
generationModeUpdate generationModeType = "update_only"
// generationModeCreate ("create_and_update"): create new and update existing BUILD files.
generationModeCreate generationModeType = "create_and_update"
)
// walkConfig holds the walk-related settings. It is stored in
// config.Config.Exts under the walkName key.
type walkConfig struct {
// updateOnly is set by the generation_mode directive: true for
// "update_only", false for "create_and_update".
updateOnly bool
// ignoreFilter holds the ignore rules loaded from .bazelignore and
// REPO.bazel when flags are checked.
ignoreFilter *ignoreFilter
// excludes holds glob patterns from the -exclude flag and from exclude
// directives (directive values are joined onto rel before being stored).
//
// TODO(#472): store location information to validate each exclude. They
// may be set in one directory and used in another. Excludes work on
// declared generated files, so we can't just stat.
excludes []string
// ignore is reset to false by configureForWalk and set to true when the
// build file being processed contains an ignore directive.
ignore bool
// follow holds glob patterns from follow directives (directive values are
// joined onto rel before being stored).
follow []string
// validBuildFileNames comes from -build_file_name or the build_file_name
// directive; Configure copies it to config.Config.ValidBuildFileNames.
validBuildFileNames []string // to be copied to config.Config
}
// Keys used in config.Config.Exts by this package.
const (
// walkName is the key under which the active *walkConfig is stored.
walkName = "_walk"
// walkNameCached is the key under which a preprocessed configuration may be
// placed before Configure is called; Configure moves it to walkName.
walkNameCached = "_walkCached"
)
// getWalkConfig returns the *walkConfig stored in c.Exts under walkName.
// The type assertion is unchecked, so it panics when the entry is missing or
// holds a value of another type.
func getWalkConfig(c *config.Config) *walkConfig {
	ext := c.Exts[walkName]
	return ext.(*walkConfig)
}
// clone returns a shallow copy of wc whose excludes and follow slices can be
// appended to without affecting wc.
func (wc *walkConfig) clone() *walkConfig {
	dup := new(walkConfig)
	*dup = *wc

	// Clamp capacity to length for the two slices that get appended to,
	// possibly from several goroutines: the first append on the copy is then
	// forced to allocate a fresh backing array instead of writing into the
	// shared one. The remaining slices are either never mutated or are
	// replaced wholesale when written.
	nExcludes, nFollow := len(wc.excludes), len(wc.follow)
	dup.excludes = wc.excludes[:nExcludes:nExcludes]
	dup.follow = wc.follow[:nFollow:nFollow]
	return dup
}
// isExcludedDir reports whether the directory p should be skipped: it is a
// ".git" directory, it is ignored by the ignore filter, or it matches one of
// the exclude patterns. The checks run in that order and stop at the first hit.
func (wc *walkConfig) isExcludedDir(p string) bool {
	switch {
	case path.Base(p) == ".git":
		return true
	case wc.ignoreFilter.isDirectoryIgnored(p):
		return true
	default:
		return matchAnyGlob(wc.excludes, p)
	}
}
// isExcludedFile reports whether the file p is ignored by the ignore filter or
// matches one of the exclude patterns.
func (wc *walkConfig) isExcludedFile(p string) bool {
	if wc.ignoreFilter.isFileIgnored(p) {
		return true
	}
	return matchAnyGlob(wc.excludes, p)
}
// shouldFollow reports whether p matches any of the follow patterns.
func (wc *walkConfig) shouldFollow(p string) bool {
	followed := matchAnyGlob(wc.follow, p)
	return followed
}
// Compile-time check that *Configurer satisfies config.Configurer.
var _ config.Configurer = (*Configurer)(nil)
// Configurer registers the walk-related command-line flags, handles the
// walk-related directives, and stores the resulting walkConfig in
// config.Config.Exts.
type Configurer struct {
// Excludes and BUILD filenames specified on the command line.
// May be extended by BUILD directives.
cliExcludes []string
cliBuildFileNames string
// Alternate BUILD read/write directories, as given on the command line.
// Relative values are resolved against the working directory in CheckFlags.
readBuildFilesDir, writeBuildFilesDir string
}
// RegisterFlags registers the -exclude, -build_file_name,
// -experimental_read_build_files_dir and -experimental_write_build_files_dir
// flags on fs. Parsed values are stored in cr and applied in CheckFlags.
func (cr *Configurer) RegisterFlags(fs *flag.FlagSet, cmd string, c *config.Config) {
	excludeFlag := &gzflag.MultiFlag{Values: &cr.cliExcludes}
	defaultBuildFileNames := strings.Join(config.DefaultValidBuildFileNames, ",")

	fs.Var(
		excludeFlag,
		"exclude",
		"pattern that should be ignored (may be repeated)",
	)
	fs.StringVar(
		&cr.cliBuildFileNames,
		"build_file_name",
		defaultBuildFileNames,
		"comma-separated list of valid build file names.\nThe first element of the list is the name of output build files to generate.",
	)
	fs.StringVar(
		&cr.readBuildFilesDir,
		"experimental_read_build_files_dir",
		"",
		"path to a directory where build files should be read from (instead of -repo_root)",
	)
	fs.StringVar(
		&cr.writeBuildFilesDir,
		"experimental_write_build_files_dir",
		"",
		"path to a directory where build files should be written to (instead of -repo_root)",
	)
}
// CheckFlags applies the parsed command-line flags to c: it sets the valid
// build file names, resolves the optional read/write build file directories
// against c.WorkDir when they are relative, and installs the initial
// walkConfig (including the repository ignore filter) in c.Exts.
// It always returns nil.
func (cr *Configurer) CheckFlags(_ *flag.FlagSet, c *config.Config) error {
	buildFileNames := strings.Split(cr.cliBuildFileNames, ",")
	c.ValidBuildFileNames = buildFileNames

	if dir := cr.readBuildFilesDir; dir != "" {
		if !filepath.IsAbs(dir) {
			dir = filepath.Join(c.WorkDir, dir)
		}
		c.ReadBuildFilesDir = dir
	}

	if dir := cr.writeBuildFilesDir; dir != "" {
		if !filepath.IsAbs(dir) {
			dir = filepath.Join(c.WorkDir, dir)
		}
		c.WriteBuildFilesDir = dir
	}

	c.Exts[walkName] = &walkConfig{
		ignoreFilter:        newIgnoreFilter(c.RepoRoot),
		excludes:            cr.cliExcludes,
		validBuildFileNames: buildFileNames,
	}
	return nil
}
// KnownDirectives returns the directive keys handled by this Configurer.
func (*Configurer) KnownDirectives() []string {
	return []string{
		"build_file_name",
		"generation_mode",
		"exclude",
		"follow",
		"ignore",
	}
}
// Configure installs the walkConfig for the directory rel in c.Exts[walkName]
// and copies its valid build file names to c.ValidBuildFileNames.
func (cr *Configurer) Configure(c *config.Config, rel string, f *rule.File) {
	cached := c.Exts[walkNameCached]
	if cached == nil {
		// Some unit tests never set c.Exts[walkNameCached]; fall back to
		// processing the directives here with the same code the walk uses.
		c.Exts[walkName] = configureForWalk(getWalkConfig(c), rel, f)
	} else {
		// Normally a Configurer would process directives at this point. The
		// tree walk is parallelized, though, and has already done that work in
		// configureForWalk; the caller of this method (configure) hands over
		// the result in c.Exts[walkNameCached]. Move it into place rather than
		// processing the directives a second time.
		c.Exts[walkName] = cached
		delete(c.Exts, walkNameCached)
	}

	wc := getWalkConfig(c)
	c.ValidBuildFileNames = wc.validBuildFileNames
}
// configureForWalk derives the walkConfig for the directory rel from its
// parent's configuration and the directives in the build file f.
//
// The result starts as a clone of parent with ignore reset to false, so the
// ignore directive is not inherited. f may be nil, in which case the clone is
// returned as is. Directives are applied in order:
//
//   - build_file_name replaces validBuildFileNames with the comma-separated value.
//   - generation_mode sets updateOnly; an unknown mode terminates the process.
//   - exclude and follow append the pattern joined onto rel; invalid patterns
//     are logged and skipped.
//   - ignore sets ignore to true; a non-empty argument is logged as a likely
//     mistake but the directive still takes effect.
func configureForWalk(parent *walkConfig, rel string, f *rule.File) *walkConfig {
	wc := parent.clone()
	wc.ignore = false
	if f == nil {
		return wc
	}

	for _, d := range f.Directives {
		switch d.Key {
		case "build_file_name":
			wc.validBuildFileNames = strings.Split(d.Value, ",")

		case "generation_mode":
			switch generationModeType(strings.TrimSpace(d.Value)) {
			case generationModeUpdate:
				wc.updateOnly = true
			case generationModeCreate:
				wc.updateOnly = false
			default:
				// log.Fatalf exits the process, so nothing after it runs.
				log.Fatalf("unknown generation_mode %q in //%s", d.Value, f.Pkg)
			}

		case "exclude":
			pattern := path.Join(rel, d.Value)
			if err := checkPathMatchPattern(pattern); err != nil {
				log.Printf("the exclusion pattern is not valid %q: %s", pattern, err)
				continue
			}
			wc.excludes = append(wc.excludes, pattern)

		case "follow":
			pattern := path.Join(rel, d.Value)
			if err := checkPathMatchPattern(pattern); err != nil {
				log.Printf("the follow pattern is not valid %q: %s", pattern, err)
				continue
			}
			wc.follow = append(wc.follow, pattern)

		case "ignore":
			if d.Value != "" {
				log.Printf("the ignore directive does not take any arguments. Did you mean to use gazelle:exclude instead? in //%s '# gazelle:ignore %s'", f.Pkg, d.Value)
			}
			wc.ignore = true
		}
	}
	return wc
}
// ignoreFilter holds the ignore rules loaded from the repository root by
// newIgnoreFilter.
type ignoreFilter struct {
// ignoreDirectoryGlobs holds the glob patterns listed in the
// ignore_directories() call of REPO.bazel. They apply to directories only.
ignoreDirectoryGlobs []string
// ignorePaths holds the cleaned literal paths listed in .bazelignore. They
// are checked for both files and directories.
ignorePaths map[string]struct{}
}
// newIgnoreFilter builds an ignoreFilter from the .bazelignore and REPO.bazel
// files under repoRoot. A failure to load either file is logged rather than
// returned; whatever the loader returned is still stored in the filter.
func newIgnoreFilter(repoRoot string) *ignoreFilter {
	filter := &ignoreFilter{}
	var err error

	if filter.ignorePaths, err = loadBazelIgnore(repoRoot); err != nil {
		log.Printf("error loading .bazelignore: %v", err)
	}
	if filter.ignoreDirectoryGlobs, err = loadRepoDirectoryIgnore(repoRoot); err != nil {
		log.Printf("error loading REPO.bazel ignore_directories(): %v", err)
	}
	return filter
}
// isDirectoryIgnored reports whether the directory p is listed verbatim in
// ignorePaths or matches one of the ignoreDirectoryGlobs patterns.
func (f *ignoreFilter) isDirectoryIgnored(p string) bool {
	_, listed := f.ignorePaths[p]
	return listed || matchAnyGlob(f.ignoreDirectoryGlobs, p)
}
// isFileIgnored reports whether the file p is listed verbatim in ignorePaths.
// The directory glob patterns are not consulted for files.
func (f *ignoreFilter) isFileIgnored(p string) bool {
	if _, listed := f.ignorePaths[p]; listed {
		return true
	}
	return false
}
// loadBazelIgnore reads the .bazelignore file in repoRoot and returns the set
// of paths it lists.
//
// Blank lines and lines starting with '#' are skipped. Entries containing glob
// metacharacters ('*', '?', '[') are not supported; they are logged and
// skipped. Every remaining entry is cleaned with path.Clean before being
// stored.
//
// A missing file is not an error: the result is (nil, nil). If the file cannot
// be opened for another reason, the result is (nil, err). If reading fails
// part-way through (for example on a line longer than bufio.MaxScanTokenSize),
// the entries read so far are returned together with a non-nil error so the
// caller can report the truncation while still honoring what was parsed.
func loadBazelIgnore(repoRoot string) (map[string]struct{}, error) {
	// repoRoot is an OS path, so join with filepath rather than path.
	ignorePath := filepath.Join(repoRoot, ".bazelignore")
	file, err := os.Open(ignorePath)
	if errors.Is(err, fs.ErrNotExist) {
		return nil, nil
	}
	if err != nil {
		return nil, fmt.Errorf(".bazelignore exists but couldn't be read: %w", err)
	}
	defer file.Close()

	excludes := make(map[string]struct{})
	scanner := bufio.NewScanner(file)
	for scanner.Scan() {
		ignore := strings.TrimSpace(scanner.Text())
		if ignore == "" || strings.HasPrefix(ignore, "#") {
			continue
		}
		// Bazel ignore paths are always relative to repo root.
		// Glob patterns are not supported.
		if strings.ContainsAny(ignore, "*?[") {
			log.Printf("the .bazelignore exclusion pattern must not be a glob %s", ignore)
			continue
		}
		// Clean the path to remove any extra '.', './' etc otherwise
		// the exclude matching won't work correctly.
		excludes[path.Clean(ignore)] = struct{}{}
	}
	// Scan returns false both at EOF and on failure; only Err tells them apart.
	if err := scanner.Err(); err != nil {
		return excludes, fmt.Errorf(".bazelignore couldn't be read completely: %w", err)
	}
	return excludes, nil
}
func loadRepoDirectoryIgnore(repoRoot string) ([]string, error) {
repoFilePath := path.Join(repoRoot, "REPO.bazel")
repoFileContent, err := os.ReadFile(repoFilePath)
if errors.Is(err, fs.ErrNotExist) {
return nil, nil
}
if err != nil {
return nil, fmt.Errorf("REPO.bazel exists but couldn't be read: %v", err)
}
ast, err := bzl.Parse(repoRoot, repoFileContent)
if err != nil {
return nil, fmt.Errorf("failed to parse REPO.bazel: %v", err)
}
var ignoreDirectories []string
// Search for ignore_directories([...ignore strings...])
for _, expr := range ast.Stmt {
if call, isCall := expr.(*bzl.CallExpr); isCall {
if inv, isIdentCall := call.X.(*bzl.Ident); isIdentCall && inv.Name == "ignore_directories" {
if len(call.List) != 1 {
return nil, fmt.Errorf("REPO.bazel ignore_directories() expects one argument")
}
list, isList := call.List[0].(*bzl.ListExpr)
if !isList {
return nil, fmt.Errorf("REPO.bazel ignore_directories() unexpected argument type: %T", call.List[0])
}
for _, item := range list.List {
if strExpr, isStr := item.(*bzl.StringExpr); isStr {
if err := checkPathMatchPattern(strExpr.Value); err != nil {
log.Printf("the ignore_directories() pattern %q is not valid: %s", strExpr.Value, err)
continue
}
ignoreDirectories = append(ignoreDirectories, strExpr.Value)
}
}
// Only a single ignore_directories() is supported in REPO.bazel and searching can stop.
break
}
}
}
return ignoreDirectories, nil
}
// checkPathMatchPattern reports whether pattern is accepted by
// doublestar.Match, by matching it against a dummy name and returning any
// error from that call. The match result itself is discarded.
func checkPathMatchPattern(pattern string) error {
	if _, err := doublestar.Match(pattern, "x"); err != nil {
		return err
	}
	return nil
}
// matchAnyGlob reports whether path matches at least one of patterns. The
// patterns are matched with doublestar.MatchUnvalidated, which does not
// report pattern errors. An empty or nil patterns slice never matches.
func matchAnyGlob(patterns []string, path string) bool {
	for i := range patterns {
		if doublestar.MatchUnvalidated(patterns[i], path) {
			return true
		}
	}
	return false
}