1// Copyright 2018 The Go Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style
3// license that can be found in the LICENSE file.
4
5// Package gopathwalk is like filepath.Walk but specialized for finding Go
6// packages, particularly in $GOPATH and $GOROOT.
7package gopathwalk
8
9import (
10	"bufio"
11	"bytes"
12	"fmt"
13	"io/ioutil"
14	"log"
15	"os"
16	"path/filepath"
17	"strings"
18	"time"
19
20	"golang.org/x/tools/internal/fastwalk"
21)
22
23// Options controls the behavior of a Walk call.
24type Options struct {
25	// If Logf is non-nil, debug logging is enabled through this function.
26	Logf func(format string, args ...interface{})
27	// Search module caches. Also disables legacy goimports ignore rules.
28	ModulesEnabled bool
29}
30
31// RootType indicates the type of a Root.
32type RootType int
33
34const (
35	RootUnknown RootType = iota
36	RootGOROOT
37	RootGOPATH
38	RootCurrentModule
39	RootModuleCache
40	RootOther
41)
42
43// A Root is a starting point for a Walk.
44type Root struct {
45	Path string
46	Type RootType
47}
48
49// Walk walks Go source directories ($GOROOT, $GOPATH, etc) to find packages.
50// For each package found, add will be called (concurrently) with the absolute
51// paths of the containing source directory and the package directory.
52// add will be called concurrently.
53func Walk(roots []Root, add func(root Root, dir string), opts Options) {
54	WalkSkip(roots, add, func(Root, string) bool { return false }, opts)
55}
56
57// WalkSkip walks Go source directories ($GOROOT, $GOPATH, etc) to find packages.
58// For each package found, add will be called (concurrently) with the absolute
59// paths of the containing source directory and the package directory.
60// For each directory that will be scanned, skip will be called (concurrently)
61// with the absolute paths of the containing source directory and the directory.
62// If skip returns false on a directory it will be processed.
63// add will be called concurrently.
64// skip will be called concurrently.
65func WalkSkip(roots []Root, add func(root Root, dir string), skip func(root Root, dir string) bool, opts Options) {
66	for _, root := range roots {
67		walkDir(root, add, skip, opts)
68	}
69}
70
71// walkDir creates a walker and starts fastwalk with this walker.
72func walkDir(root Root, add func(Root, string), skip func(root Root, dir string) bool, opts Options) {
73	if _, err := os.Stat(root.Path); os.IsNotExist(err) {
74		if opts.Logf != nil {
75			opts.Logf("skipping nonexistent directory: %v", root.Path)
76		}
77		return
78	}
79	start := time.Now()
80	if opts.Logf != nil {
81		opts.Logf("gopathwalk: scanning %s", root.Path)
82	}
83	w := &walker{
84		root: root,
85		add:  add,
86		skip: skip,
87		opts: opts,
88	}
89	w.init()
90	if err := fastwalk.Walk(root.Path, w.walk); err != nil {
91		log.Printf("gopathwalk: scanning directory %v: %v", root.Path, err)
92	}
93
94	if opts.Logf != nil {
95		opts.Logf("gopathwalk: scanned %s in %v", root.Path, time.Since(start))
96	}
97}
98
99// walker is the callback for fastwalk.Walk.
100type walker struct {
101	root Root                    // The source directory to scan.
102	add  func(Root, string)      // The callback that will be invoked for every possible Go package dir.
103	skip func(Root, string) bool // The callback that will be invoked for every dir. dir is skipped if it returns true.
104	opts Options                 // Options passed to Walk by the user.
105
106	ignoredDirs []os.FileInfo // The ignored directories, loaded from .goimportsignore files.
107}
108
109// init initializes the walker based on its Options
110func (w *walker) init() {
111	var ignoredPaths []string
112	if w.root.Type == RootModuleCache {
113		ignoredPaths = []string{"cache"}
114	}
115	if !w.opts.ModulesEnabled && w.root.Type == RootGOPATH {
116		ignoredPaths = w.getIgnoredDirs(w.root.Path)
117		ignoredPaths = append(ignoredPaths, "v", "mod")
118	}
119
120	for _, p := range ignoredPaths {
121		full := filepath.Join(w.root.Path, p)
122		if fi, err := os.Stat(full); err == nil {
123			w.ignoredDirs = append(w.ignoredDirs, fi)
124			if w.opts.Logf != nil {
125				w.opts.Logf("Directory added to ignore list: %s", full)
126			}
127		} else if w.opts.Logf != nil {
128			w.opts.Logf("Error statting ignored directory: %v", err)
129		}
130	}
131}
132
133// getIgnoredDirs reads an optional config file at <path>/.goimportsignore
134// of relative directories to ignore when scanning for go files.
135// The provided path is one of the $GOPATH entries with "src" appended.
136func (w *walker) getIgnoredDirs(path string) []string {
137	file := filepath.Join(path, ".goimportsignore")
138	slurp, err := ioutil.ReadFile(file)
139	if w.opts.Logf != nil {
140		if err != nil {
141			w.opts.Logf("%v", err)
142		} else {
143			w.opts.Logf("Read %s", file)
144		}
145	}
146	if err != nil {
147		return nil
148	}
149
150	var ignoredDirs []string
151	bs := bufio.NewScanner(bytes.NewReader(slurp))
152	for bs.Scan() {
153		line := strings.TrimSpace(bs.Text())
154		if line == "" || strings.HasPrefix(line, "#") {
155			continue
156		}
157		ignoredDirs = append(ignoredDirs, line)
158	}
159	return ignoredDirs
160}
161
162// shouldSkipDir reports whether the file should be skipped or not.
163func (w *walker) shouldSkipDir(fi os.FileInfo, dir string) bool {
164	for _, ignoredDir := range w.ignoredDirs {
165		if os.SameFile(fi, ignoredDir) {
166			return true
167		}
168	}
169	if w.skip != nil {
170		// Check with the user specified callback.
171		return w.skip(w.root, dir)
172	}
173	return false
174}
175
176// walk walks through the given path.
177func (w *walker) walk(path string, typ os.FileMode) error {
178	dir := filepath.Dir(path)
179	if typ.IsRegular() {
180		if dir == w.root.Path && (w.root.Type == RootGOROOT || w.root.Type == RootGOPATH) {
181			// Doesn't make sense to have regular files
182			// directly in your $GOPATH/src or $GOROOT/src.
183			return fastwalk.ErrSkipFiles
184		}
185		if !strings.HasSuffix(path, ".go") {
186			return nil
187		}
188
189		w.add(w.root, dir)
190		return fastwalk.ErrSkipFiles
191	}
192	if typ == os.ModeDir {
193		base := filepath.Base(path)
194		if base == "" || base[0] == '.' || base[0] == '_' ||
195			base == "testdata" ||
196			(w.root.Type == RootGOROOT && w.opts.ModulesEnabled && base == "vendor") ||
197			(!w.opts.ModulesEnabled && base == "node_modules") {
198			return filepath.SkipDir
199		}
200		fi, err := os.Lstat(path)
201		if err == nil && w.shouldSkipDir(fi, path) {
202			return filepath.SkipDir
203		}
204		return nil
205	}
206	if typ == os.ModeSymlink {
207		base := filepath.Base(path)
208		if strings.HasPrefix(base, ".#") {
209			// Emacs noise.
210			return nil
211		}
212		fi, err := os.Lstat(path)
213		if err != nil {
214			// Just ignore it.
215			return nil
216		}
217		if w.shouldTraverse(dir, fi) {
218			return fastwalk.ErrTraverseLink
219		}
220	}
221	return nil
222}
223
224// shouldTraverse reports whether the symlink fi, found in dir,
225// should be followed.  It makes sure symlinks were never visited
226// before to avoid symlink loops.
227func (w *walker) shouldTraverse(dir string, fi os.FileInfo) bool {
228	path := filepath.Join(dir, fi.Name())
229	target, err := filepath.EvalSymlinks(path)
230	if err != nil {
231		return false
232	}
233	ts, err := os.Stat(target)
234	if err != nil {
235		fmt.Fprintln(os.Stderr, err)
236		return false
237	}
238	if !ts.IsDir() {
239		return false
240	}
241	if w.shouldSkipDir(ts, dir) {
242		return false
243	}
244	// Check for symlink loops by statting each directory component
245	// and seeing if any are the same file as ts.
246	for {
247		parent := filepath.Dir(path)
248		if parent == path {
249			// Made it to the root without seeing a cycle.
250			// Use this symlink.
251			return true
252		}
253		parentInfo, err := os.Stat(parent)
254		if err != nil {
255			return false
256		}
257		if os.SameFile(ts, parentInfo) {
258			// Cycle. Don't traverse.
259			return false
260		}
261		path = parent
262	}
263
264}
265