// Copyright 2018 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

// Package cache implements the caching layer for gopls.
package cache

import (
	"context"
	"encoding/json"
	"fmt"
	"go/ast"
	"io"
	"io/ioutil"
	"os"
	"path"
	"path/filepath"
	"reflect"
	"strings"
	"sync"
	"time"

	"golang.org/x/tools/internal/event"
	"golang.org/x/tools/internal/event/keys"
	"golang.org/x/tools/internal/gocommand"
	"golang.org/x/tools/internal/imports"
	"golang.org/x/tools/internal/lsp/debug/tag"
	"golang.org/x/tools/internal/lsp/source"
	"golang.org/x/tools/internal/memoize"
	"golang.org/x/tools/internal/span"
	"golang.org/x/tools/internal/xcontext"
	errors "golang.org/x/xerrors"
)

// View holds the state associated with a single workspace folder: its
// options, the files it tracks, its current snapshot, and the go command
// environment used to load packages.
type View struct {
	// session is the session that owns this view; view updates and removal
	// are delegated to it.
	session *Session
	// id is the value returned by ID.
	id string

	// optionsMu guards options.
	optionsMu sync.Mutex
	options   source.Options

	// mu protects most mutable state of the view.
	mu sync.Mutex

	// baseCtx is the context handed to NewView. This is the parent of all
	// background contexts created for this view.
	baseCtx context.Context

	// backgroundCtx is the current context used by background tasks initiated
	// by the view.
	backgroundCtx context.Context

	// cancel is called when all action being performed by the current view
	// should be stopped.
	cancel context.CancelFunc

	// name is the user visible name of this view.
	name string

	// folder is the root of this view.
	folder span.URI

	// importsMu guards imports-related state, particularly the ProcessEnv.
	importsMu sync.Mutex

	// processEnv is the process env for this view.
	// Note: this contains cached module and filesystem state.
	//
	// TODO(suzmue): the state cached in the process env is specific to each view,
	// however, there is state that can be shared between views that is not currently
	// cached, like the module cache.
	processEnv *imports.ProcessEnv
	// cacheRefreshDuration records how long the most recent background
	// refresh of the imports cache took.
	cacheRefreshDuration time.Duration
	// cacheRefreshTimer is the pending background refresh, or nil when no
	// refresh is scheduled.
	cacheRefreshTimer *time.Timer
	// cachedModFileVersion is the identity of the go.mod file last observed
	// by RunProcessEnvFunc.
	cachedModFileVersion source.FileIdentity

	// keep track of files by uri and by basename, a single file may be mapped
	// to multiple uris, and the same basename may map to multiple files
	filesByURI  map[span.URI]*fileBase
	filesByBase map[string][]*fileBase

	// snapshotMu guards snapshot.
	snapshotMu sync.Mutex
	snapshot   *snapshot

	// initialized is closed when the view has been fully initialized.
	// On initialization, the view's workspace packages are loaded.
	// All of the fields below are set as part of initialization.
	// If we failed to load, we don't re-try to avoid too many go/packages calls.
	initializeOnce sync.Once
	initialized    chan struct{}
	// initCancel cancels the initial workspace load; it is invoked on
	// shutdown.
	initCancel context.CancelFunc

	// initializedErr needs no mutex, since any access to it happens after it
	// has been set.
	initializedErr error

	// builtin pins the AST and package for builtin.go in memory.
	builtin *builtinPackageHandle

	// True if the view is either in GOPATH, a module, or some other
	// non go command build system.
	hasValidBuildConfiguration bool

	// The real and temporary go.mod files that are attributed to a view.
	// The temporary go.mod is for use with the Go command's -modfile flag.
	realMod, tempMod span.URI

	// goCommand indicates if the user is using the go command or some other
	// build system.
	goCommand bool

	// `go env` variables that need to be tracked.
	gopath, gocache, goprivate string

	// gocmdRunner guards go command calls from concurrency errors.
	gocmdRunner *gocommand.Runner
}

// builtinPackageHandle pairs the memoized handle that produces the builtin
// package data with the parse handle of the builtin file.
type builtinPackageHandle struct {
	handle *memoize.Handle
	file   source.ParseGoHandle
}

// builtinPackageData is the value produced by a builtinPackageHandle: either
// the parsed builtin package together with its parse handle, or the error
// that prevented building it.
type builtinPackageData struct {
	memoize.NoCopy

	pkg *ast.Package
	pgh *parseGoHandle
	err error
}

// Package returns the AST package stored in d.
func (d *builtinPackageData) Package() *ast.Package {
	return d.pkg
}

// ParseGoHandle returns the parse handle stored in d.
func (d *builtinPackageData) ParseGoHandle() source.ParseGoHandle {
	return d.pgh
}

// fileBase holds the common functionality for all files.
// It is intended to be embedded in the file implementations type fileBase struct { uris []span.URI fname string view *View } func (f *fileBase) URI() span.URI { return f.uris[0] } func (f *fileBase) filename() string { return f.fname } func (f *fileBase) addURI(uri span.URI) int { f.uris = append(f.uris, uri) return len(f.uris) } func (v *View) ID() string { return v.id } func (v *View) ValidBuildConfiguration() bool { return v.hasValidBuildConfiguration } func (v *View) ModFiles() (span.URI, span.URI) { return v.realMod, v.tempMod } func (v *View) Session() source.Session { return v.session } // Name returns the user visible name of this view. func (v *View) Name() string { return v.name } // Folder returns the root of this view. func (v *View) Folder() span.URI { return v.folder } func (v *View) Options() source.Options { v.optionsMu.Lock() defer v.optionsMu.Unlock() return v.options } func minorOptionsChange(a, b source.Options) bool { // Check if any of the settings that modify our understanding of files have been changed if !reflect.DeepEqual(a.Env, b.Env) { return false } if !reflect.DeepEqual(a.BuildFlags, b.BuildFlags) { return false } // the rest of the options are benign return true } func (v *View) SetOptions(ctx context.Context, options source.Options) (source.View, error) { // no need to rebuild the view if the options were not materially changed v.optionsMu.Lock() if minorOptionsChange(v.options, options) { v.options = options v.optionsMu.Unlock() return v, nil } v.optionsMu.Unlock() newView, _, err := v.session.updateView(ctx, v, options) return newView, err } func (v *View) Rebuild(ctx context.Context) (source.Snapshot, error) { _, snapshot, err := v.session.updateView(ctx, v, v.Options()) return snapshot, err } func (v *View) BuiltinPackage(ctx context.Context) (source.BuiltinPackage, error) { v.awaitInitialized(ctx) if v.builtin == nil { return nil, errors.Errorf("no builtin package for view %s", v.name) } data := v.builtin.handle.Get(ctx) if 
ctx.Err() != nil { return nil, ctx.Err() } if data == nil { return nil, errors.Errorf("unexpected nil builtin package") } d, ok := data.(*builtinPackageData) if !ok { return nil, errors.Errorf("unexpected type %T", data) } if d.err != nil { return nil, d.err } if d.pkg == nil || d.pkg.Scope == nil { return nil, errors.Errorf("no builtin package") } return d, nil } func (v *View) buildBuiltinPackage(ctx context.Context, goFiles []string) error { if len(goFiles) != 1 { return errors.Errorf("only expected 1 file, got %v", len(goFiles)) } uri := span.URIFromPath(goFiles[0]) // Get the FileHandle through the cache to avoid adding it to the snapshot // and to get the file content from disk. fh, err := v.session.cache.GetFile(ctx, uri) if err != nil { return err } pgh := v.session.cache.parseGoHandle(ctx, fh, source.ParseFull) fset := v.session.cache.fset h := v.session.cache.store.Bind(fh.Identity(), func(ctx context.Context) interface{} { file, _, _, _, err := pgh.Parse(ctx) if err != nil { return &builtinPackageData{err: err} } pkg, err := ast.NewPackage(fset, map[string]*ast.File{ pgh.File().URI().Filename(): file, }, nil, nil) if err != nil { return &builtinPackageData{err: err} } return &builtinPackageData{ pgh: pgh, pkg: pkg, } }) v.builtin = &builtinPackageHandle{ handle: h, file: pgh, } return nil } func (v *View) WriteEnv(ctx context.Context, w io.Writer) error { v.optionsMu.Lock() env, buildFlags := v.envLocked() v.optionsMu.Unlock() // TODO(rstambler): We could probably avoid running this by saving the // output on original create, but I'm not sure if it's worth it. 
inv := gocommand.Invocation{ Verb: "env", Env: env, WorkingDir: v.Folder().Filename(), } stdout, err := v.gocmdRunner.Run(ctx, inv) if err != nil { return err } fmt.Fprintf(w, "go env for %v\n(valid build configuration = %v)\n(build flags: %v)\n", v.folder.Filename(), v.hasValidBuildConfiguration, buildFlags) fmt.Fprint(w, stdout) return nil } func (v *View) RunProcessEnvFunc(ctx context.Context, fn func(*imports.Options) error) error { v.importsMu.Lock() defer v.importsMu.Unlock() if v.processEnv == nil { var err error if v.processEnv, err = v.buildProcessEnv(ctx); err != nil { return err } } // In module mode, check if the mod file has changed. if v.realMod != "" { mod, err := v.session.cache.GetFile(ctx, v.realMod) if err != nil { return err } if mod.Identity() != v.cachedModFileVersion { v.processEnv.GetResolver().(*imports.ModuleResolver).ClearForNewMod() v.cachedModFileVersion = mod.Identity() } } // Run the user function. opts := &imports.Options{ // Defaults. AllErrors: true, Comments: true, Fragment: true, FormatOnly: false, TabIndent: true, TabWidth: 8, Env: v.processEnv, } if err := fn(opts); err != nil { return err } if v.cacheRefreshTimer == nil { // Don't refresh more than twice per minute. delay := 30 * time.Second // Don't spend more than a couple percent of the time refreshing. if adaptive := 50 * v.cacheRefreshDuration; adaptive > delay { delay = adaptive } v.cacheRefreshTimer = time.AfterFunc(delay, v.refreshProcessEnv) } return nil } func (v *View) refreshProcessEnv() { start := time.Now() v.importsMu.Lock() env := v.processEnv env.GetResolver().ClearForNewScan() v.importsMu.Unlock() // We don't have a context handy to use for logging, so use the stdlib for now. 
event.Log(v.baseCtx, "background imports cache refresh starting") err := imports.PrimeCache(context.Background(), env) if err == nil { event.Log(v.baseCtx, fmt.Sprintf("background refresh finished after %v", time.Since(start))) } else { event.Log(v.baseCtx, fmt.Sprintf("background refresh finished after %v", time.Since(start)), keys.Err.Of(err)) } v.importsMu.Lock() v.cacheRefreshDuration = time.Since(start) v.cacheRefreshTimer = nil v.importsMu.Unlock() } func (v *View) buildProcessEnv(ctx context.Context) (*imports.ProcessEnv, error) { v.optionsMu.Lock() env, buildFlags := v.envLocked() localPrefix, verboseOutput := v.options.LocalPrefix, v.options.VerboseOutput v.optionsMu.Unlock() processEnv := &imports.ProcessEnv{ WorkingDir: v.folder.Filename(), BuildFlags: buildFlags, LocalPrefix: localPrefix, GocmdRunner: v.gocmdRunner, } if verboseOutput { processEnv.Logf = func(format string, args ...interface{}) { event.Log(ctx, fmt.Sprintf(format, args...)) } } for _, kv := range env { split := strings.SplitN(kv, "=", 2) if len(split) < 2 { continue } switch split[0] { case "GOPATH": processEnv.GOPATH = split[1] case "GOROOT": processEnv.GOROOT = split[1] case "GO111MODULE": processEnv.GO111MODULE = split[1] case "GOPROXY": processEnv.GOPROXY = split[1] case "GOFLAGS": processEnv.GOFLAGS = split[1] case "GOSUMDB": processEnv.GOSUMDB = split[1] } } if processEnv.GOPATH == "" { return nil, fmt.Errorf("no GOPATH for view %s", v.folder) } return processEnv, nil } func (v *View) envLocked() ([]string, []string) { // We want to run the go commands with the -modfile flag if the version of go // that we are using supports it. buildFlags := v.options.BuildFlags if v.tempMod != "" { buildFlags = append(buildFlags, fmt.Sprintf("-modfile=%s", v.tempMod.Filename())) } env := []string{fmt.Sprintf("GOPATH=%s", v.gopath)} env = append(env, v.options.Env...) 
return env, buildFlags } func (v *View) contains(uri span.URI) bool { return strings.HasPrefix(string(uri), string(v.folder)) } func (v *View) mapFile(uri span.URI, f *fileBase) { v.filesByURI[uri] = f if f.addURI(uri) == 1 { basename := basename(f.filename()) v.filesByBase[basename] = append(v.filesByBase[basename], f) } } func basename(filename string) string { return strings.ToLower(filepath.Base(filename)) } func (v *View) relevantChange(c source.FileModification) bool { // If the file is known to the view, the change is relevant. known := v.knownFile(c.URI) // If the file is not known to the view, and the change is only on-disk, // we should not invalidate the snapshot. This is necessary because Emacs // sends didChangeWatchedFiles events for temp files. if !known && c.OnDisk && (c.Action == source.Change || c.Action == source.Delete) { return false } return v.contains(c.URI) || known } func (v *View) knownFile(uri span.URI) bool { v.mu.Lock() defer v.mu.Unlock() f, err := v.findFile(uri) return f != nil && err == nil } // getFile returns a file for the given URI. It will always succeed because it // adds the file to the managed set if needed. func (v *View) getFile(uri span.URI) (*fileBase, error) { v.mu.Lock() defer v.mu.Unlock() f, err := v.findFile(uri) if err != nil { return nil, err } else if f != nil { return f, nil } f = &fileBase{ view: v, fname: uri.Filename(), } v.mapFile(uri, f) return f, nil } // findFile checks the cache for any file matching the given uri. // // An error is only returned for an irreparable failure, for example, if the // filename in question does not exist. 
func (v *View) findFile(uri span.URI) (*fileBase, error) { if f := v.filesByURI[uri]; f != nil { // a perfect match return f, nil } // no exact match stored, time to do some real work // check for any files with the same basename fname := uri.Filename() basename := basename(fname) if candidates := v.filesByBase[basename]; candidates != nil { pathStat, err := os.Stat(fname) if os.IsNotExist(err) { return nil, err } if err != nil { return nil, nil // the file may exist, return without an error } for _, c := range candidates { if cStat, err := os.Stat(c.filename()); err == nil { if os.SameFile(pathStat, cStat) { // same file, map it v.mapFile(uri, c) return c, nil } } } } // no file with a matching name was found, it wasn't in our cache return nil, nil } func (v *View) Shutdown(ctx context.Context) { v.session.removeView(ctx, v) } func (v *View) shutdown(ctx context.Context) { // Cancel the initial workspace load if it is still running. v.initCancel() v.mu.Lock() defer v.mu.Unlock() if v.cancel != nil { v.cancel() v.cancel = nil } if v.tempMod != "" { os.Remove(v.tempMod.Filename()) os.Remove(tempSumFile(v.tempMod.Filename())) } } func (v *View) BackgroundContext() context.Context { v.mu.Lock() defer v.mu.Unlock() return v.backgroundCtx } func (v *View) Snapshot() source.Snapshot { return v.getSnapshot() } func (v *View) getSnapshot() *snapshot { v.snapshotMu.Lock() defer v.snapshotMu.Unlock() return v.snapshot } func (v *View) initialize(ctx context.Context, s *snapshot) { v.initializeOnce.Do(func() { defer close(v.initialized) if err := s.load(ctx, viewLoadScope("LOAD_VIEW"), packagePath("builtin")); err != nil { if ctx.Err() != nil { return } v.initializedErr = err event.Error(ctx, "initial workspace load failed", err) } }) } func (v *View) awaitInitialized(ctx context.Context) { select { case <-ctx.Done(): case <-v.initialized: } } // invalidateContent invalidates the content of a Go file, // including any position and type information that depends on it. 
// It returns true if we were already tracking the given file, false otherwise. func (v *View) invalidateContent(ctx context.Context, uris map[span.URI]source.FileHandle, forceReloadMetadata bool) source.Snapshot { // Detach the context so that content invalidation cannot be canceled. ctx = xcontext.Detach(ctx) // Cancel all still-running previous requests, since they would be // operating on stale data. v.cancelBackground() // Do not clone a snapshot until its view has finished initializing. v.awaitInitialized(ctx) // This should be the only time we hold the view's snapshot lock for any period of time. v.snapshotMu.Lock() defer v.snapshotMu.Unlock() v.snapshot = v.snapshot.clone(ctx, uris, forceReloadMetadata) return v.snapshot } func (v *View) cancelBackground() { v.mu.Lock() defer v.mu.Unlock() if v.cancel == nil { // this can happen during shutdown return } v.cancel() v.backgroundCtx, v.cancel = context.WithCancel(v.baseCtx) } func (v *View) setBuildInformation(ctx context.Context, folder span.URI, env []string, modfileFlagEnabled bool) error { if err := checkPathCase(folder.Filename()); err != nil { return fmt.Errorf("invalid workspace configuration: %w", err) } // Make sure to get the `go env` before continuing with initialization. gomod, err := v.getGoEnv(ctx, env) if err != nil { return err } modFile := strings.TrimSpace(gomod) if modFile == os.DevNull { return nil } v.realMod = span.URIFromPath(modFile) // Now that we have set all required fields, // check if the view has a valid build configuration. v.hasValidBuildConfiguration = checkBuildConfiguration(v.goCommand, v.realMod, v.folder, v.gopath) // The user has disabled the use of the -modfile flag or has no go.mod file. if !modfileFlagEnabled || v.realMod == "" { return nil } if modfileFlag, err := v.modfileFlagExists(ctx, v.Options().Env); err != nil { return err } else if !modfileFlag { return nil } // Copy the current go.mod file into the temporary go.mod file. 
// The file's name will be of the format go.directory.1234.mod. // It's temporary go.sum file should have the corresponding format of go.directory.1234.sum. tmpPattern := fmt.Sprintf("go.%s.*.mod", filepath.Base(folder.Filename())) tempModFile, err := ioutil.TempFile("", tmpPattern) if err != nil { return err } defer tempModFile.Close() origFile, err := os.Open(modFile) if err != nil { return err } defer origFile.Close() if _, err := io.Copy(tempModFile, origFile); err != nil { return err } v.tempMod = span.URIFromPath(tempModFile.Name()) // Copy go.sum file as well (if there is one). sumFile := filepath.Join(filepath.Dir(modFile), "go.sum") stat, err := os.Stat(sumFile) if err != nil || !stat.Mode().IsRegular() { return nil } contents, err := ioutil.ReadFile(sumFile) if err != nil { return err } if err := ioutil.WriteFile(tempSumFile(tempModFile.Name()), contents, stat.Mode()); err != nil { return err } return nil } // OS-specific path case check, for case-insensitive filesystems. var checkPathCase = defaultCheckPathCase func defaultCheckPathCase(path string) error { return nil } func checkBuildConfiguration(goCommand bool, mod, folder span.URI, gopath string) bool { // Since we only really understand the `go` command, if the user is not // using the go command, assume that their configuration is valid. if !goCommand { return true } // Check if the user is working within a module. if mod != "" { return true } // The user may have a multiple directories in their GOPATH. // Check if the workspace is within any of them. for _, gp := range filepath.SplitList(gopath) { if isSubdirectory(filepath.Join(gp, "src"), folder.Filename()) { return true } } return false } func isSubdirectory(root, leaf string) bool { rel, err := filepath.Rel(root, leaf) return err == nil && !strings.HasPrefix(rel, "..") } // getGoEnv sets the view's build information's GOPATH, GOCACHE, GOPRIVATE, and // GOPACKAGESDRIVER values. 
It also returns the view's GOMOD value, which need // not be cached. func (v *View) getGoEnv(ctx context.Context, env []string) (string, error) { var gocache, gopath, gopackagesdriver, goprivate bool isGoCommand := func(gopackagesdriver string) bool { return gopackagesdriver == "" || gopackagesdriver == "off" } for _, e := range env { split := strings.Split(e, "=") if len(split) != 2 { continue } switch split[0] { case "GOCACHE": v.gocache = split[1] gocache = true case "GOPATH": v.gopath = split[1] gopath = true case "GOPRIVATE": v.goprivate = split[1] goprivate = true case "GOPACKAGESDRIVER": v.goCommand = isGoCommand(split[1]) gopackagesdriver = true } } inv := gocommand.Invocation{ Verb: "env", Args: []string{"-json"}, Env: env, WorkingDir: v.Folder().Filename(), } stdout, err := v.gocmdRunner.Run(ctx, inv) if err != nil { return "", err } envMap := make(map[string]string) decoder := json.NewDecoder(stdout) if err := decoder.Decode(&envMap); err != nil { return "", err } if !gopath { if gopath, ok := envMap["GOPATH"]; ok { v.gopath = gopath } else { return "", errors.New("unable to determine GOPATH") } } if !gocache { if gocache, ok := envMap["GOCACHE"]; ok { v.gocache = gocache } else { return "", errors.New("unable to determine GOCACHE") } } if !goprivate { if goprivate, ok := envMap["GOPRIVATE"]; ok { v.goprivate = goprivate } // No error here: GOPRIVATE is not essential. } // The value of GOPACKAGESDRIVER is not returned through the go command. if !gopackagesdriver { v.goCommand = isGoCommand(os.Getenv("GOPACKAGESDRIVER")) } if gomod, ok := envMap["GOMOD"]; ok { return gomod, nil } return "", nil } func (v *View) IsGoPrivatePath(target string) bool { return globsMatchPath(v.goprivate, target) } // Copied from // https://cs.opensource.google/go/go/+/master:src/cmd/go/internal/str/path.go;l=58;drc=2910c5b4a01a573ebc97744890a07c1a3122c67a func globsMatchPath(globs, target string) bool { for globs != "" { // Extract next non-empty glob in comma-separated list. 
var glob string if i := strings.Index(globs, ","); i >= 0 { glob, globs = globs[:i], globs[i+1:] } else { glob, globs = globs, "" } if glob == "" { continue } // A glob with N+1 path elements (N slashes) needs to be matched // against the first N+1 path elements of target, // which end just before the N+1'th slash. n := strings.Count(glob, "/") prefix := target // Walk target, counting slashes, truncating at the N+1'th slash. for i := 0; i < len(target); i++ { if target[i] == '/' { if n == 0 { prefix = target[:i] break } n-- } } if n > 0 { // Not enough prefix elements. continue } matched, _ := path.Match(glob, prefix) if matched { return true } } return false } // This function will return the main go.mod file for this folder if it exists and whether the -modfile // flag exists for this version of go. func (v *View) modfileFlagExists(ctx context.Context, env []string) (bool, error) { // Check the go version by running "go list" with modules off. // Borrowed from internal/imports/mod.go:620. const format = `{{range context.ReleaseTags}}{{if eq . "go1.14"}}{{.}}{{end}}{{end}}` folder := v.folder.Filename() inv := gocommand.Invocation{ Verb: "list", Args: []string{"-e", "-f", format}, Env: append(env, "GO111MODULE=off"), WorkingDir: v.Folder().Filename(), } stdout, err := v.gocmdRunner.Run(ctx, inv) if err != nil { return false, err } // If the output is not go1.14 or an empty string, then it could be an error. lines := strings.Split(stdout.String(), "\n") if len(lines) < 2 && stdout.String() != "" { event.Error(ctx, "unexpected stdout when checking for go1.14", errors.Errorf("%q", stdout), tag.Directory.Of(folder)) return false, nil } return lines[0] == "go1.14", nil } // tempSumFile returns the path to the copied temporary go.sum file. // It simply replaces the extension of the temporary go.mod file with "sum". func tempSumFile(filename string) string { if filename == "" { return "" } return filename[:len(filename)-len("mod")] + "sum" }