Commit 3577700

gopls/internal/lsp/cache: use time-based eviction in parseCache
Our arbitrary choice of caching 200 recent files has proven to be problematic when editing very large packages (golang/go#61207). Fix this by switching to time-based eviction, but with a minimum cache size to optimize the case where editing is resumed after a while.

This caused an increase in high-water mark during initial workspace load, but that is mitigated by avoiding the parse cache when type checking for import (i.e. non-workspace files): such parsed files are almost never cache hits as they are only ever parsed once, and would instead benefit more from avoiding ParseComments.

Move the ownership of the parseCache to the cache.Session (and pass it to each View) to make its lifecycle clearer and avoid passing it around to each snapshot.

For golang/go#61207

Change-Id: I357d8b1fa36eabb516dbb7147266df0e5153ac11
Reviewed-on: https://go-review.googlesource.com/c/tools/+/511337
TryBot-Result: Gopher Robot <[email protected]>
Reviewed-by: Alan Donovan <[email protected]>
Run-TryBot: Robert Findley <[email protected]>
gopls-CI: kokoro <[email protected]>
1 parent 36f607b

10 files changed: +204 −64 lines
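To make the new policy concrete, here is a minimal, self-contained sketch of time-based eviction with a minimum cache size, as described in the commit message. It is illustrative only, not the gopls implementation; the entry type, field names, and thresholds below are invented for this example.

package main

import (
    "fmt"
    "sort"
    "time"
)

// entry is an illustrative stand-in for a cached parse result.
type entry struct {
    name  string
    atime time.Time // last access time
}

// evictOld drops entries whose last access is older than maxAge, but never
// shrinks the cache below minFiles entries; the oldest entries go first.
func evictOld(entries []entry, minFiles int, maxAge time.Duration, now time.Time) []entry {
    // Consider candidates in least-recently-used order.
    sort.Slice(entries, func(i, j int) bool {
        return entries[i].atime.Before(entries[j].atime)
    })
    for len(entries) > minFiles && now.Sub(entries[0].atime) > maxAge {
        entries = entries[1:]
    }
    return entries
}

func main() {
    now := time.Now()
    cache := []entry{
        {"ancient.go", now.Add(-time.Hour)},
        {"stale.go", now.Add(-5 * time.Minute)},
        {"recent.go", now.Add(-5 * time.Second)},
    }
    // With minFiles=1 and maxAge=1m, only recent.go survives; with minFiles=3,
    // everything is kept regardless of age.
    fmt.Println(evictOld(cache, 1, time.Minute, now))
}

The real cache (parse_cache.go below) keeps entries in a min-atime heap and applies this policy periodically from a background goroutine rather than on every access.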

gopls/internal/lsp/cache/cache.go (+2)

@@ -9,6 +9,7 @@ import (
 	"reflect"
 	"strconv"
 	"sync/atomic"
+	"time"
 
 	"golang.org/x/tools/gopls/internal/lsp/source"
 	"golang.org/x/tools/internal/event"
@@ -67,6 +68,7 @@ func NewSession(ctx context.Context, c *Cache, optionsOverrides func(*source.Opt
 		gocmdRunner: &gocommand.Runner{},
 		options:     options,
 		overlayFS:   newOverlayFS(c),
+		parseCache:  newParseCache(1 * time.Minute), // keep recently parsed files for a minute, to optimize typing CPU
 	}
 	event.Log(ctx, "New session", KeyCreateSession.Of(s))
 	return s
gopls/internal/lsp/cache/check.go (+27 −4)

@@ -356,7 +356,7 @@ func (s *snapshot) forEachPackage(ctx context.Context, ids []PackageID, pre preT
 // If a non-nil importGraph is provided, imports in this graph will be reused.
 func (s *snapshot) forEachPackageInternal(ctx context.Context, importGraph *importGraph, importIDs, syntaxIDs []PackageID, pre preTypeCheck, post postTypeCheck, handles map[PackageID]*packageHandle) (*typeCheckBatch, error) {
 	b := &typeCheckBatch{
-		parseCache: s.parseCache,
+		parseCache: s.view.parseCache,
 		pre:        pre,
 		post:       post,
 		handles:    handles,
@@ -593,9 +593,32 @@ func (b *typeCheckBatch) checkPackageForImport(ctx context.Context, ph *packageH
 	}
 	cfg := b.typesConfig(ctx, ph.localInputs, onError)
 	cfg.IgnoreFuncBodies = true
-	pgfs, err := b.parseCache.parseFiles(ctx, b.fset, source.ParseFull, ph.localInputs.compiledGoFiles...)
-	if err != nil {
-		return nil, err
+
+	// Parse the compiled go files, bypassing the parse cache as packages checked
+	// for import are unlikely to get cache hits. Additionally, we can optimize
+	// parsing slightly by not passing parser.ParseComments.
+	pgfs := make([]*source.ParsedGoFile, len(ph.localInputs.compiledGoFiles))
+	{
+		var group errgroup.Group
+		// Set an arbitrary concurrency limit; we want some parallelism but don't
+		// need GOMAXPROCS, as there is already a lot of concurrency among calls to
+		// checkPackageForImport.
+		//
+		// TODO(rfindley): is there a better way to limit parallelism here? We could
+		// have a global limit on the type-check batch, but would have to be very
+		// careful to avoid starvation.
+		group.SetLimit(4)
+		for i, fh := range ph.localInputs.compiledGoFiles {
+			i, fh := i, fh
+			group.Go(func() error {
+				pgf, err := parseGoImpl(ctx, b.fset, fh, parser.SkipObjectResolution)
+				pgfs[i] = pgf
+				return err
+			})
+		}
+		if err := group.Wait(); err != nil {
+			return nil, err // cancelled, or catastrophic error (e.g. missing file)
+		}
 	}
 	pkg := types.NewPackage(string(ph.localInputs.pkgPath), string(ph.localInputs.name))
 	check := types.NewChecker(cfg, b.fset, pkg, nil)
gopls/internal/lsp/cache/mod_tidy.go (+1 −1)

@@ -486,7 +486,7 @@ func missingModuleForImport(pgf *source.ParsedGoFile, imp *ast.ImportSpec, req *
 //
 // TODO(rfindley): this should key off source.ImportPath.
 func parseImports(ctx context.Context, s *snapshot, files []source.FileHandle) (map[string]bool, error) {
-	pgfs, err := s.parseCache.parseFiles(ctx, token.NewFileSet(), source.ParseHeader, files...)
+	pgfs, err := s.view.parseCache.parseFiles(ctx, token.NewFileSet(), source.ParseHeader, files...)
 	if err != nil { // e.g. context cancellation
 		return nil, err
 	}

gopls/internal/lsp/cache/parse.go (+1 −1)

@@ -27,7 +27,7 @@ import (
 // ParseGo parses the file whose contents are provided by fh, using a cache.
 // The resulting tree may have beeen fixed up.
 func (s *snapshot) ParseGo(ctx context.Context, fh source.FileHandle, mode parser.Mode) (*source.ParsedGoFile, error) {
-	pgfs, err := s.parseCache.parseFiles(ctx, token.NewFileSet(), mode, fh)
+	pgfs, err := s.view.parseCache.parseFiles(ctx, token.NewFileSet(), mode, fh)
 	if err != nil {
 		return nil, err
 	}

gopls/internal/lsp/cache/parse_cache.go (+96 −40)

@@ -14,13 +14,22 @@ import (
 	"math/bits"
 	"runtime"
 	"sync"
+	"time"
 
 	"golang.org/x/sync/errgroup"
 	"golang.org/x/tools/gopls/internal/lsp/source"
+	"golang.org/x/tools/gopls/internal/span"
 	"golang.org/x/tools/internal/memoize"
 	"golang.org/x/tools/internal/tokeninternal"
 )
 
+// This file contains an implementation of an LRU parse cache, that offsets the
+// base token.Pos value of each cached file so that they may be later described
+// by a single dedicated FileSet.
+//
+// This is achieved by tracking a monotonic offset in the token.Pos space, that
+// is incremented before parsing allow room for the resulting parsed file.
+
 // reservedForParsing defines the room in the token.Pos space reserved for
 // cached parsed files.
 //
@@ -58,21 +67,11 @@ func fileSetWithBase(base int) *token.FileSet {
 	return fset
 }
 
-// This file contains an implementation of a bounded-size parse cache, that
-// offsets the base token.Pos value of each cached file so that they may be
-// later described by a single dedicated FileSet.
-//
-// This is achieved by tracking a monotonic offset in the token.Pos space, that
-// is incremented before parsing allow room for the resulting parsed file.
-
-// Keep 200 recently parsed files, based on the following rationale:
-//   - One of the most important benefits of caching is avoiding re-parsing
-//     everything in a package when working on a single file. No packages in
-//     Kubernetes have > 200 files (only one has > 100).
-//   - Experience has shown that ~1000 parsed files can use noticeable space.
-//     200 feels like a sweet spot between limiting cache size and optimizing
-//     cache hits for low-latency operations.
-const parseCacheMaxFiles = 200
+const (
+	// Always keep 100 recent files, independent of their wall-clock age, to
+	// optimize the case where the user resumes editing after a delay.
+	parseCacheMinFiles = 100
+)
 
 // parsePadding is additional padding allocated to allow for increases in
 // length (such as appending missing braces) caused by fixAST.
@@ -89,31 +88,55 @@ const parseCacheMaxFiles = 200
 // This value is mutable for testing, so that we can exercise the slow path.
 var parsePadding = 1000 // mutable for testing
 
-// A parseCache holds a bounded number of recently accessed parsed Go files. As
-// new files are stored, older files may be evicted from the cache.
+// A parseCache holds recently accessed parsed Go files. After new files are
+// stored, older files may be evicted from the cache via garbage collection.
 //
 // The parseCache.parseFiles method exposes a batch API for parsing (and
 // caching) multiple files. This is necessary for type-checking, where files
 // must be parsed in a common fileset.
 type parseCache struct {
+	maxAge time.Duration // interval at which to collect expired cache entries
+	done   chan struct{} // closed when GC is stopped
+
 	mu       sync.Mutex
 	m        map[parseKey]*parseCacheEntry
 	lru      queue  // min-atime priority queue of *parseCacheEntry
 	clock    uint64 // clock time, incremented when the cache is updated
 	nextBase int    // base offset for the next parsed file
 }
 
+// newParseCache creates a new parse cache and starts a goroutine to garbage
+// collect old entries that are older than maxAge.
+//
+// Callers must call parseCache.stop when the parse cache is no longer in use.
+func newParseCache(maxAge time.Duration) *parseCache {
+	c := &parseCache{
+		maxAge: maxAge,
+		m:      make(map[parseKey]*parseCacheEntry),
+		done:   make(chan struct{}),
+	}
+	go c.gc()
+	return c
+}
+
+// stop causes the GC goroutine to exit.
+func (c *parseCache) stop() {
+	close(c.done)
+}
+
 // parseKey uniquely identifies a parsed Go file.
 type parseKey struct {
-	file source.FileIdentity
+	uri  span.URI
 	mode parser.Mode
 }
 
 type parseCacheEntry struct {
 	key      parseKey
+	hash     source.Hash
 	promise  *memoize.Promise // memoize.Promise[*source.ParsedGoFile]
-	atime    uint64 // clock time of last access
-	lruIndex int
+	atime    uint64    // clock time of last access, for use in LRU sorting
+	walltime time.Time // actual time of last access, for use in time-based eviction; too coarse for LRU on some systems
+	lruIndex int       // owned by the queue implementation
 }
 
 // startParse prepares a parsing pass, creating new promises in the cache for
@@ -131,6 +154,7 @@ func (c *parseCache) startParse(mode parser.Mode, fhs ...source.FileHandle) ([]*
 	//
 	// All entries parsed from a single call get the same access time.
 	c.clock++
+	walltime := time.Now()
 
 	// Read file data and collect cacheable files.
 	var (
@@ -149,15 +173,22 @@ func (c *parseCache) startParse(mode parser.Mode, fhs ...source.FileHandle) ([]*
 		data[i] = content
 
 		key := parseKey{
-			file: fh.FileIdentity(),
+			uri:  fh.URI(),
 			mode: mode,
 		}
 
-		if e, ok := c.m[key]; ok { // cache hit
-			e.atime = c.clock
-			heap.Fix(&c.lru, e.lruIndex)
-			promises[i] = e.promise
-			continue
+		if e, ok := c.m[key]; ok {
+			if e.hash == fh.FileIdentity().Hash { // cache hit
+				e.atime = c.clock
+				e.walltime = walltime
+				heap.Fix(&c.lru, e.lruIndex)
+				promises[i] = e.promise
+				continue
+			} else {
+				// A cache hit, for a different version. Delete it.
+				delete(c.m, e.key)
+				heap.Remove(&c.lru, e.lruIndex)
+			}
 		}
 
 		uri := fh.URI()
@@ -200,21 +231,14 @@ func (c *parseCache) startParse(mode parser.Mode, fhs ...source.FileHandle) ([]*
 		})
 		promises[i] = promise
 
-		var e *parseCacheEntry
-		if len(c.lru) < parseCacheMaxFiles {
-			// add new entry
-			e = new(parseCacheEntry)
-			if c.m == nil {
-				c.m = make(map[parseKey]*parseCacheEntry)
-			}
-		} else {
-			// evict oldest entry
-			e = heap.Pop(&c.lru).(*parseCacheEntry)
-			delete(c.m, e.key)
+		// add new entry; entries are gc'ed asynchronously
+		e := &parseCacheEntry{
+			key:      key,
+			hash:     fh.FileIdentity().Hash,
+			promise:  promise,
+			atime:    c.clock,
+			walltime: walltime,
 		}
-		e.key = key
-		e.promise = promise
-		e.atime = c.clock
 		c.m[e.key] = e
 		heap.Push(&c.lru, e)
 	}
@@ -226,6 +250,38 @@ func (c *parseCache) startParse(mode parser.Mode, fhs ...source.FileHandle) ([]*
 	return promises, firstReadError
 }
 
+func (c *parseCache) gc() {
+	const period = 10 * time.Second // gc period
+	timer := time.NewTicker(period)
+	defer timer.Stop()
+
+	for {
+		select {
+		case <-c.done:
+			return
+		case <-timer.C:
+		}
+
+		c.gcOnce()
+	}
+}
+
+func (c *parseCache) gcOnce() {
+	now := time.Now()
+	c.mu.Lock()
+	defer c.mu.Unlock()
+
+	for len(c.m) > parseCacheMinFiles {
+		e := heap.Pop(&c.lru).(*parseCacheEntry)
+		if now.Sub(e.walltime) > c.maxAge {
+			delete(c.m, e.key)
+		} else {
+			heap.Push(&c.lru, e)
+			break
+		}
+	}
+}
+
 // allocateSpace reserves the next n bytes of token.Pos space in the
 // cache.
 //
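The newParseCache/stop/gc trio above follows a common lifecycle pattern: the constructor starts a background goroutine that wakes on a ticker and exits when a done channel is closed. Below is a self-contained sketch of just that pattern, with the cache-specific work reduced to a callback; the sweeper type and its names are invented for illustration and are not part of gopls.

package main

import (
    "fmt"
    "sync"
    "time"
)

// sweeper periodically runs a cleanup function until stopped.
type sweeper struct {
    done     chan struct{}
    stopOnce sync.Once
}

// newSweeper starts the background goroutine. Callers must call Stop when the
// sweeper is no longer in use, or the goroutine (and its ticker) will leak.
func newSweeper(period time.Duration, clean func()) *sweeper {
    s := &sweeper{done: make(chan struct{})}
    go func() {
        ticker := time.NewTicker(period)
        defer ticker.Stop()
        for {
            select {
            case <-s.done:
                return
            case <-ticker.C:
            }
            clean()
        }
    }()
    return s
}

// Stop causes the background goroutine to exit; it is safe to call twice.
func (s *sweeper) Stop() {
    s.stopOnce.Do(func() { close(s.done) })
}

func main() {
    s := newSweeper(50*time.Millisecond, func() {
        fmt.Println("collecting expired entries")
    })
    time.Sleep(180 * time.Millisecond) // let a few sweeps run
    s.Stop()
}

Within each sweep, gcOnce in the diff pops entries from the min-atime heap and stops at the first entry newer than maxAge, or as soon as only parseCacheMinFiles entries remain, so a sweep does work proportional to the number of evictions rather than to the cache size.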