replace listedPackage.Deps in favor of a derived map

In looking at the cpu and memory profiles, it surfaced that we spent
a lot of time in garbage collection, and a significant amount of the
garbage was produced by gob decoding string slices.

listedPackage.Deps is a list of a package's transitive dependencies,
so as a Go build gets larger, the list also gets larger and larger.

Given that Imports is the list of direct dependencies,
we can reconstruct it ourselves as needed, which is not always.
Moreover, since we want to do lookups, we can build a map directly.

This doesn't directly result in a wall time speed-up,
but it does result in a significant reduction in allocations.
The gob files we store in the disk cache should also be a bit smaller.

            │      old      │               new               │
            │ cached-sec/op │ cached-sec/op  vs base          │
    Build-8     339.5m ± 2%     340.3m ± 1%  ~ (p=0.218 n=10)

            │     old     │                new                 │
            │ mallocs/op  │ mallocs/op   vs base               │
    Build-8   38.08M ± 0%   35.73M ± 0%  -6.18% (p=0.000 n=10)
pull/850/head
Daniel Martí 4 months ago committed by Paul Scheduikat
parent ec5b6df439
commit 8a7d91b684

@ -146,7 +146,6 @@ type listedPackage struct {
ForTest string
Export string
BuildID string
Deps []string
ImportMap map[string]string
Standard bool
@ -161,6 +160,11 @@ type listedPackage struct {
// between garble processes. Use "Garble" as a prefix to ensure no
// collisions with the JSON fields from 'go list'.
// allDeps is like the Deps field given by 'go list', but in the form of a map
// for the sake of fast lookups. It's also unnecessary to consume or store Deps
// as returned by 'go list', as it can be reconstructed from Imports.
allDeps map[string]struct{}
// GarbleActionID is a hash combining the Action ID from BuildID,
// with Garble's own inputs as per addGarbleToHash.
// It is set even when ToObfuscate is false, as it is also used for random
@ -172,6 +176,33 @@ type listedPackage struct {
ToObfuscate bool `json:"-"`
}
func (p *listedPackage) hasDep(path string) bool {
if p.allDeps == nil {
p.allDeps = make(map[string]struct{}, len(p.Imports)*2)
p.addImportsFrom(p)
}
_, ok := p.allDeps[path]
return ok
}
func (p *listedPackage) addImportsFrom(from *listedPackage) {
for _, path := range from.Imports {
if path == "C" {
// `go list -json` shows "C" in Imports but not Deps.
// See https://go.dev/issue/60453.
continue
}
if path2 := from.ImportMap[path]; path2 != "" {
path = path2
}
if _, ok := p.allDeps[path]; ok {
continue // already added
}
p.allDeps[path] = struct{}{}
p.addImportsFrom(sharedCache.ListedPackages[path])
}
}
type packageError struct {
Pos string
Err string
@ -419,10 +450,8 @@ func listPackage(from *listedPackage, path string) (*listedPackage, error) {
// Packages outside std can list any package,
// as long as they depend on it directly or indirectly.
for _, dep := range from.Deps {
if dep == pkg.ImportPath {
return pkg, nil
}
if from.hasDep(pkg.ImportPath) {
return pkg, nil
}
// As a special case, any package can list runtime or its dependencies,
@ -432,10 +461,8 @@ func listPackage(from *listedPackage, path string) (*listedPackage, error) {
if pkg.ImportPath == "runtime" {
return pkg, nil
}
for _, dep := range sharedCache.ListedPackages["runtime"].Deps {
if dep == pkg.ImportPath {
return pkg, nil
}
if sharedCache.ListedPackages["runtime"].hasDep(pkg.ImportPath) {
return pkg, nil
}
return nil, fmt.Errorf("list %s: %w", path, ErrNotDependency)

Loading…
Cancel
Save