You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
garble/bench_test.go

230 lines
7.5 KiB
Go

// Copyright (c) 2020, The Garble Authors.
// See LICENSE for licensing information.
package main
import (
_ "embed"
"flag"
"fmt"
"math/rand/v2"
"os"
"os/exec"
"path/filepath"
"regexp"
"strconv"
"strings"
"testing"
"time"
"github.com/go-quicktest/qt"
)
//go:embed testdata/bench/main.go
var benchSourceMain []byte
var (
rxBuiltRuntime = regexp.MustCompile(`(?m)^runtime$`)
rxBuiltMain = regexp.MustCompile(`(?m)^test/main$`)
)
// BenchmarkBuild is a benchmark for 'garble build' on a fairly simple
// main package with a handful of standard library depedencies.
//
// We use a real garble binary and exec it, to simulate what the real user would
// run. The real obfuscation and compilation will happen in sub-processes
// anyway, so skipping one exec layer doesn't help us in any way.
//
// The benchmark isn't parallel, because in practice users build once at a time,
// and each build already spawns concurrent processes and goroutines to do work.
//
// At the moment, each iteration takes 1-2s on a laptop, so we can't make the
// benchmark include any more features unless we make it significantly faster.
func BenchmarkBuild(b *testing.B) {
// As of Go 1.17, using -benchtime=Nx with N larger than 1 results in two
// calls to BenchmarkBuild, with the first having b.N==1 to discover
// sub-benchmarks. Unfortunately, we do a significant amount of work both
// during setup and during that first iteration, which is pointless.
// To avoid that, detect the scenario in a hacky way, and return early.
// See https://github.com/golang/go/issues/32051.
benchtime := flag.Lookup("test.benchtime").Value.String()
if b.N == 1 && strings.HasSuffix(benchtime, "x") && benchtime != "1x" {
return
}
tdir := b.TempDir()
// We collect extra metrics.
var memoryAllocs, cachedTime, systemTime int64
outputBin := filepath.Join(tdir, "output")
sourceDir := filepath.Join(tdir, "src")
qt.Assert(b, qt.IsNil(os.Mkdir(sourceDir, 0o777)))
writeSourceFile := func(name string, content []byte) {
err := os.WriteFile(filepath.Join(sourceDir, name), content, 0o666)
qt.Assert(b, qt.IsNil(err))
}
writeSourceFile("go.mod", []byte("module test/main"))
writeSourceFile("main.go", benchSourceMain)
rxGarbleAllocs := regexp.MustCompile(`(?m)^garble allocs: ([0-9]+)`)
b.ResetTimer()
b.StopTimer()
for i := range b.N {
// First we do a fresh build, using empty cache directories,
// and the second does an incremental rebuild reusing the same cache directories.
goCache := filepath.Join(tdir, "go-cache")
qt.Assert(b, qt.IsNil(os.RemoveAll(goCache)))
qt.Assert(b, qt.IsNil(os.Mkdir(goCache, 0o777)))
garbleCache := filepath.Join(tdir, "garble-cache")
qt.Assert(b, qt.IsNil(os.RemoveAll(garbleCache)))
qt.Assert(b, qt.IsNil(os.Mkdir(garbleCache, 0o777)))
env := []string{
"RUN_GARBLE_MAIN=true",
"GOCACHE=" + goCache,
"GARBLE_CACHE=" + garbleCache,
"GARBLE_WRITE_ALLOCS=true",
}
if prof := flag.Lookup("test.cpuprofile").Value.String(); prof != "" {
// Ensure the directory is empty and created, and pass it along, so that the garble
// sub-processes can also write CPU profiles.
// Collect and then merge the profiles as follows:
//
// go test -run=- -vet=off -bench=. -benchtime=5x -cpuprofile=cpu.pprof
// go tool pprof -proto cpu.pprof cpu.pprof-subproc/* >merged.pprof
dir, err := filepath.Abs(prof + "-subproc")
qt.Assert(b, qt.IsNil(err))
err = os.RemoveAll(dir)
qt.Assert(b, qt.IsNil(err))
err = os.MkdirAll(dir, 0o777)
qt.Assert(b, qt.IsNil(err))
env = append(env, "GARBLE_WRITE_CPUPROFILES="+dir)
}
if prof := flag.Lookup("test.memprofile").Value.String(); prof != "" {
// Same as before, but for allocation profiles.
dir, err := filepath.Abs(prof + "-subproc")
qt.Assert(b, qt.IsNil(err))
err = os.RemoveAll(dir)
qt.Assert(b, qt.IsNil(err))
err = os.MkdirAll(dir, 0o777)
qt.Assert(b, qt.IsNil(err))
env = append(env, "GARBLE_WRITE_MEMPROFILES="+dir)
}
args := []string{"build", "-v", "-o=" + outputBin, sourceDir}
for _, cached := range []bool{false, true} {
// The cached rebuild will reuse all dependencies,
// but rebuild the main package itself.
if cached {
writeSourceFile("rebuild.go", fmt.Appendf(nil, "package main\nvar v%d int", i))
}
cmd := exec.Command(os.Args[0], args...)
cmd.Env = append(cmd.Environ(), env...)
cmd.Dir = sourceDir
cachedStart := time.Now()
b.StartTimer()
out, err := cmd.CombinedOutput()
b.StopTimer()
if cached {
cachedTime += time.Since(cachedStart).Nanoseconds()
}
qt.Assert(b, qt.IsNil(err), qt.Commentf("output: %s", out))
if !cached {
// Ensure that we built all packages, as expected.
qt.Assert(b, qt.IsTrue(rxBuiltRuntime.Match(out)))
} else {
// Ensure that we only rebuilt the main package, as expected.
qt.Assert(b, qt.IsFalse(rxBuiltRuntime.Match(out)))
}
qt.Assert(b, qt.IsTrue(rxBuiltMain.Match(out)))
matches := rxGarbleAllocs.FindAllSubmatch(out, -1)
if !cached {
// The non-cached version should have at least a handful of
// sub-processes; catch if our logic breaks.
qt.Assert(b, qt.IsTrue(len(matches) > 5))
}
for _, match := range matches {
allocs, err := strconv.ParseInt(string(match[1]), 10, 64)
qt.Assert(b, qt.IsNil(err))
memoryAllocs += allocs
}
systemTime += int64(cmd.ProcessState.SystemTime())
}
}
// We can't use "allocs/op" as it's reserved for ReportAllocs.
b.ReportMetric(float64(memoryAllocs)/float64(b.N), "mallocs/op")
b.ReportMetric(float64(cachedTime)/float64(b.N), "cached-ns/op")
b.ReportMetric(float64(systemTime)/float64(b.N), "sys-ns/op")
info, err := os.Stat(outputBin)
if err != nil {
b.Fatal(err)
}
b.ReportMetric(float64(info.Size()), "bin-B")
}
func BenchmarkAbiOriginalNames(b *testing.B) {
// Benchmark two thousand obfuscated names in _originalNamePairs
// and a variety of input strings to reverse.
// As an example, the cmd/go binary ends up with about 2200 entries
// in _originalNamePairs as of November 2024, so it's a realistic figure.
// Structs with tens of fields are also relatively normal.
salt := []byte("some salt bytes")
for n := range 2000 {
name := fmt.Sprintf("name_%d", n)
garbled := hashWithCustomSalt(salt, name)
_originalNamePairs = append(_originalNamePairs, garbled, name)
}
_originalNamesInit()
// Pick twenty obfuscated names at random to use as inputs below.
// Use a deterministic random source so it's stable between benchmark runs.
rnd := rand.New(rand.NewPCG(1, 2))
var chosen []string
for i := 0; i < len(_originalNamePairs); i += 2 {
chosen = append(chosen, _originalNamePairs[i])
}
rnd.Shuffle(len(chosen), func(i, j int) {
chosen[i], chosen[j] = chosen[j], chosen[i]
})
chosen = chosen[:20]
inputs := []string{
// non-obfuscated names and types
"Error",
"int",
"*[]*interface {}",
"*map[uint64]bool",
// an obfuscated name
chosen[0],
// an obfuscated *pkg.Name
fmt.Sprintf("*%s.%s", chosen[1], chosen[2]),
// big struct with more than a dozen string field types
fmt.Sprintf("struct { %s string }", strings.Join(chosen[3:], " string ")),
}
var inputBytes int
for _, input := range inputs {
inputBytes += len(input)
}
b.SetBytes(int64(inputBytes))
b.ReportAllocs()
b.ResetTimer()
// We use a parallel benchmark because internal/abi's Name method
// is meant to be called by any goroutine at any time.
b.RunParallel(func(pb *testing.PB) {
for pb.Next() {
for _, input := range inputs {
_originalNames(input)
}
}
})
_originalNamePairs = []string{}
_originalNamesReplacer = nil
}