// Copyright (c) 2020, The Garble Authors.
// See LICENSE for licensing information.

package main

import (
	_ "embed"
	"flag"
	"fmt"
	"math/rand/v2"
	"os"
	"os/exec"
	"path/filepath"
	"regexp"
	"strconv"
	"strings"
	"testing"
	"time"

	"github.com/go-quicktest/qt"
)

//go:embed testdata/bench/main.go
var benchSourceMain []byte

var (
	rxBuiltRuntime = regexp.MustCompile(`(?m)^runtime$`)
	rxBuiltMain    = regexp.MustCompile(`(?m)^test/main$`)
)

// BenchmarkBuild is a benchmark for 'garble build' on a fairly simple
// main package with a handful of standard library depedencies.
//
// We use a real garble binary and exec it, to simulate what the real user would
// run. The real obfuscation and compilation will happen in sub-processes
// anyway, so skipping one exec layer doesn't help us in any way.
//
// The benchmark isn't parallel, because in practice users build once at a time,
// and each build already spawns concurrent processes and goroutines to do work.
//
// At the moment, each iteration takes 1-2s on a laptop, so we can't make the
// benchmark include any more features unless we make it significantly faster.
func BenchmarkBuild(b *testing.B) {
	// As of Go 1.17, using -benchtime=Nx with N larger than 1 results in two
	// calls to BenchmarkBuild, with the first having b.N==1 to discover
	// sub-benchmarks. Unfortunately, we do a significant amount of work both
	// during setup and during that first iteration, which is pointless.
	// To avoid that, detect the scenario in a hacky way, and return early.
	// See https://github.com/golang/go/issues/32051.
	benchtime := flag.Lookup("test.benchtime").Value.String()
	if b.N == 1 && strings.HasSuffix(benchtime, "x") && benchtime != "1x" {
		return
	}
	tdir := b.TempDir()

	// We collect extra metrics.
	var memoryAllocs, cachedTime, systemTime int64

	outputBin := filepath.Join(tdir, "output")
	sourceDir := filepath.Join(tdir, "src")
	qt.Assert(b, qt.IsNil(os.Mkdir(sourceDir, 0o777)))

	writeSourceFile := func(name string, content []byte) {
		err := os.WriteFile(filepath.Join(sourceDir, name), content, 0o666)
		qt.Assert(b, qt.IsNil(err))
	}
	writeSourceFile("go.mod", []byte("module test/main"))
	writeSourceFile("main.go", benchSourceMain)

	rxGarbleAllocs := regexp.MustCompile(`(?m)^garble allocs: ([0-9]+)`)

	b.ResetTimer()
	b.StopTimer()
	for i := range b.N {
		// First we do a fresh build, using empty cache directories,
		// and the second does an incremental rebuild reusing the same cache directories.
		goCache := filepath.Join(tdir, "go-cache")
		qt.Assert(b, qt.IsNil(os.RemoveAll(goCache)))
		qt.Assert(b, qt.IsNil(os.Mkdir(goCache, 0o777)))
		garbleCache := filepath.Join(tdir, "garble-cache")
		qt.Assert(b, qt.IsNil(os.RemoveAll(garbleCache)))
		qt.Assert(b, qt.IsNil(os.Mkdir(garbleCache, 0o777)))
		env := []string{
			"RUN_GARBLE_MAIN=true",
			"GOCACHE=" + goCache,
			"GARBLE_CACHE=" + garbleCache,
			"GARBLE_WRITE_ALLOCS=true",
		}
		if prof := flag.Lookup("test.cpuprofile").Value.String(); prof != "" {
			// Ensure the directory is empty and created, and pass it along, so that the garble
			// sub-processes can also write CPU profiles.
			// Collect and then merge the profiles as follows:
			//
			//    go test -run=- -vet=off -bench=. -benchtime=5x -cpuprofile=cpu.pprof
			//    go tool pprof -proto cpu.pprof cpu.pprof-subproc/* >merged.pprof
			dir, err := filepath.Abs(prof + "-subproc")
			qt.Assert(b, qt.IsNil(err))
			err = os.RemoveAll(dir)
			qt.Assert(b, qt.IsNil(err))
			err = os.MkdirAll(dir, 0o777)
			qt.Assert(b, qt.IsNil(err))
			env = append(env, "GARBLE_WRITE_CPUPROFILES="+dir)
		}
		if prof := flag.Lookup("test.memprofile").Value.String(); prof != "" {
			// Same as before, but for allocation profiles.
			dir, err := filepath.Abs(prof + "-subproc")
			qt.Assert(b, qt.IsNil(err))
			err = os.RemoveAll(dir)
			qt.Assert(b, qt.IsNil(err))
			err = os.MkdirAll(dir, 0o777)
			qt.Assert(b, qt.IsNil(err))
			env = append(env, "GARBLE_WRITE_MEMPROFILES="+dir)
		}
		args := []string{"build", "-v", "-o=" + outputBin, sourceDir}

		for _, cached := range []bool{false, true} {
			// The cached rebuild will reuse all dependencies,
			// but rebuild the main package itself.
			if cached {
				writeSourceFile("rebuild.go", fmt.Appendf(nil, "package main\nvar v%d int", i))
			}

			cmd := exec.Command(os.Args[0], args...)
			cmd.Env = append(cmd.Environ(), env...)
			cmd.Dir = sourceDir

			cachedStart := time.Now()
			b.StartTimer()
			out, err := cmd.CombinedOutput()
			b.StopTimer()
			if cached {
				cachedTime += time.Since(cachedStart).Nanoseconds()
			}

			qt.Assert(b, qt.IsNil(err), qt.Commentf("output: %s", out))
			if !cached {
				// Ensure that we built all packages, as expected.
				qt.Assert(b, qt.IsTrue(rxBuiltRuntime.Match(out)))
			} else {
				// Ensure that we only rebuilt the main package, as expected.
				qt.Assert(b, qt.IsFalse(rxBuiltRuntime.Match(out)))
			}
			qt.Assert(b, qt.IsTrue(rxBuiltMain.Match(out)))

			matches := rxGarbleAllocs.FindAllSubmatch(out, -1)
			if !cached {
				// The non-cached version should have at least a handful of
				// sub-processes; catch if our logic breaks.
				qt.Assert(b, qt.IsTrue(len(matches) > 5))
			}
			for _, match := range matches {
				allocs, err := strconv.ParseInt(string(match[1]), 10, 64)
				qt.Assert(b, qt.IsNil(err))
				memoryAllocs += allocs
			}

			systemTime += int64(cmd.ProcessState.SystemTime())
		}
	}
	// We can't use "allocs/op" as it's reserved for ReportAllocs.
	b.ReportMetric(float64(memoryAllocs)/float64(b.N), "mallocs/op")
	b.ReportMetric(float64(cachedTime)/float64(b.N), "cached-ns/op")
	b.ReportMetric(float64(systemTime)/float64(b.N), "sys-ns/op")
	info, err := os.Stat(outputBin)
	if err != nil {
		b.Fatal(err)
	}
	b.ReportMetric(float64(info.Size()), "bin-B")
}

func BenchmarkAbiOriginalNames(b *testing.B) {
	// Benchmark two thousand obfuscated names in _originalNamePairs
	// and a variety of input strings to reverse.
	// As an example, the cmd/go binary ends up with about 2200 entries
	// in _originalNamePairs as of November 2024, so it's a realistic figure.
	// Structs with tens of fields are also relatively normal.
	salt := []byte("some salt bytes")
	for n := range 2000 {
		name := fmt.Sprintf("name_%d", n)
		garbled := hashWithCustomSalt(salt, name)
		_originalNamePairs = append(_originalNamePairs, garbled, name)
	}
	_originalNamesInit()
	// Pick twenty obfuscated names at random to use as inputs below.
	// Use a deterministic random source so it's stable between benchmark runs.
	rnd := rand.New(rand.NewPCG(1, 2))
	var chosen []string
	for i := 0; i < len(_originalNamePairs); i += 2 {
		chosen = append(chosen, _originalNamePairs[i])
	}
	rnd.Shuffle(len(chosen), func(i, j int) {
		chosen[i], chosen[j] = chosen[j], chosen[i]
	})
	chosen = chosen[:20]

	inputs := []string{
		// non-obfuscated names and types
		"Error",
		"int",
		"*[]*interface {}",
		"*map[uint64]bool",
		// an obfuscated name
		chosen[0],
		// an obfuscated *pkg.Name
		fmt.Sprintf("*%s.%s", chosen[1], chosen[2]),
		// big struct with more than a dozen string field types
		fmt.Sprintf("struct { %s string }", strings.Join(chosen[3:], " string ")),
	}

	var inputBytes int
	for _, input := range inputs {
		inputBytes += len(input)
	}
	b.SetBytes(int64(inputBytes))
	b.ReportAllocs()
	b.ResetTimer()

	// We use a parallel benchmark because internal/abi's Name method
	// is meant to be called by any goroutine at any time.
	b.RunParallel(func(pb *testing.PB) {
		for pb.Next() {
			for _, input := range inputs {
				_originalNames(input)
			}
		}
	})
	_originalNamePairs = []string{}
	_originalNamesReplacer = nil
}