|
|
|
// Copyright (c) 2020, The Garble Authors.
|
|
|
|
// See LICENSE for licensing information.
|
|
|
|
|
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"go/ast"
|
patch and rebuild cmd/link to modify the magic value in pclntab
This value is hard-coded in the linker and written in a header.
We could rewrite the final binary, like we used to do with import paths,
but that would require once again maintaining libraries to do so.
Instead, we're now modifying the linker to do what we want.
It's not particularly hard, as every Go install has its source code,
and rebuilding a slightly modified linker only takes a few seconds at most.
Thanks to `go build -overlay`, we only need to copy the files we modify,
and right now we're just modifying one file in the toolchain.
We use a git patch, as the change is fairly static and small,
and the patch is easier to understand and maintain.
The other side of this change is in the runtime,
as it also hard-codes the magic value when loading information.
We modify the code via syntax trees in that case, like `-tiny` does,
because the change is tiny (one literal) and the affected lines of code
are modified regularly between major Go releases.
Since rebuilding a slightly modified linker can take a few seconds,
and Go's build cache does not cache linked binaries,
we keep our own cached version of the rebuilt binary in `os.UserCacheDir`.
The feature isn't perfect, and will be improved in the future.
See the TODOs about the added dependency on `git`,
or how we are currently only able to cache one linker binary at once.
Fixes #622.
2 years ago
|
|
|
"go/token"
|
|
|
|
"strconv"
|
|
|
|
"strings"
|
|
|
|
|
|
|
|
ah "mvdan.cc/garble/internal/asthelper"
|
|
|
|
)
|
|
|
|
|
patch and rebuild cmd/link to modify the magic value in pclntab
This value is hard-coded in the linker and written in a header.
We could rewrite the final binary, like we used to do with import paths,
but that would require once again maintaining libraries to do so.
Instead, we're now modifying the linker to do what we want.
It's not particularly hard, as every Go install has its source code,
and rebuilding a slightly modified linker only takes a few seconds at most.
Thanks to `go build -overlay`, we only need to copy the files we modify,
and right now we're just modifying one file in the toolchain.
We use a git patch, as the change is fairly static and small,
and the patch is easier to understand and maintain.
The other side of this change is in the runtime,
as it also hard-codes the magic value when loading information.
We modify the code via syntax trees in that case, like `-tiny` does,
because the change is tiny (one literal) and the affected lines of code
are modified regularly between major Go releases.
Since rebuilding a slightly modified linker can take a few seconds,
and Go's build cache does not cache linked binaries,
we keep our own cached version of the rebuilt binary in `os.UserCacheDir`.
The feature isn't perfect, and will be improved in the future.
See the TODOs about the added dependency on `git`,
or how we are currently only able to cache one linker binary at once.
Fixes #622.
2 years ago
|
|
|
// updateMagicValue replaces the hardcoded value that hdr.magic is compared
// against when the header is verified in symtab.go.
//
// Only the first declaration named moduledataverify1 in file is inspected.
// Inside it, every `hdr.magic != <literal>` comparison gets its literal
// swapped for magicValue, written as a decimal integer.
// It panics if no such comparison was rewritten.
func updateMagicValue(file *ast.File, magicValue uint32) {
	// isHdrMagic reports whether expr is exactly the selector `hdr.magic`.
	isHdrMagic := func(expr ast.Expr) bool {
		sel, isSel := expr.(*ast.SelectorExpr)
		if !isSel {
			return false
		}
		recv, isIdent := sel.X.(*ast.Ident)
		return isIdent && recv.Name == "hdr" && sel.Sel.Name == "magic"
	}

	patched := false

	// Find `hdr.magic != 0xfffffff?` in symtab.go and update to random magicValue
	patchComparison := func(n ast.Node) bool {
		cmp, isBinary := n.(*ast.BinaryExpr)
		if !isBinary || cmp.Op != token.NEQ || !isHdrMagic(cmp.X) {
			return true
		}
		// Only a literal right-hand side is the hardcoded magic value.
		if _, isLit := cmp.Y.(*ast.BasicLit); !isLit {
			return true
		}

		cmp.Y = &ast.BasicLit{
			Kind:  token.INT,
			Value: strconv.FormatUint(uint64(magicValue), 10),
		}
		patched = true
		// Nothing below the rewritten comparison needs visiting.
		return false
	}

	for _, decl := range file.Decls {
		fn, isFunc := decl.(*ast.FuncDecl)
		if !isFunc || fn.Name.Name != "moduledataverify1" {
			continue
		}
		ast.Inspect(fn, patchComparison)
		break
	}

	if !patched {
		panic("magic value not updated")
	}
}
|
|
|
|
|
|
|
|
// updateEntryOffset adds xor encryption for funcInfo.entryoff
|
|
|
|
// Encryption algorithm contains 1 xor and 1 multiply operations and is not cryptographically strong.
|
|
|
|
// Its goal, without slowing down program performance (reflection, stacktrace),
|
|
|
|
// is to make it difficult to determine relations between function metadata and function itself in a binary file.
|
|
|
|
// Difficulty of decryption is based on the difficulty of finding a small (probably inlined) entry() function without obvious patterns.
|
|
|
|
func updateEntryOffset(file *ast.File, entryOffKey uint32) {
|
update gotip and adapt to upstream changes
https://go.dev/cl/466095 lightly refactored the runtime
in a way that broke extractNameOff. In particular, the code
func cfuncname(f funcInfo) *byte {
if !f.valid() || f.nameOff == 0 {
return nil
}
return &f.datap.funcnametab[f.nameOff]
}
func funcname(f funcInfo) string {
return gostringnocopy(cfuncname(f))
}
is now simply
func funcname(f funcInfo) string {
if !f.valid() {
return ""
}
return f.datap.funcName(f.nameOff)
}
Since extractNameOff looked for the func named cfuncname,
and looked for the nameOff selector inside an index expression,
all of that code no longer worked properly.
It all existed to find the name of the field, nameOff,
so that we would automatically adapt if upstream renames it.
Unsurprisingly, the code using the field got refactored first.
It doesn't seem like the extra code on our part is helping us,
and assuming the name of the field works for all Go versions,
so do that instead.
If upstream does rename the field in the future,
the obfuscated Go builds will start failing in an obvious way.
If or when that comes to pass, we can change our constant string.
2 years ago
|
|
|
// Note that this field could be renamed in future Go versions.
|
|
|
|
const nameOffField = "nameOff"
|
|
|
|
entryOffUpdated := false
|
|
|
|
|
update gotip and adapt to upstream changes
https://go.dev/cl/466095 lightly refactored the runtime
in a way that broke extractNameOff. In particular, the code
func cfuncname(f funcInfo) *byte {
if !f.valid() || f.nameOff == 0 {
return nil
}
return &f.datap.funcnametab[f.nameOff]
}
func funcname(f funcInfo) string {
return gostringnocopy(cfuncname(f))
}
is now simply
func funcname(f funcInfo) string {
if !f.valid() {
return ""
}
return f.datap.funcName(f.nameOff)
}
Since extractNameOff looked for the func named cfuncname,
and looked for the nameOff selector inside an index expression,
all of that code no longer worked properly.
It all existed to find the name of the field, nameOff,
so that we would automatically adapt if upstream renames it.
Unsurprisingly, the code using the field got refactored first.
It doesn't seem like the extra code on our part is helping us,
and assuming the name of the field works for all Go versions,
so do that instead.
If upstream does rename the field in the future,
the obfuscated Go builds will start failing in an obvious way.
If or when that comes to pass, we can change our constant string.
2 years ago
|
|
|
// During linker stage we encrypt funcInfo.entryoff using a random number and funcInfo.nameOff,
|
|
|
|
// for correct program functioning we must decrypt funcInfo.entryoff at any access to it.
|
|
|
|
// In runtime package all references to funcInfo.entryOff are made through one method entry():
|
|
|
|
// func (f funcInfo) entry() uintptr {
|
|
|
|
// return f.datap.textAddr(f.entryoff)
|
|
|
|
// }
|
|
|
|
// It is enough to inject decryption into entry() method for program to start working transparently with encrypted value of funcInfo.entryOff:
|
|
|
|
// func (f funcInfo) entry() uintptr {
|
update gotip and adapt to upstream changes
https://go.dev/cl/466095 lightly refactored the runtime
in a way that broke extractNameOff. In particular, the code
func cfuncname(f funcInfo) *byte {
if !f.valid() || f.nameOff == 0 {
return nil
}
return &f.datap.funcnametab[f.nameOff]
}
func funcname(f funcInfo) string {
return gostringnocopy(cfuncname(f))
}
is now simply
func funcname(f funcInfo) string {
if !f.valid() {
return ""
}
return f.datap.funcName(f.nameOff)
}
Since extractNameOff looked for the func named cfuncname,
and looked for the nameOff selector inside an index expression,
all of that code no longer worked properly.
It all existed to find the name of the field, nameOff,
so that we would automatically adapt if upstream renames it.
Unsurprisingly, the code using the field got refactored first.
It doesn't seem like the extra code on our part is helping us,
and assuming the name of the field works for all Go versions,
so do that instead.
If upstream does rename the field in the future,
the obfuscated Go builds will start failing in an obvious way.
If or when that comes to pass, we can change our constant string.
2 years ago
|
|
|
// return f.datap.textAddr(f.entryoff ^ (uint32(f.nameOff) * <random int>))
|
|
|
|
// }
|
|
|
|
updateEntryOff := func(node ast.Node) bool {
|
|
|
|
callExpr, ok := node.(*ast.CallExpr)
|
|
|
|
if !ok {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
textSelExpr, ok := callExpr.Fun.(*ast.SelectorExpr)
|
|
|
|
if !ok || textSelExpr.Sel.Name != "textAddr" {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
selExpr, ok := callExpr.Args[0].(*ast.SelectorExpr)
|
|
|
|
if !ok {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
callExpr.Args[0] = &ast.BinaryExpr{
|
|
|
|
X: selExpr,
|
|
|
|
Op: token.XOR,
|
|
|
|
Y: &ast.ParenExpr{X: &ast.BinaryExpr{
|
|
|
|
X: ah.CallExpr(ast.NewIdent("uint32"), &ast.SelectorExpr{
|
|
|
|
X: selExpr.X,
|
|
|
|
Sel: ast.NewIdent(nameOffField),
|
|
|
|
}),
|
|
|
|
Op: token.MUL,
|
|
|
|
Y: &ast.BasicLit{
|
|
|
|
Kind: token.INT,
|
|
|
|
Value: strconv.FormatUint(uint64(entryOffKey), 10),
|
|
|
|
},
|
|
|
|
}},
|
|
|
|
}
|
|
|
|
entryOffUpdated = true
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
var entryFunc *ast.FuncDecl
|
|
|
|
for _, decl := range file.Decls {
|
update gotip and adapt to upstream changes
https://go.dev/cl/466095 lightly refactored the runtime
in a way that broke extractNameOff. In particular, the code
func cfuncname(f funcInfo) *byte {
if !f.valid() || f.nameOff == 0 {
return nil
}
return &f.datap.funcnametab[f.nameOff]
}
func funcname(f funcInfo) string {
return gostringnocopy(cfuncname(f))
}
is now simply
func funcname(f funcInfo) string {
if !f.valid() {
return ""
}
return f.datap.funcName(f.nameOff)
}
Since extractNameOff looked for the func named cfuncname,
and looked for the nameOff selector inside an index expression,
all of that code no longer worked properly.
It all existed to find the name of the field, nameOff,
so that we would automatically adapt if upstream renames it.
Unsurprisingly, the code using the field got refactored first.
It doesn't seem like the extra code on our part is helping us,
and assuming the name of the field works for all Go versions,
so do that instead.
If upstream does rename the field in the future,
the obfuscated Go builds will start failing in an obvious way.
If or when that comes to pass, we can change our constant string.
2 years ago
|
|
|
decl, ok := decl.(*ast.FuncDecl)
|
|
|
|
if !ok {
|
|
|
|
continue
|
|
|
|
}
|
update gotip and adapt to upstream changes
https://go.dev/cl/466095 lightly refactored the runtime
in a way that broke extractNameOff. In particular, the code
func cfuncname(f funcInfo) *byte {
if !f.valid() || f.nameOff == 0 {
return nil
}
return &f.datap.funcnametab[f.nameOff]
}
func funcname(f funcInfo) string {
return gostringnocopy(cfuncname(f))
}
is now simply
func funcname(f funcInfo) string {
if !f.valid() {
return ""
}
return f.datap.funcName(f.nameOff)
}
Since extractNameOff looked for the func named cfuncname,
and looked for the nameOff selector inside an index expression,
all of that code no longer worked properly.
It all existed to find the name of the field, nameOff,
so that we would automatically adapt if upstream renames it.
Unsurprisingly, the code using the field got refactored first.
It doesn't seem like the extra code on our part is helping us,
and assuming the name of the field works for all Go versions,
so do that instead.
If upstream does rename the field in the future,
the obfuscated Go builds will start failing in an obvious way.
If or when that comes to pass, we can change our constant string.
2 years ago
|
|
|
if decl.Name.Name == "entry" {
|
|
|
|
entryFunc = decl
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if entryFunc == nil {
|
|
|
|
panic("entry function not found")
|
|
|
|
}
|
|
|
|
|
|
|
|
ast.Inspect(entryFunc, updateEntryOff)
|
|
|
|
if !entryOffUpdated {
|
|
|
|
panic("entryOff not found")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// stripRuntime removes unnecessary code from the runtime,
|
|
|
|
// such as panic and fatal error printing, and code that
|
|
|
|
// prints trace/debug info of the runtime.
|
|
|
|
func stripRuntime(basename string, file *ast.File) {
|
|
|
|
stripPrints := func(node ast.Node) bool {
|
|
|
|
call, ok := node.(*ast.CallExpr)
|
|
|
|
if !ok {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
id, ok := call.Fun.(*ast.Ident)
|
|
|
|
if !ok {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
switch id.Name {
|
|
|
|
case "print", "println":
|
|
|
|
id.Name = "hidePrint"
|
|
|
|
return false
|
|
|
|
default:
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, decl := range file.Decls {
|
|
|
|
funcDecl, ok := decl.(*ast.FuncDecl)
|
|
|
|
if !ok {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
switch basename {
|
|
|
|
case "error.go":
|
|
|
|
// only used in panics
|
|
|
|
switch funcDecl.Name.Name {
|
|
|
|
case "printany", "printanycustomtype":
|
|
|
|
funcDecl.Body.List = nil
|
|
|
|
}
|
|
|
|
case "mgcscavenge.go":
|
|
|
|
// used in tracing the scavenger
|
|
|
|
if funcDecl.Name.Name == "printScavTrace" {
|
|
|
|
funcDecl.Body.List = nil
|
|
|
|
}
|
|
|
|
case "mprof.go":
|
|
|
|
// remove all functions that print debug/tracing info
|
|
|
|
// of the runtime
|
|
|
|
if strings.HasPrefix(funcDecl.Name.Name, "trace") {
|
|
|
|
funcDecl.Body.List = nil
|
|
|
|
}
|
|
|
|
case "panic.go":
|
|
|
|
// used for printing panics
|
|
|
|
switch funcDecl.Name.Name {
|
|
|
|
case "preprintpanics", "printpanics":
|
|
|
|
funcDecl.Body.List = nil
|
|
|
|
}
|
|
|
|
case "print.go":
|
|
|
|
// only used in tracebacks
|
|
|
|
if funcDecl.Name.Name == "hexdumpWords" {
|
|
|
|
funcDecl.Body.List = nil
|
|
|
|
}
|
|
|
|
case "proc.go":
|
|
|
|
// used in tracing the scheduler
|
|
|
|
if funcDecl.Name.Name == "schedtrace" {
|
|
|
|
funcDecl.Body.List = nil
|
|
|
|
}
|
|
|
|
case "runtime1.go":
|
|
|
|
usesEnv := func(node ast.Node) bool {
|
|
|
|
for node := range ast.Preorder(node) {
|
|
|
|
ident, ok := node.(*ast.Ident)
|
|
|
|
if ok && ident.Name == "gogetenv" {
|
|
|
|
return true
|
small improvements towards obfuscating the runtime
I spent a couple of days trying to obfuscate all of std.
Ultimately I failed at making it fully work,
especially when it comes to the runtime package,
but I did fix a few problems along the way, as seen here.
First, fix the TODO to allow handleDirectives and transformGo to run on
runtime packages as well, if they are considered private. Note that this
is never true right now, but it matters once we remove runtimeRelated.
Second, modify parsedebugvars in a way that doesn't break typechecking.
We can remove AST nodes or even modify them in simple ways,
but if we add new AST nodes after typechecking,
those will lack type information.
We were replacing the entire body, running into that problem.
Instead, carefully cut the body to set some defaults,
but remove everything from the point GODEBUG is read.
Finally, add commented-out debug prints of transformed asm files.
For #193.
4 years ago
|
|
|
}
|
|
|
|
}
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
filenames:
|
|
|
|
switch funcDecl.Name.Name {
|
|
|
|
case "parsedebugvars":
|
|
|
|
// keep defaults for GODEBUG cgocheck and invalidptr,
|
|
|
|
// remove code that reads GODEBUG via gogetenv
|
|
|
|
for i, stmt := range funcDecl.Body.List {
|
|
|
|
if usesEnv(stmt) {
|
|
|
|
funcDecl.Body.List = funcDecl.Body.List[:i]
|
|
|
|
break filenames
|
|
|
|
}
|
|
|
|
}
|
|
|
|
panic("did not see any gogetenv call in parsedebugvars")
|
|
|
|
case "setTraceback":
|
|
|
|
// tracebacks are completely hidden, no
|
|
|
|
// sense keeping this function
|
|
|
|
funcDecl.Body.List = nil
|
|
|
|
}
|
|
|
|
case "traceback.go":
|
|
|
|
// only used for printing tracebacks
|
|
|
|
switch funcDecl.Name.Name {
|
|
|
|
case "tracebackdefers", "printcreatedby", "printcreatedby1", "traceback", "tracebacktrap", "traceback1", "printAncestorTraceback",
|
|
|
|
"printAncestorTracebackFuncInfo", "goroutineheader", "tracebackothers", "tracebackHexdump", "printCgoTraceback":
|
|
|
|
funcDecl.Body.List = nil
|
|
|
|
case "printOneCgoTraceback":
|
|
|
|
funcDecl.Body = ah.BlockStmt(ah.ReturnStmt(ast.NewIdent("false")))
|
|
|
|
default:
|
|
|
|
if strings.HasPrefix(funcDecl.Name.Name, "print") {
|
|
|
|
funcDecl.Body.List = nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
if basename == "print.go" {
|
|
|
|
file.Decls = append(file.Decls, hidePrintDecl)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// replace all 'print' and 'println' statements in
|
|
|
|
// the runtime with an empty func, which will be
|
|
|
|
// optimized out by the compiler
|
|
|
|
ast.Inspect(file, stripPrints)
|
|
|
|
}
|
|
|
|
|
|
|
|
// hidePrintDecl is the syntax tree of the declaration
//
//	func hidePrint(args ...interface{}) {}
//
// which stripRuntime appends to print.go, and which the renamed print and
// println calls in the other runtime files refer to.
var hidePrintDecl = &ast.FuncDecl{
	Name: ast.NewIdent("hidePrint"),
	Type: &ast.FuncType{
		Params: &ast.FieldList{List: []*ast.Field{{
			Names: []*ast.Ident{ast.NewIdent("args")},
			// Variadic parameter of the empty interface type.
			Type: &ast.Ellipsis{
				Elt: &ast.InterfaceType{Methods: new(ast.FieldList)},
			},
		}}},
	},
	Body: new(ast.BlockStmt),
}
|