Skip to content

Commit

Permalink
strip struct tags when hashing structs for type identity
Browse files Browse the repository at this point in the history
This was a long standing TODO, and a user finally ran into it.
The fix isn't terribly straightforward, but I'm pretty happy with it.

Add a test case where the same struct field is identical
with no tag, with the "tagged1" json tag, and again with "tagged2".
While here, we add a test case for a regular named field too.

Fixes #801.
  • Loading branch information
mvdan committed Nov 12, 2023
1 parent 08b3d9d commit 4551910
Show file tree
Hide file tree
Showing 4 changed files with 74 additions and 10 deletions.
72 changes: 64 additions & 8 deletions hash.go
Original file line number Diff line number Diff line change
Expand Up @@ -224,6 +224,9 @@ func entryOffKey() uint32 {
}

func hashWithPackage(pkg *listedPackage, name string) string {
// If the user provided us with an obfuscation seed,
// we use that with the package import path directly..
// Otherwise, we use GarbleActionID as a fallback salt.
if !flagSeed.present() {
return hashWithCustomSalt(pkg.GarbleActionID[:], name)
}
Expand All @@ -233,16 +236,69 @@ func hashWithPackage(pkg *listedPackage, name string) string {
return hashWithCustomSalt([]byte(pkg.ImportPath+"|"), name)
}

func hashWithStruct(strct *types.Struct, fieldName string) string {
// TODO: We should probably strip field tags here.
// Do we need to do anything else to make a
// struct type "canonical"?
fieldsSalt := []byte(strct.String())
// stripStructTags takes the bytes produced by [types.WriteType]
// and removes any struct tags in-place, such as rewriting
//
// struct{Foo int; Bar string "json:\"tagged1\""}
//
// into
//
// struct{Foo int; Bar string}
//
// Note that, unlike most Go source, WriteType uses double quotes for tags.
//
// Reusing WriteType does require a second pass over its output here,
// which we could save by implementing our own modified version of WriteType.
// However, that would be a significant amount of code to maintain.
func stripStructTags(p []byte) []byte {
i := 0
for i < len(p) {
b := p[i]
start := i - 1 // a struct tag is preceded by a space
i++
if b != '"' {
continue
}
// Find the closing double quote, skipping over escaped characters.
// Note that we should probably iterate over runes and not bytes,
// but this byte implementation is probably good enough in practice.
for {
b = p[i]
i++
if b == '\\' {
i++
} else if b == '"' {
break
}
}
end := i
p = append(p[:start], p[end:]...)
}
return p
}

var typeIdentityBuf bytes.Buffer

// hashWithStruct is separate from hashWithPackage since Go
// allows converting between struct types across packages.
// Hashing struct field names differently between packages would break that.
//
// We hash field names with the identity struct type as a salt
// so that the same field name used in different struct types is obfuscated differently.
// Note that "identity" means omitting struct tags since conversions ignore them.
func hashWithStruct(strct *types.Struct, field *types.Var) string {
typeIdentityBuf.Reset()
types.WriteType(&typeIdentityBuf, strct, nil)
salt := stripStructTags(typeIdentityBuf.Bytes())

// If the user provided us with an obfuscation seed,
// we only use the identity struct type as a salt.
// Otherwise, we add garble's own inputs to the salt as a fallback.
if !flagSeed.present() {
withGarbleHash := addGarbleToHash(fieldsSalt)
fieldsSalt = withGarbleHash[:]
withGarbleHash := addGarbleToHash(salt)
salt = withGarbleHash[:]
}
return hashWithCustomSalt(fieldsSalt, fieldName)
return hashWithCustomSalt(salt, field.Name())
}

// minHashLength and maxHashLength define the range for the number of base64
Expand Down
2 changes: 1 addition & 1 deletion main.go
Original file line number Diff line number Diff line change
Expand Up @@ -2001,7 +2001,7 @@ func (tf *transformer) transformGoFile(file *ast.File) *ast.File {
if strct == nil {
panic("could not find struct for field " + name)
}
node.Name = hashWithStruct(strct, name)
node.Name = hashWithStruct(strct, obj)
if flagDebug { // TODO(mvdan): remove once https://go.dev/issue/53465 if fixed
log.Printf("%s %q hashed with struct fields to %q", debugName, name, node.Name)
}
Expand Down
2 changes: 1 addition & 1 deletion reverse.go
Original file line number Diff line number Diff line change
Expand Up @@ -106,7 +106,7 @@ One can reverse a captured panic stack trace as follows:
if strct == nil {
panic("could not find struct for field " + name.Name)
}
replaces = append(replaces, hashWithStruct(strct, name.Name), name.Name)
replaces = append(replaces, hashWithStruct(strct, obj), name.Name)
}

case *ast.CallExpr:
Expand Down
8 changes: 8 additions & 0 deletions testdata/script/implement.txtar
Original file line number Diff line number Diff line change
Expand Up @@ -48,7 +48,9 @@ type StructUnnamed = struct {
Bar struct {
Nested *[]string
}
Named lib3.Named
lib3.StructEmbed
Tagged string // no field tag
}

var _ = lib1.Struct1(lib2.Struct2{})
Expand All @@ -69,7 +71,9 @@ type Struct1 struct {
Bar struct {
Nested *[]string
}
Named lib3.Named
lib3.StructEmbed
Tagged string `json:"tagged1"`
}

-- lib2/lib2.go --
Expand All @@ -82,11 +86,15 @@ type Struct2 struct {
Bar struct {
Nested *[]string
}
Named lib3.Named
lib3.StructEmbed
Tagged string `json:"tagged2"`
}
-- lib3/lib3.go --
package lib3

type Named int

type StructEmbed struct {
Baz any
}
Expand Down

0 comments on commit 4551910

Please sign in to comment.