hypertrace · prodion23 · May 9, 2024 · Apr 26, 2024 · Apr 26, 2024 · May 1, 2024
diff --git a/sdk/instrumentation/bodyattribute/bodyattribute.go b/sdk/instrumentation/bodyattribute/bodyattribute.go
@@ -3,10 +3,14 @@ package bodyattribute // import "github.com/hypertrace/goagent/sdk/instrumentati
 import (
 	"encoding/base64"
 	"fmt"
+	"strings"
+	"unicode/utf8"
 
 	"github.com/hypertrace/goagent/sdk"
 )
 
+const utf8Replacement = "�"
+
 // SetTruncatedBodyAttribute truncates the body and sets the body as a span attribute.
 // When body is being truncated, we also add a second attribute suffixed by `.truncated` to
 // make it clear to the user, body has been modified.
@@ -48,7 +52,12 @@ func SetBodyAttribute(attrName string, body []byte, truncated bool, span sdk.Spa
 		return
 	}
 
-	span.SetAttribute(attrName, string(body))
+	bodyStr := string(body)
+	if !utf8.ValidString(bodyStr) {
+		bodyStr = strings.ToValidUTF8(bodyStr, utf8Replacement)
+	}
+
+	span.SetAttribute(attrName, bodyStr)
 	// if already truncated then set attribute
 	if truncated {
 		span.SetAttribute(fmt.Sprintf("%s.truncated", attrName), true)
@@ -63,7 +72,12 @@ func SetEncodedBodyAttribute(attrName string, body []byte, truncated bool, span
 		return
 	}
 
-	span.SetAttribute(attrName+".base64", base64.RawStdEncoding.EncodeToString(body))
+	bodyStr := string(body)
+	if !utf8.ValidString(bodyStr) {
+		bodyStr = strings.ToValidUTF8(bodyStr, utf8Replacement)
+	}
+
+	span.SetAttribute(attrName+".base64", base64.RawStdEncoding.EncodeToString([]byte(bodyStr)))
 	// if already truncated then set attribute
 	if truncated {
 		span.SetAttribute(fmt.Sprintf("%s.truncated", attrName), true)

diff --git a/sdk/instrumentation/bodyattribute/bodyattribute_test.go b/sdk/instrumentation/bodyattribute/bodyattribute_test.go
@@ -199,3 +199,21 @@ func TestSetEncodedBodyAttribute(t *testing.T) {
 		})
 	}
 }
+
+// TestSetBodyWithoutUtf8 checks that SetBodyAttribute replaces a run of invalid UTF-8 bytes before setting the attribute.
+func TestSetBodyWithoutUtf8(t *testing.T) {
+	span := mock.NewSpan()
+	SetBodyAttribute("http.request.body", []byte("hello \xff\xfe\xfd"), false, span) // 0xff 0xfe 0xfd are not valid UTF-8
+	value := span.ReadAttribute("http.request.body")
+	assert.Equal(t, "hello �", value) // expected first; no type assertion, so a missing attribute fails instead of panicking
+}
+
+// TestSetB64BodyWithoutUtf8 checks that SetEncodedBodyAttribute replaces invalid UTF-8 bytes before base64-encoding the body.
+func TestSetB64BodyWithoutUtf8(t *testing.T) {
+	span := mock.NewSpan()
+	SetEncodedBodyAttribute("http.request.body", []byte("hello \xff\xfe\xfd"), false, span) // 0xff 0xfe 0xfd are not valid UTF-8
+	value := span.ReadAttribute("http.request.body.base64")
+	decodedBytes, err := base64.RawStdEncoding.DecodeString(value.(string)) // unpadded, same encoding the attribute is written with
+	assert.NoError(t, err)
+	assert.Equal(t, "hello �", string(decodedBytes))
+}