zclconf · apparentlymart · Aug 24, 2023 · Aug 24, 2023 · Aug 24, 2023 · kmoe
diff --git a/cty/ctystrings/prefix.go b/cty/ctystrings/prefix.go
@@ -26,10 +26,6 @@ import (
 // application can guarantee that the remainder of the string will not begin
 // with combining marks then it is safe to instead just normalize the prefix
 // string with [Normalize].
-//
-// Note that this function only takes into account normalization boundaries
-// and does _not_ take into account grapheme cluster boundaries as defined
-// by Unicode Standard Annex #29.
 func SafeKnownPrefix(prefix string) string {
 	prefix = Normalize(prefix)
 

diff --git a/cty/msgpack/roundtrip_test.go b/cty/msgpack/roundtrip_test.go
@@ -2,6 +2,7 @@ package msgpack
 
 import (
 	"fmt"
+	"strings"
 	"testing"
 
 	"github.com/zclconf/go-cty/cty"
@@ -50,7 +51,6 @@ func TestRoundTrip(t *testing.T) {
 			cty.UnknownVal(cty.String).Refine().NotNull().StringPrefix("foo-").NewValue(),
 			cty.String,
 		},
-
 		{
 			cty.True,
 			cty.Bool,
@@ -350,3 +350,58 @@ func TestRoundTrip(t *testing.T) {
 		})
 	}
 }
+
+// Unknown values with very long string prefix refinements do not round-trip
+// losslessly. When marshaled, a prefix longer than 256 bytes is cut to its
+// first 255 bytes and then passed through ctystrings.SafeKnownPrefix.
+func TestRoundTrip_truncatesStringPrefixRefinement(t *testing.T) {
+	cases := []struct {
+		in   cty.Value // value handed to Marshal
+		ty   cty.Type  // type constraint for Marshal and Unmarshal
+		want cty.Value // value expected back from Unmarshal
+	}{
+		{
+			in:   cty.UnknownVal(cty.String).Refine().StringPrefix(strings.Repeat("a", 1024)).NewValue(),
+			ty:   cty.String,
+			want: cty.UnknownVal(cty.String).Refine().StringPrefix(strings.Repeat("a", 255)).NewValue(),
+		},
+		{
+			in:   cty.UnknownVal(cty.String).Refine().NotNull().StringPrefix(strings.Repeat("b", 1024)).NewValue(),
+			ty:   cty.String,
+			want: cty.UnknownVal(cty.String).Refine().NotNull().StringPrefix(strings.Repeat("b", 255)).NewValue(),
+		},
+		{
+			in:   cty.UnknownVal(cty.String).Refine().StringPrefix(strings.Repeat("c", 255) + "-").NewValue(),
+			ty:   cty.String,
+			want: cty.UnknownVal(cty.String).Refine().StringPrefix(strings.Repeat("c", 255) + "-").NewValue(),
+		},
+		{
+			in:   cty.UnknownVal(cty.String).Refine().StringPrefix(strings.Repeat("d", 255) + "🤷🤷").NewValue(),
+			ty:   cty.String,
+			want: cty.UnknownVal(cty.String).Refine().StringPrefix(strings.Repeat("d", 255)).NewValue(),
+		},
+	}
+
+	// Each case is marshaled, unmarshaled, and compared against its want value.
+	for _, tc := range cases {
+		name := fmt.Sprintf("%#v as %#v", tc.in, tc.ty)
+		t.Run(name, func(t *testing.T) {
+			encoded, err := Marshal(tc.in, tc.ty)
+			if err != nil {
+				t.Fatal(err)
+			}
+			t.Logf("encoded as %x", encoded)
+
+			decoded, err := Unmarshal(encoded, tc.ty)
+			if err != nil {
+				t.Fatal(err)
+			}
+			if decoded.RawEquals(tc.want) {
+				return
+			}
+			t.Errorf(
+				"unexpected value after round-trip\ninput:  %#v\nexpect: %#v\nresult: %#v",
+				tc.in, tc.want, decoded)
+		})
+	}
+}
diff --git a/cty/msgpack/unknown.go b/cty/msgpack/unknown.go
@@ -8,6 +8,7 @@ import (
 
 	"github.com/vmihailenco/msgpack/v5"
 	"github.com/zclconf/go-cty/cty"
+	"github.com/zclconf/go-cty/cty/ctystrings"
 )
 
 type unknownType struct{}
@@ -85,6 +86,16 @@ func marshalUnknownValue(rng cty.ValueRange, path cty.Path, enc *msgpack.Encoder
 		}
 	case rng.TypeConstraint() == cty.String:
 		if prefix := rng.StringPrefix(); prefix != "" {
+			// To ensure the total size of the refinements blob does not exceed
+			// the limit set by our decoder, cut any prefix longer than 256 bytes
+			// down to its first 255 bytes. We could allow up to 1018 bytes if
+			// we assumed this refinement is only ever combined with NotNull(),
+			// but there is no need for such long prefix refinements at the moment.
+			maxPrefixLength := 256
+			if len(prefix) > maxPrefixLength {
+				prefix = prefix[:maxPrefixLength-1]
+				prefix = ctystrings.SafeKnownPrefix(prefix)
+			}
 			mapLen++
 			refnEnc.EncodeInt(int64(unknownValStringPrefix))
 			refnEnc.EncodeString(prefix)