blob: 95967e8112a7c2050d039568010f9daebbb72987 [file] [log] [blame]
Naveen Sampath04696f72022-06-13 15:19:14 +05301// Copyright 2018 The Go Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style
3// license that can be found in the LICENSE file.
4
5package prototext
6
7import (
8 "fmt"
9 "strconv"
10 "unicode/utf8"
11
12 "google.golang.org/protobuf/encoding/protowire"
13 "google.golang.org/protobuf/internal/encoding/messageset"
14 "google.golang.org/protobuf/internal/encoding/text"
15 "google.golang.org/protobuf/internal/errors"
16 "google.golang.org/protobuf/internal/flags"
17 "google.golang.org/protobuf/internal/genid"
18 "google.golang.org/protobuf/internal/order"
19 "google.golang.org/protobuf/internal/pragma"
20 "google.golang.org/protobuf/internal/strs"
21 "google.golang.org/protobuf/proto"
22 "google.golang.org/protobuf/reflect/protoreflect"
Naveen Sampath04696f72022-06-13 15:19:14 +053023 "google.golang.org/protobuf/reflect/protoregistry"
24)
25
26const defaultIndent = " "
27
28// Format formats the message as a multiline string.
29// This function is only intended for human consumption and ignores errors.
30// Do not depend on the output being stable. It may change over time across
31// different versions of the program.
32func Format(m proto.Message) string {
33 return MarshalOptions{Multiline: true}.Format(m)
34}
35
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +053036// Marshal writes the given [proto.Message] in textproto format using default
Naveen Sampath04696f72022-06-13 15:19:14 +053037// options. Do not depend on the output being stable. It may change over time
38// across different versions of the program.
39func Marshal(m proto.Message) ([]byte, error) {
40 return MarshalOptions{}.Marshal(m)
41}
42
43// MarshalOptions is a configurable text format marshaler.
44type MarshalOptions struct {
45 pragma.NoUnkeyedLiterals
46
47 // Multiline specifies whether the marshaler should format the output in
48 // indented-form with every textual element on a new line.
49 // If Indent is an empty string, then an arbitrary indent is chosen.
50 Multiline bool
51
52 // Indent specifies the set of indentation characters to use in a multiline
53 // formatted output such that every entry is preceded by Indent and
54 // terminated by a newline. If non-empty, then Multiline is treated as true.
55 // Indent can only be composed of space or tab characters.
56 Indent string
57
58 // EmitASCII specifies whether to format strings and bytes as ASCII only
59 // as opposed to using UTF-8 encoding when possible.
60 EmitASCII bool
61
62 // allowInvalidUTF8 specifies whether to permit the encoding of strings
63 // with invalid UTF-8. This is unexported as it is intended to only
64 // be specified by the Format method.
65 allowInvalidUTF8 bool
66
67 // AllowPartial allows messages that have missing required fields to marshal
68 // without returning an error. If AllowPartial is false (the default),
69 // Marshal will return error if there are any missing required fields.
70 AllowPartial bool
71
72 // EmitUnknown specifies whether to emit unknown fields in the output.
73 // If specified, the unmarshaler may be unable to parse the output.
74 // The default is to exclude unknown fields.
75 EmitUnknown bool
76
77 // Resolver is used for looking up types when expanding google.protobuf.Any
78 // messages. If nil, this defaults to using protoregistry.GlobalTypes.
79 Resolver interface {
80 protoregistry.ExtensionTypeResolver
81 protoregistry.MessageTypeResolver
82 }
83}
84
85// Format formats the message as a string.
86// This method is only intended for human consumption and ignores errors.
87// Do not depend on the output being stable. It may change over time across
88// different versions of the program.
89func (o MarshalOptions) Format(m proto.Message) string {
90 if m == nil || !m.ProtoReflect().IsValid() {
91 return "<nil>" // invalid syntax, but okay since this is for debugging
92 }
93 o.allowInvalidUTF8 = true
94 o.AllowPartial = true
95 o.EmitUnknown = true
96 b, _ := o.Marshal(m)
97 return string(b)
98}
99
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530100// Marshal writes the given [proto.Message] in textproto format using options in
Naveen Sampath04696f72022-06-13 15:19:14 +0530101// MarshalOptions object. Do not depend on the output being stable. It may
102// change over time across different versions of the program.
103func (o MarshalOptions) Marshal(m proto.Message) ([]byte, error) {
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530104 return o.marshal(nil, m)
105}
106
107// MarshalAppend appends the textproto format encoding of m to b,
108// returning the result.
109func (o MarshalOptions) MarshalAppend(b []byte, m proto.Message) ([]byte, error) {
110 return o.marshal(b, m)
Naveen Sampath04696f72022-06-13 15:19:14 +0530111}
112
113// marshal is a centralized function that all marshal operations go through.
114// For profiling purposes, avoid changing the name of this function or
115// introducing other code paths for marshal that do not go through this.
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530116func (o MarshalOptions) marshal(b []byte, m proto.Message) ([]byte, error) {
Naveen Sampath04696f72022-06-13 15:19:14 +0530117 var delims = [2]byte{'{', '}'}
118
119 if o.Multiline && o.Indent == "" {
120 o.Indent = defaultIndent
121 }
122 if o.Resolver == nil {
123 o.Resolver = protoregistry.GlobalTypes
124 }
125
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530126 internalEnc, err := text.NewEncoder(b, o.Indent, delims, o.EmitASCII)
Naveen Sampath04696f72022-06-13 15:19:14 +0530127 if err != nil {
128 return nil, err
129 }
130
131 // Treat nil message interface as an empty message,
132 // in which case there is nothing to output.
133 if m == nil {
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530134 return b, nil
Naveen Sampath04696f72022-06-13 15:19:14 +0530135 }
136
137 enc := encoder{internalEnc, o}
138 err = enc.marshalMessage(m.ProtoReflect(), false)
139 if err != nil {
140 return nil, err
141 }
142 out := enc.Bytes()
143 if len(o.Indent) > 0 && len(out) > 0 {
144 out = append(out, '\n')
145 }
146 if o.AllowPartial {
147 return out, nil
148 }
149 return out, proto.CheckInitialized(m)
150}
151
152type encoder struct {
153 *text.Encoder
154 opts MarshalOptions
155}
156
157// marshalMessage marshals the given protoreflect.Message.
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530158func (e encoder) marshalMessage(m protoreflect.Message, inclDelims bool) error {
Naveen Sampath04696f72022-06-13 15:19:14 +0530159 messageDesc := m.Descriptor()
160 if !flags.ProtoLegacy && messageset.IsMessageSet(messageDesc) {
161 return errors.New("no support for proto1 MessageSets")
162 }
163
164 if inclDelims {
165 e.StartMessage()
166 defer e.EndMessage()
167 }
168
169 // Handle Any expansion.
170 if messageDesc.FullName() == genid.Any_message_fullname {
171 if e.marshalAny(m) {
172 return nil
173 }
174 // If unable to expand, continue on to marshal Any as a regular message.
175 }
176
177 // Marshal fields.
178 var err error
179 order.RangeFields(m, order.IndexNameFieldOrder, func(fd protoreflect.FieldDescriptor, v protoreflect.Value) bool {
180 if err = e.marshalField(fd.TextName(), v, fd); err != nil {
181 return false
182 }
183 return true
184 })
185 if err != nil {
186 return err
187 }
188
189 // Marshal unknown fields.
190 if e.opts.EmitUnknown {
191 e.marshalUnknown(m.GetUnknown())
192 }
193
194 return nil
195}
196
197// marshalField marshals the given field with protoreflect.Value.
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530198func (e encoder) marshalField(name string, val protoreflect.Value, fd protoreflect.FieldDescriptor) error {
Naveen Sampath04696f72022-06-13 15:19:14 +0530199 switch {
200 case fd.IsList():
201 return e.marshalList(name, val.List(), fd)
202 case fd.IsMap():
203 return e.marshalMap(name, val.Map(), fd)
204 default:
205 e.WriteName(name)
206 return e.marshalSingular(val, fd)
207 }
208}
209
210// marshalSingular marshals the given non-repeated field value. This includes
211// all scalar types, enums, messages, and groups.
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530212func (e encoder) marshalSingular(val protoreflect.Value, fd protoreflect.FieldDescriptor) error {
Naveen Sampath04696f72022-06-13 15:19:14 +0530213 kind := fd.Kind()
214 switch kind {
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530215 case protoreflect.BoolKind:
Naveen Sampath04696f72022-06-13 15:19:14 +0530216 e.WriteBool(val.Bool())
217
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530218 case protoreflect.StringKind:
Naveen Sampath04696f72022-06-13 15:19:14 +0530219 s := val.String()
220 if !e.opts.allowInvalidUTF8 && strs.EnforceUTF8(fd) && !utf8.ValidString(s) {
221 return errors.InvalidUTF8(string(fd.FullName()))
222 }
223 e.WriteString(s)
224
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530225 case protoreflect.Int32Kind, protoreflect.Int64Kind,
226 protoreflect.Sint32Kind, protoreflect.Sint64Kind,
227 protoreflect.Sfixed32Kind, protoreflect.Sfixed64Kind:
Naveen Sampath04696f72022-06-13 15:19:14 +0530228 e.WriteInt(val.Int())
229
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530230 case protoreflect.Uint32Kind, protoreflect.Uint64Kind,
231 protoreflect.Fixed32Kind, protoreflect.Fixed64Kind:
Naveen Sampath04696f72022-06-13 15:19:14 +0530232 e.WriteUint(val.Uint())
233
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530234 case protoreflect.FloatKind:
Naveen Sampath04696f72022-06-13 15:19:14 +0530235 // Encoder.WriteFloat handles the special numbers NaN and infinites.
236 e.WriteFloat(val.Float(), 32)
237
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530238 case protoreflect.DoubleKind:
Naveen Sampath04696f72022-06-13 15:19:14 +0530239 // Encoder.WriteFloat handles the special numbers NaN and infinites.
240 e.WriteFloat(val.Float(), 64)
241
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530242 case protoreflect.BytesKind:
Naveen Sampath04696f72022-06-13 15:19:14 +0530243 e.WriteString(string(val.Bytes()))
244
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530245 case protoreflect.EnumKind:
Naveen Sampath04696f72022-06-13 15:19:14 +0530246 num := val.Enum()
247 if desc := fd.Enum().Values().ByNumber(num); desc != nil {
248 e.WriteLiteral(string(desc.Name()))
249 } else {
250 // Use numeric value if there is no enum description.
251 e.WriteInt(int64(num))
252 }
253
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530254 case protoreflect.MessageKind, protoreflect.GroupKind:
Naveen Sampath04696f72022-06-13 15:19:14 +0530255 return e.marshalMessage(val.Message(), true)
256
257 default:
258 panic(fmt.Sprintf("%v has unknown kind: %v", fd.FullName(), kind))
259 }
260 return nil
261}
262
263// marshalList marshals the given protoreflect.List as multiple name-value fields.
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530264func (e encoder) marshalList(name string, list protoreflect.List, fd protoreflect.FieldDescriptor) error {
Naveen Sampath04696f72022-06-13 15:19:14 +0530265 size := list.Len()
266 for i := 0; i < size; i++ {
267 e.WriteName(name)
268 if err := e.marshalSingular(list.Get(i), fd); err != nil {
269 return err
270 }
271 }
272 return nil
273}
274
275// marshalMap marshals the given protoreflect.Map as multiple name-value fields.
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530276func (e encoder) marshalMap(name string, mmap protoreflect.Map, fd protoreflect.FieldDescriptor) error {
Naveen Sampath04696f72022-06-13 15:19:14 +0530277 var err error
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530278 order.RangeEntries(mmap, order.GenericKeyOrder, func(key protoreflect.MapKey, val protoreflect.Value) bool {
Naveen Sampath04696f72022-06-13 15:19:14 +0530279 e.WriteName(name)
280 e.StartMessage()
281 defer e.EndMessage()
282
283 e.WriteName(string(genid.MapEntry_Key_field_name))
284 err = e.marshalSingular(key.Value(), fd.MapKey())
285 if err != nil {
286 return false
287 }
288
289 e.WriteName(string(genid.MapEntry_Value_field_name))
290 err = e.marshalSingular(val, fd.MapValue())
291 if err != nil {
292 return false
293 }
294 return true
295 })
296 return err
297}
298
299// marshalUnknown parses the given []byte and marshals fields out.
300// This function assumes proper encoding in the given []byte.
301func (e encoder) marshalUnknown(b []byte) {
302 const dec = 10
303 const hex = 16
304 for len(b) > 0 {
305 num, wtype, n := protowire.ConsumeTag(b)
306 b = b[n:]
307 e.WriteName(strconv.FormatInt(int64(num), dec))
308
309 switch wtype {
310 case protowire.VarintType:
311 var v uint64
312 v, n = protowire.ConsumeVarint(b)
313 e.WriteUint(v)
314 case protowire.Fixed32Type:
315 var v uint32
316 v, n = protowire.ConsumeFixed32(b)
317 e.WriteLiteral("0x" + strconv.FormatUint(uint64(v), hex))
318 case protowire.Fixed64Type:
319 var v uint64
320 v, n = protowire.ConsumeFixed64(b)
321 e.WriteLiteral("0x" + strconv.FormatUint(v, hex))
322 case protowire.BytesType:
323 var v []byte
324 v, n = protowire.ConsumeBytes(b)
325 e.WriteString(string(v))
326 case protowire.StartGroupType:
327 e.StartMessage()
328 var v []byte
329 v, n = protowire.ConsumeGroup(num, b)
330 e.marshalUnknown(v)
331 e.EndMessage()
332 default:
333 panic(fmt.Sprintf("prototext: error parsing unknown field wire type: %v", wtype))
334 }
335
336 b = b[n:]
337 }
338}
339
340// marshalAny marshals the given google.protobuf.Any message in expanded form.
341// It returns true if it was able to marshal, else false.
Akash Reddy Kankanala105581b2024-09-11 05:20:38 +0530342func (e encoder) marshalAny(any protoreflect.Message) bool {
Naveen Sampath04696f72022-06-13 15:19:14 +0530343 // Construct the embedded message.
344 fds := any.Descriptor().Fields()
345 fdType := fds.ByNumber(genid.Any_TypeUrl_field_number)
346 typeURL := any.Get(fdType).String()
347 mt, err := e.opts.Resolver.FindMessageByURL(typeURL)
348 if err != nil {
349 return false
350 }
351 m := mt.New().Interface()
352
353 // Unmarshal bytes into embedded message.
354 fdValue := fds.ByNumber(genid.Any_Value_field_number)
355 value := any.Get(fdValue)
356 err = proto.UnmarshalOptions{
357 AllowPartial: true,
358 Resolver: e.opts.Resolver,
359 }.Unmarshal(value.Bytes(), m)
360 if err != nil {
361 return false
362 }
363
364 // Get current encoder position. If marshaling fails, reset encoder output
365 // back to this position.
366 pos := e.Snapshot()
367
368 // Field name is the proto field name enclosed in [].
369 e.WriteName("[" + typeURL + "]")
370 err = e.marshalMessage(m.ProtoReflect(), true)
371 if err != nil {
372 e.Reset(pos)
373 return false
374 }
375 return true
376}