blob: 0ee738e11b6738a901b552764e2ed0ef5bba7913 [file] [log] [blame]
Jonathan Hart4b110f62020-03-13 17:36:19 -07001package yaml
2
3import (
4 "encoding"
5 "fmt"
6 "io"
7 "reflect"
8 "regexp"
9 "sort"
10 "strconv"
11 "strings"
12 "time"
13 "unicode/utf8"
14)
15
16// jsonNumber is the interface of the encoding/json.Number datatype.
17// Repeating the interface here avoids a dependency on encoding/json, and also
18// supports other libraries like jsoniter, which use a similar datatype with
19// the same interface. Detecting this interface is useful when dealing with
20// structures containing json.Number, which is a string under the hood. The
21// encoder should prefer the use of Int64(), Float64() and string(), in that
22// order, when encoding this type.
23type jsonNumber interface {
24 Float64() (float64, error)
25 Int64() (int64, error)
26 String() string
27}
28
29type encoder struct {
30 emitter yaml_emitter_t
31 event yaml_event_t
32 out []byte
33 flow bool
34 // doneInit holds whether the initial stream_start_event has been
35 // emitted.
36 doneInit bool
37}
38
39func newEncoder() *encoder {
40 e := &encoder{}
41 yaml_emitter_initialize(&e.emitter)
42 yaml_emitter_set_output_string(&e.emitter, &e.out)
43 yaml_emitter_set_unicode(&e.emitter, true)
44 return e
45}
46
47func newEncoderWithWriter(w io.Writer) *encoder {
48 e := &encoder{}
49 yaml_emitter_initialize(&e.emitter)
50 yaml_emitter_set_output_writer(&e.emitter, w)
51 yaml_emitter_set_unicode(&e.emitter, true)
52 return e
53}
54
55func (e *encoder) init() {
56 if e.doneInit {
57 return
58 }
59 yaml_stream_start_event_initialize(&e.event, yaml_UTF8_ENCODING)
60 e.emit()
61 e.doneInit = true
62}
63
64func (e *encoder) finish() {
65 e.emitter.open_ended = false
66 yaml_stream_end_event_initialize(&e.event)
67 e.emit()
68}
69
70func (e *encoder) destroy() {
71 yaml_emitter_delete(&e.emitter)
72}
73
74func (e *encoder) emit() {
75 // This will internally delete the e.event value.
76 e.must(yaml_emitter_emit(&e.emitter, &e.event))
77}
78
79func (e *encoder) must(ok bool) {
80 if !ok {
81 msg := e.emitter.problem
82 if msg == "" {
83 msg = "unknown problem generating YAML content"
84 }
85 failf("%s", msg)
86 }
87}
88
89func (e *encoder) marshalDoc(tag string, in reflect.Value) {
90 e.init()
91 yaml_document_start_event_initialize(&e.event, nil, nil, true)
92 e.emit()
93 e.marshal(tag, in)
94 yaml_document_end_event_initialize(&e.event, true)
95 e.emit()
96}
97
98func (e *encoder) marshal(tag string, in reflect.Value) {
99 if !in.IsValid() || in.Kind() == reflect.Ptr && in.IsNil() {
100 e.nilv()
101 return
102 }
103 iface := in.Interface()
104 switch m := iface.(type) {
105 case jsonNumber:
106 integer, err := m.Int64()
107 if err == nil {
108 // In this case the json.Number is a valid int64
109 in = reflect.ValueOf(integer)
110 break
111 }
112 float, err := m.Float64()
113 if err == nil {
114 // In this case the json.Number is a valid float64
115 in = reflect.ValueOf(float)
116 break
117 }
118 // fallback case - no number could be obtained
119 in = reflect.ValueOf(m.String())
120 case time.Time, *time.Time:
121 // Although time.Time implements TextMarshaler,
122 // we don't want to treat it as a string for YAML
123 // purposes because YAML has special support for
124 // timestamps.
125 case Marshaler:
126 v, err := m.MarshalYAML()
127 if err != nil {
128 fail(err)
129 }
130 if v == nil {
131 e.nilv()
132 return
133 }
134 in = reflect.ValueOf(v)
135 case encoding.TextMarshaler:
136 text, err := m.MarshalText()
137 if err != nil {
138 fail(err)
139 }
140 in = reflect.ValueOf(string(text))
141 case nil:
142 e.nilv()
143 return
144 }
145 switch in.Kind() {
146 case reflect.Interface:
147 e.marshal(tag, in.Elem())
148 case reflect.Map:
149 e.mapv(tag, in)
150 case reflect.Ptr:
151 if in.Type() == ptrTimeType {
152 e.timev(tag, in.Elem())
153 } else {
154 e.marshal(tag, in.Elem())
155 }
156 case reflect.Struct:
157 if in.Type() == timeType {
158 e.timev(tag, in)
159 } else {
160 e.structv(tag, in)
161 }
162 case reflect.Slice, reflect.Array:
163 if in.Type().Elem() == mapItemType {
164 e.itemsv(tag, in)
165 } else {
166 e.slicev(tag, in)
167 }
168 case reflect.String:
169 e.stringv(tag, in)
170 case reflect.Int, reflect.Int8, reflect.Int16, reflect.Int32, reflect.Int64:
171 if in.Type() == durationType {
172 e.stringv(tag, reflect.ValueOf(iface.(time.Duration).String()))
173 } else {
174 e.intv(tag, in)
175 }
176 case reflect.Uint, reflect.Uint8, reflect.Uint16, reflect.Uint32, reflect.Uint64, reflect.Uintptr:
177 e.uintv(tag, in)
178 case reflect.Float32, reflect.Float64:
179 e.floatv(tag, in)
180 case reflect.Bool:
181 e.boolv(tag, in)
182 default:
183 panic("cannot marshal type: " + in.Type().String())
184 }
185}
186
187func (e *encoder) mapv(tag string, in reflect.Value) {
188 e.mappingv(tag, func() {
189 keys := keyList(in.MapKeys())
190 sort.Sort(keys)
191 for _, k := range keys {
192 e.marshal("", k)
193 e.marshal("", in.MapIndex(k))
194 }
195 })
196}
197
198func (e *encoder) itemsv(tag string, in reflect.Value) {
199 e.mappingv(tag, func() {
200 slice := in.Convert(reflect.TypeOf([]MapItem{})).Interface().([]MapItem)
201 for _, item := range slice {
202 e.marshal("", reflect.ValueOf(item.Key))
203 e.marshal("", reflect.ValueOf(item.Value))
204 }
205 })
206}
207
208func (e *encoder) structv(tag string, in reflect.Value) {
209 sinfo, err := getStructInfo(in.Type())
210 if err != nil {
211 panic(err)
212 }
213 e.mappingv(tag, func() {
214 for _, info := range sinfo.FieldsList {
215 var value reflect.Value
216 if info.Inline == nil {
217 value = in.Field(info.Num)
218 } else {
219 value = in.FieldByIndex(info.Inline)
220 }
221 if info.OmitEmpty && isZero(value) {
222 continue
223 }
224 e.marshal("", reflect.ValueOf(info.Key))
225 e.flow = info.Flow
226 e.marshal("", value)
227 }
228 if sinfo.InlineMap >= 0 {
229 m := in.Field(sinfo.InlineMap)
230 if m.Len() > 0 {
231 e.flow = false
232 keys := keyList(m.MapKeys())
233 sort.Sort(keys)
234 for _, k := range keys {
235 if _, found := sinfo.FieldsMap[k.String()]; found {
236 panic(fmt.Sprintf("Can't have key %q in inlined map; conflicts with struct field", k.String()))
237 }
238 e.marshal("", k)
239 e.flow = false
240 e.marshal("", m.MapIndex(k))
241 }
242 }
243 }
244 })
245}
246
247func (e *encoder) mappingv(tag string, f func()) {
248 implicit := tag == ""
249 style := yaml_BLOCK_MAPPING_STYLE
250 if e.flow {
251 e.flow = false
252 style = yaml_FLOW_MAPPING_STYLE
253 }
254 yaml_mapping_start_event_initialize(&e.event, nil, []byte(tag), implicit, style)
255 e.emit()
256 f()
257 yaml_mapping_end_event_initialize(&e.event)
258 e.emit()
259}
260
261func (e *encoder) slicev(tag string, in reflect.Value) {
262 implicit := tag == ""
263 style := yaml_BLOCK_SEQUENCE_STYLE
264 if e.flow {
265 e.flow = false
266 style = yaml_FLOW_SEQUENCE_STYLE
267 }
268 e.must(yaml_sequence_start_event_initialize(&e.event, nil, []byte(tag), implicit, style))
269 e.emit()
270 n := in.Len()
271 for i := 0; i < n; i++ {
272 e.marshal("", in.Index(i))
273 }
274 e.must(yaml_sequence_end_event_initialize(&e.event))
275 e.emit()
276}
277
278// isBase60 returns whether s is in base 60 notation as defined in YAML 1.1.
279//
280// The base 60 float notation in YAML 1.1 is a terrible idea and is unsupported
281// in YAML 1.2 and by this package, but these should be marshalled quoted for
282// the time being for compatibility with other parsers.
283func isBase60Float(s string) (result bool) {
284 // Fast path.
285 if s == "" {
286 return false
287 }
288 c := s[0]
289 if !(c == '+' || c == '-' || c >= '0' && c <= '9') || strings.IndexByte(s, ':') < 0 {
290 return false
291 }
292 // Do the full match.
293 return base60float.MatchString(s)
294}
295
296// From http://yaml.org/type/float.html, except the regular expression there
297// is bogus. In practice parsers do not enforce the "\.[0-9_]*" suffix.
298var base60float = regexp.MustCompile(`^[-+]?[0-9][0-9_]*(?::[0-5]?[0-9])+(?:\.[0-9_]*)?$`)
299
300func (e *encoder) stringv(tag string, in reflect.Value) {
301 var style yaml_scalar_style_t
302 s := in.String()
303 canUsePlain := true
304 switch {
305 case !utf8.ValidString(s):
306 if tag == yaml_BINARY_TAG {
307 failf("explicitly tagged !!binary data must be base64-encoded")
308 }
309 if tag != "" {
310 failf("cannot marshal invalid UTF-8 data as %s", shortTag(tag))
311 }
312 // It can't be encoded directly as YAML so use a binary tag
313 // and encode it as base64.
314 tag = yaml_BINARY_TAG
315 s = encodeBase64(s)
316 case tag == "":
317 // Check to see if it would resolve to a specific
318 // tag when encoded unquoted. If it doesn't,
319 // there's no need to quote it.
320 rtag, _ := resolve("", s)
321 canUsePlain = rtag == yaml_STR_TAG && !isBase60Float(s)
322 }
323 // Note: it's possible for user code to emit invalid YAML
324 // if they explicitly specify a tag and a string containing
325 // text that's incompatible with that tag.
326 switch {
327 case strings.Contains(s, "\n"):
328 style = yaml_LITERAL_SCALAR_STYLE
329 case canUsePlain:
330 style = yaml_PLAIN_SCALAR_STYLE
331 default:
332 style = yaml_DOUBLE_QUOTED_SCALAR_STYLE
333 }
334 e.emitScalar(s, "", tag, style)
335}
336
337func (e *encoder) boolv(tag string, in reflect.Value) {
338 var s string
339 if in.Bool() {
340 s = "true"
341 } else {
342 s = "false"
343 }
344 e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
345}
346
347func (e *encoder) intv(tag string, in reflect.Value) {
348 s := strconv.FormatInt(in.Int(), 10)
349 e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
350}
351
352func (e *encoder) uintv(tag string, in reflect.Value) {
353 s := strconv.FormatUint(in.Uint(), 10)
354 e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
355}
356
357func (e *encoder) timev(tag string, in reflect.Value) {
358 t := in.Interface().(time.Time)
359 s := t.Format(time.RFC3339Nano)
360 e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
361}
362
363func (e *encoder) floatv(tag string, in reflect.Value) {
364 // Issue #352: When formatting, use the precision of the underlying value
365 precision := 64
366 if in.Kind() == reflect.Float32 {
367 precision = 32
368 }
369
370 s := strconv.FormatFloat(in.Float(), 'g', -1, precision)
371 switch s {
372 case "+Inf":
373 s = ".inf"
374 case "-Inf":
375 s = "-.inf"
376 case "NaN":
377 s = ".nan"
378 }
379 e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
380}
381
382func (e *encoder) nilv() {
383 e.emitScalar("null", "", "", yaml_PLAIN_SCALAR_STYLE)
384}
385
386func (e *encoder) emitScalar(value, anchor, tag string, style yaml_scalar_style_t) {
387 implicit := tag == ""
388 e.must(yaml_scalar_event_initialize(&e.event, []byte(anchor), []byte(tag), []byte(value), implicit, implicit, style))
389 e.emit()
390}