1package yaml
2
3import (
4	"encoding"
5	"fmt"
6	"io"
7	"reflect"
8	"regexp"
9	"sort"
10	"strconv"
11	"strings"
12	"time"
13	"unicode/utf8"
14)
15
16// jsonNumber is the interface of the encoding/json.Number datatype.
17// Repeating the interface here avoids a dependency on encoding/json, and also
18// supports other libraries like jsoniter, which use a similar datatype with
19// the same interface. Detecting this interface is useful when dealing with
20// structures containing json.Number, which is a string under the hood. The
21// encoder should prefer the use of Int64(), Float64() and string(), in that
22// order, when encoding this type.
23type jsonNumber interface {
24	Float64() (float64, error)
25	Int64() (int64, error)
26	String() string
27}
28
29type encoder struct {
30	emitter yaml_emitter_t
31	event   yaml_event_t
32	out     []byte
33	flow    bool
34	// doneInit holds whether the initial stream_start_event has been
35	// emitted.
36	doneInit bool
37}
38
39func newEncoder() *encoder {
40	e := &encoder{}
41	yaml_emitter_initialize(&e.emitter)
42	yaml_emitter_set_output_string(&e.emitter, &e.out)
43	yaml_emitter_set_unicode(&e.emitter, true)
44	return e
45}
46
47func newEncoderWithWriter(w io.Writer) *encoder {
48	e := &encoder{}
49	yaml_emitter_initialize(&e.emitter)
50	yaml_emitter_set_output_writer(&e.emitter, w)
51	yaml_emitter_set_unicode(&e.emitter, true)
52	return e
53}
54
55func (e *encoder) init() {
56	if e.doneInit {
57		return
58	}
59	yaml_stream_start_event_initialize(&e.event, yaml_UTF8_ENCODING)
60	e.emit()
61	e.doneInit = true
62}
63
64func (e *encoder) finish() {
65	e.emitter.open_ended = false
66	yaml_stream_end_event_initialize(&e.event)
67	e.emit()
68}
69
70func (e *encoder) destroy() {
71	yaml_emitter_delete(&e.emitter)
72}
73
74func (e *encoder) emit() {
75	// This will internally delete the e.event value.
76	e.must(yaml_emitter_emit(&e.emitter, &e.event))
77}
78
79func (e *encoder) must(ok bool) {
80	if !ok {
81		msg := e.emitter.problem
82		if msg == "" {
83			msg = "unknown problem generating YAML content"
84		}
85		failf("%s", msg)
86	}
87}
88
89func (e *encoder) marshalDoc(tag string, in reflect.Value) {
90	e.init()
91	yaml_document_start_event_initialize(&e.event, nil, nil, true)
92	e.emit()
93	e.marshal(tag, in)
94	yaml_document_end_event_initialize(&e.event, true)
95	e.emit()
96}
97
98func (e *encoder) marshal(tag string, in reflect.Value) {
99	if !in.IsValid() || in.Kind() == reflect.Ptr && in.IsNil() {
100		e.nilv()
101		return
102	}
103	iface := in.Interface()
104	switch m := iface.(type) {
105	case jsonNumber:
106		integer, err := m.Int64()
107		if err == nil {
108			// In this case the json.Number is a valid int64
109			in = reflect.ValueOf(integer)
110			break
111		}
112		float, err := m.Float64()
113		if err == nil {
114			// In this case the json.Number is a valid float64
115			in = reflect.ValueOf(float)
116			break
117		}
118		// fallback case - no number could be obtained
119		in = reflect.ValueOf(m.String())
120	case time.Time, *time.Time:
121		// Although time.Time implements TextMarshaler,
122		// we don't want to treat it as a string for YAML
123		// purposes because YAML has special support for
124		// timestamps.
125	case Marshaler:
126		v, err := m.MarshalYAML()
127		if err != nil {
128			fail(err)
129		}
130		if v == nil {
131			e.nilv()
132			return
133		}
134		in = reflect.ValueOf(v)
135	case encoding.TextMarshaler:
136		text, err := m.MarshalText()
137		if err != nil {
138			fail(err)
139		}
140		in = reflect.ValueOf(string(text))
141	case nil:
142		e.nilv()
143		return
144	}
145	switch in.Kind() {
146	case reflect.Interface:
147		e.marshal(tag, in.Elem())
148	case reflect.Map:
149		e.mapv(tag, in)
150	case reflect.Ptr:
151		if in.Type() == ptrTimeType {
152			e.timev(tag, in.Elem())
153		} else {
154			e.marshal(tag, in.Elem())
155		}
156	case reflect.Struct:
157		if in.Type() == timeType {
158			e.timev(tag, in)
159		} else {
160			e.structv(tag, in)
161		}
162	case reflect.Slice, reflect.Array:
163		if in.Type().Elem() == mapItemType {
164			e.itemsv(tag, in)
165		} else {
166			e.slicev(tag, in)
167		}
168	case reflect.String:
169		e.stringv(tag, in)
170	case reflect.Int, reflect.Int8, reflect.Int16, reflect.Int32, reflect.Int64:
171		if in.Type() == durationType {
172			e.stringv(tag, reflect.ValueOf(iface.(time.Duration).String()))
173		} else {
174			e.intv(tag, in)
175		}
176	case reflect.Uint, reflect.Uint8, reflect.Uint16, reflect.Uint32, reflect.Uint64, reflect.Uintptr:
177		e.uintv(tag, in)
178	case reflect.Float32, reflect.Float64:
179		e.floatv(tag, in)
180	case reflect.Bool:
181		e.boolv(tag, in)
182	default:
183		panic("cannot marshal type: " + in.Type().String())
184	}
185}
186
187func (e *encoder) mapv(tag string, in reflect.Value) {
188	e.mappingv(tag, func() {
189		keys := keyList(in.MapKeys())
190		sort.Sort(keys)
191		for _, k := range keys {
192			e.marshal("", k)
193			e.marshal("", in.MapIndex(k))
194		}
195	})
196}
197
198func (e *encoder) itemsv(tag string, in reflect.Value) {
199	e.mappingv(tag, func() {
200		slice := in.Convert(reflect.TypeOf([]MapItem{})).Interface().([]MapItem)
201		for _, item := range slice {
202			e.marshal("", reflect.ValueOf(item.Key))
203			e.marshal("", reflect.ValueOf(item.Value))
204		}
205	})
206}
207
208func (e *encoder) structv(tag string, in reflect.Value) {
209	sinfo, err := getStructInfo(in.Type())
210	if err != nil {
211		panic(err)
212	}
213	e.mappingv(tag, func() {
214		for _, info := range sinfo.FieldsList {
215			var value reflect.Value
216			if info.Inline == nil {
217				value = in.Field(info.Num)
218			} else {
219				value = in.FieldByIndex(info.Inline)
220			}
221			if info.OmitEmpty && isZero(value) {
222				continue
223			}
224			e.marshal("", reflect.ValueOf(info.Key))
225			e.flow = info.Flow
226			e.marshal("", value)
227		}
228		if sinfo.InlineMap >= 0 {
229			m := in.Field(sinfo.InlineMap)
230			if m.Len() > 0 {
231				e.flow = false
232				keys := keyList(m.MapKeys())
233				sort.Sort(keys)
234				for _, k := range keys {
235					if _, found := sinfo.FieldsMap[k.String()]; found {
236						panic(fmt.Sprintf("Can't have key %q in inlined map; conflicts with struct field", k.String()))
237					}
238					e.marshal("", k)
239					e.flow = false
240					e.marshal("", m.MapIndex(k))
241				}
242			}
243		}
244	})
245}
246
247func (e *encoder) mappingv(tag string, f func()) {
248	implicit := tag == ""
249	style := yaml_BLOCK_MAPPING_STYLE
250	if e.flow {
251		e.flow = false
252		style = yaml_FLOW_MAPPING_STYLE
253	}
254	yaml_mapping_start_event_initialize(&e.event, nil, []byte(tag), implicit, style)
255	e.emit()
256	f()
257	yaml_mapping_end_event_initialize(&e.event)
258	e.emit()
259}
260
261func (e *encoder) slicev(tag string, in reflect.Value) {
262	implicit := tag == ""
263	style := yaml_BLOCK_SEQUENCE_STYLE
264	if e.flow {
265		e.flow = false
266		style = yaml_FLOW_SEQUENCE_STYLE
267	}
268	e.must(yaml_sequence_start_event_initialize(&e.event, nil, []byte(tag), implicit, style))
269	e.emit()
270	n := in.Len()
271	for i := 0; i < n; i++ {
272		e.marshal("", in.Index(i))
273	}
274	e.must(yaml_sequence_end_event_initialize(&e.event))
275	e.emit()
276}
277
278// isBase60 returns whether s is in base 60 notation as defined in YAML 1.1.
279//
280// The base 60 float notation in YAML 1.1 is a terrible idea and is unsupported
281// in YAML 1.2 and by this package, but these should be marshalled quoted for
282// the time being for compatibility with other parsers.
283func isBase60Float(s string) (result bool) {
284	// Fast path.
285	if s == "" {
286		return false
287	}
288	c := s[0]
289	if !(c == '+' || c == '-' || c >= '0' && c <= '9') || strings.IndexByte(s, ':') < 0 {
290		return false
291	}
292	// Do the full match.
293	return base60float.MatchString(s)
294}
295
296// From http://yaml.org/type/float.html, except the regular expression there
297// is bogus. In practice parsers do not enforce the "\.[0-9_]*" suffix.
298var base60float = regexp.MustCompile(`^[-+]?[0-9][0-9_]*(?::[0-5]?[0-9])+(?:\.[0-9_]*)?$`)
299
300func (e *encoder) stringv(tag string, in reflect.Value) {
301	var style yaml_scalar_style_t
302	s := in.String()
303	canUsePlain := true
304	switch {
305	case !utf8.ValidString(s):
306		if tag == yaml_BINARY_TAG {
307			failf("explicitly tagged !!binary data must be base64-encoded")
308		}
309		if tag != "" {
310			failf("cannot marshal invalid UTF-8 data as %s", shortTag(tag))
311		}
312		// It can't be encoded directly as YAML so use a binary tag
313		// and encode it as base64.
314		tag = yaml_BINARY_TAG
315		s = encodeBase64(s)
316	case tag == "":
317		// Check to see if it would resolve to a specific
318		// tag when encoded unquoted. If it doesn't,
319		// there's no need to quote it.
320		rtag, _ := resolve("", s)
321		canUsePlain = rtag == yaml_STR_TAG && !isBase60Float(s)
322	}
323	// Note: it's possible for user code to emit invalid YAML
324	// if they explicitly specify a tag and a string containing
325	// text that's incompatible with that tag.
326	switch {
327	case strings.Contains(s, "\n"):
328		style = yaml_LITERAL_SCALAR_STYLE
329	case canUsePlain:
330		style = yaml_PLAIN_SCALAR_STYLE
331	default:
332		style = yaml_DOUBLE_QUOTED_SCALAR_STYLE
333	}
334	e.emitScalar(s, "", tag, style)
335}
336
337func (e *encoder) boolv(tag string, in reflect.Value) {
338	var s string
339	if in.Bool() {
340		s = "true"
341	} else {
342		s = "false"
343	}
344	e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
345}
346
347func (e *encoder) intv(tag string, in reflect.Value) {
348	s := strconv.FormatInt(in.Int(), 10)
349	e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
350}
351
352func (e *encoder) uintv(tag string, in reflect.Value) {
353	s := strconv.FormatUint(in.Uint(), 10)
354	e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
355}
356
357func (e *encoder) timev(tag string, in reflect.Value) {
358	t := in.Interface().(time.Time)
359	s := t.Format(time.RFC3339Nano)
360	e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
361}
362
363func (e *encoder) floatv(tag string, in reflect.Value) {
364	// Issue #352: When formatting, use the precision of the underlying value
365	precision := 64
366	if in.Kind() == reflect.Float32 {
367		precision = 32
368	}
369
370	s := strconv.FormatFloat(in.Float(), 'g', -1, precision)
371	switch s {
372	case "+Inf":
373		s = ".inf"
374	case "-Inf":
375		s = "-.inf"
376	case "NaN":
377		s = ".nan"
378	}
379	e.emitScalar(s, "", tag, yaml_PLAIN_SCALAR_STYLE)
380}
381
382func (e *encoder) nilv() {
383	e.emitScalar("null", "", "", yaml_PLAIN_SCALAR_STYLE)
384}
385
386func (e *encoder) emitScalar(value, anchor, tag string, style yaml_scalar_style_t) {
387	implicit := tag == ""
388	e.must(yaml_scalar_event_initialize(&e.event, []byte(anchor), []byte(tag), []byte(value), implicit, implicit, style))
389	e.emit()
390}
391