forked from admpub/confl
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathencode.go
701 lines (661 loc) · 17.9 KB
/
encode.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
package confl
import (
"bufio"
"bytes"
"errors"
"fmt"
"io"
"reflect"
"regexp"
"sort"
"strconv"
"strings"
"time"
)
type encodeError struct{ error }
var (
KeyEqElement = ":"
errArrayMixedElementTypes = errors.New("can't encode array with mixed element types")
errArrayNilElement = errors.New("can't encode array with nil element")
errNonString = errors.New("can't encode a map with non-string key type")
errAnonNonStruct = errors.New("can't encode an anonymous field that is not a struct")
errArrayNoTable = errors.New("array element can't contain a table")
errNoKey = errors.New("top-level values must be a Go map or struct")
errAnything = errors.New("") // used in testing
quotedReplacer = strings.NewReplacer(
"\t", `\t`,
"\n", `\n`,
"\r", `\r`,
`"`, `\"`,
)
reNeedQuoted = regexp.MustCompile(`[\s:=]`)
)
// SafeKey key
func SafeKey(key string) string {
if reNeedQuoted.MatchString(key) {
if !strings.Contains(key, `"`) {
key = `"` + key + `"`
} else if !strings.Contains(key, `'`) {
key = `'` + key + `'`
} else {
key = fmt.Sprintf(`"%q"`, key)
}
}
return key
}
// Marshal a go struct into bytes
func Marshal(v interface{}) ([]byte, error) {
buf := bytes.Buffer{}
enc := NewEncoder(&buf)
err := enc.Encode(v)
if err != nil {
return nil, err
}
return buf.Bytes(), nil
}
// Encoder controls the encoding of Go values to a document to some
// io.Writer.
//
// The indentation level can be controlled with the Indent field.
type Encoder struct {
// A single indentation level. By default it is two spaces.
Indent string
// hasWritten is whether we have written any output to w yet.
hasWritten bool
w *bufio.Writer
KeyEqElement string
}
// NewEncoder returns a encoder that encodes Go values to the io.Writer
// given. By default, a single indentation level is 2 spaces.
func NewEncoder(w io.Writer) *Encoder {
return &Encoder{
w: bufio.NewWriter(w),
Indent: " ",
KeyEqElement: KeyEqElement,
}
}
// Encode writes a representation of the Go value to the underlying
// io.Writer. If the value given cannot be encoded to a valid document,
// then an error is returned.
//
// The mapping between Go values and values should be precisely the same
// as for the Decode* functions. Similarly, the TextMarshaler interface is
// supported by encoding the resulting bytes as strings. (If you want to write
// arbitrary binary data then you will need to use something like base64 since
// does not have any binary types.)
//
// When encoding hashes (i.e., Go maps or structs), keys without any
// sub-hashes are encoded first.
//
// If a Go map is encoded, then its keys are sorted alphabetically for
// deterministic output. More control over this behavior may be provided if
// there is demand for it.
//
// Encoding Go values without a corresponding representation---like map
// types with non-string keys---will cause an error to be returned. Similarly
// for mixed arrays/slices, arrays/slices with nil elements, embedded
// non-struct types and nested slices containing maps or structs.
// (e.g., [][]map[string]string is not allowed but []map[string]string is OK
// and so is []map[string][]string.)
func (enc *Encoder) Encode(v interface{}) error {
rv := eindirect(reflect.ValueOf(v))
if err := enc.safeEncode(Key([]string{}), rv); err != nil {
return err
}
return enc.w.Flush()
}
func (enc *Encoder) safeEncode(key Key, rv reflect.Value) (err error) {
defer func() {
if r := recover(); r != nil {
if terr, ok := r.(encodeError); ok {
err = terr.error
return
}
panic(r)
}
}()
enc.encode(key, rv)
return nil
}
func (enc *Encoder) encode(key Key, rv reflect.Value) {
// Special case. Time needs to be in ISO8601 format.
// Special case. If we can marshal the type to text, then we used that.
// Basically, this prevents the encoder for handling these types as
// generic structs (or whatever the underlying type of a TextMarshaler is).
switch rv.Interface().(type) {
case time.Time, TextMarshaler:
enc.keyEqElement(key, rv)
return
}
k := rv.Kind()
switch k {
case reflect.Int, reflect.Int8, reflect.Int16, reflect.Int32, reflect.Int64,
reflect.Uint, reflect.Uint8, reflect.Uint16, reflect.Uint32,
reflect.Uint64,
reflect.Float32, reflect.Float64, reflect.String, reflect.Bool:
enc.keyEqElement(key, rv)
case reflect.Array, reflect.Slice:
if typeEqual(confArrayHash, confTypeOfGo(rv)) {
enc.eArrayOfTables(key, rv)
} else {
enc.keyEqElement(key, rv)
}
case reflect.Interface:
if rv.IsNil() {
return
}
enc.encode(key, rv.Elem())
case reflect.Map:
if rv.IsNil() {
return
}
enc.eTable(key, rv)
case reflect.Ptr:
if rv.IsNil() {
return
}
enc.encode(key, rv.Elem())
case reflect.Struct:
enc.eTable(key, rv)
default:
panic(e("Unsupported type for key '%s': %s", key, k))
}
}
// eElement encodes any value that can be an array element (primitives and
// arrays).
func (enc *Encoder) eElement(rv reflect.Value) {
switch v := rv.Interface().(type) {
case time.Time:
// Special case time.Time as a primitive. Has to come before
// TextMarshaler below because time.Time implements
// encoding.TextMarshaler, but we need to always use UTC.
enc.wf(v.In(time.FixedZone("UTC", 0)).Format("2006-01-02T15:04:05Z"))
return
case TextMarshaler:
// Special case. Use text marshaler if it's available for this value.
if s, err := v.MarshalText(); err != nil {
encPanic(err)
} else {
enc.writeQuoted(string(s))
}
return
}
switch rv.Kind() {
case reflect.Bool:
enc.wf(strconv.FormatBool(rv.Bool()))
case reflect.Int, reflect.Int8, reflect.Int16, reflect.Int32, reflect.Int64:
enc.wf(strconv.FormatInt(rv.Int(), 10))
case reflect.Uint, reflect.Uint8, reflect.Uint16,
reflect.Uint32, reflect.Uint64:
enc.wf(strconv.FormatUint(rv.Uint(), 10))
case reflect.Float32:
enc.wf(floatAddDecimal(strconv.FormatFloat(rv.Float(), 'f', -1, 32)))
case reflect.Float64:
enc.wf(floatAddDecimal(strconv.FormatFloat(rv.Float(), 'f', -1, 64)))
case reflect.Array, reflect.Slice:
enc.eArrayOrSliceElement(rv)
case reflect.Interface:
enc.eElement(rv.Elem())
case reflect.String:
enc.writeQuoted(rv.String())
default:
panic(e("Unexpected primitive type: %s", rv.Kind()))
}
}
// all floats must have a decimal with at least one number on either side.
func floatAddDecimal(fstr string) string {
if !strings.Contains(fstr, ".") {
return fstr + ".0"
}
return fstr
}
func (enc *Encoder) writeQuoted(s string) {
switch {
case strings.Contains(s, "\n"):
switch {
case !strings.HasPrefix(s, `"`) && !strings.HasSuffix(s, `"`) && !strings.Contains(s, `"""`):
enc.wf(`"""%s"""`, s)
case !strings.HasPrefix(s, `'`) && !strings.HasSuffix(s, `'`) && !strings.Contains(s, `'''`):
enc.wf(`'''%s'''`, s)
default:
enc.wf("(")
enc.newline()
for idx, row := range strings.Split(s, "\n") {
if idx > 0 {
enc.wf("\n")
}
enc.wf("\t" + row)
}
enc.newline()
enc.wf(")")
enc.newline()
}
case strings.Contains(s, `"`):
switch {
case !strings.Contains(s, `'`):
enc.wf(`'%s'`, s)
case !strings.HasPrefix(s, `"`) && !strings.HasSuffix(s, `"`) && !strings.Contains(s, `"""`):
enc.wf(`"""%s"""`, s)
case !strings.HasPrefix(s, `'`) && !strings.HasSuffix(s, `'`) && !strings.Contains(s, `'''`):
enc.wf(`'''%s'''`, s)
default:
enc.wf(`"%s"`, quotedReplacer.Replace(s))
}
default:
enc.wf(`"%s"`, quotedReplacer.Replace(s))
}
}
func (enc *Encoder) eArrayOrSliceElement(rv reflect.Value) {
length := rv.Len()
enc.wf("[")
for i := 0; i < length; i++ {
elem := rv.Index(i)
enc.eElement(elem)
if i != length-1 {
enc.wf(", ")
}
}
enc.wf("]")
}
func (enc *Encoder) eArrayOfTables(key Key, rv reflect.Value) {
if len(key) == 0 {
encPanic(errNoKey)
}
panicIfInvalidKey(key, true)
//enc.newline()
newKey := key.insert("_")
keyDelta := 0
enc.wf("%s%s "+enc.KeyEqElement+" [", enc.indentStrDelta(key, -1), SafeKey(key[len(key)-1]))
for i := 0; i < rv.Len(); i++ {
trv := rv.Index(i)
if isNil(trv) {
continue
}
enc.newline()
enc.wf("%s{", enc.indentStrDelta(key, keyDelta))
enc.newline()
//enc.wf("%s{\n%s", enc.indentStr(key), key.String())
//enc.newline()
enc.eMapOrStruct(newKey, trv)
//enc.newline()
if i == rv.Len()-1 {
enc.wf("%s}", enc.indentStrDelta(key, keyDelta))
} else {
enc.wf("%s},", enc.indentStrDelta(key, keyDelta))
}
}
enc.newline()
enc.wf("%s]", enc.indentStrDelta(key, -1))
enc.newline()
}
func (enc *Encoder) eTable(key Key, rv reflect.Value) {
if len(key) == 1 {
// Output an extra new line between top-level tables.
// (The newline isn't written if nothing else has been written though.)
//enc.newline()
}
if len(key) > 0 {
panicIfInvalidKey(key, true)
enc.wf("%s%s {", enc.indentStrDelta(key, -1), key[len(key)-1])
enc.newline()
}
enc.eMapOrStruct(key, rv)
if len(key) > 0 {
enc.wf("%s}", enc.indentStrDelta(key, -1))
enc.newline()
}
}
func (enc *Encoder) eMapOrStruct(key Key, rv reflect.Value) {
switch rv := eindirect(rv); rv.Kind() {
case reflect.Map:
enc.eMap(key, rv)
case reflect.Struct:
enc.eStruct(key, rv)
default:
panic("eTable: unhandled reflect.Value Kind: " + rv.Kind().String())
}
}
func (enc *Encoder) eMap(key Key, rv reflect.Value) {
rt := rv.Type()
var convert func(string) (interface{}, error)
switch rt.Key().Kind() {
case reflect.String:
case reflect.Int:
convert = func(key string) (interface{}, error) {
return strconv.Atoi(key)
}
case reflect.Int16:
convert = func(key string) (interface{}, error) {
r, e := strconv.ParseInt(key, 10, 16)
return int16(r), e
}
case reflect.Int32:
convert = func(key string) (interface{}, error) {
r, e := strconv.ParseInt(key, 10, 32)
return int32(r), e
}
case reflect.Int64:
convert = func(key string) (interface{}, error) {
return strconv.ParseInt(key, 10, 64)
}
case reflect.Uint:
convert = func(key string) (interface{}, error) {
r, e := strconv.Atoi(key)
return uint(r), e
}
case reflect.Uint16:
convert = func(key string) (interface{}, error) {
r, e := strconv.ParseUint(key, 10, 16)
return uint16(r), e
}
case reflect.Uint32:
convert = func(key string) (interface{}, error) {
r, e := strconv.ParseUint(key, 10, 32)
return uint32(r), e
}
case reflect.Uint64:
convert = func(key string) (interface{}, error) {
return strconv.ParseUint(key, 10, 64)
}
default:
encPanic(errNonString)
}
// Sort keys so that we have deterministic output. And write keys directly
// underneath this key first, before writing sub-structs or sub-maps.
var mapKeysDirect, mapKeysSub []string
for _, mapKey := range rv.MapKeys() {
//k := mapKey.String()
k := fmt.Sprint(mapKey.Interface())
if typeIsHash(confTypeOfGo(rv.MapIndex(mapKey))) {
mapKeysSub = append(mapKeysSub, k)
} else {
mapKeysDirect = append(mapKeysDirect, k)
}
}
var writeMapKeys = func(mapKeys []string) {
sort.Strings(mapKeys)
for _, mapKey := range mapKeys {
var v interface{}
if convert != nil {
var e error
v, e = convert(mapKey)
if e != nil {
encPanic(e)
}
} else {
v = mapKey
}
mrv := rv.MapIndex(reflect.ValueOf(v))
if isNil(mrv) {
// Don't write anything for nil fields.
continue
}
enc.encode(key.add(mapKey), mrv)
}
}
writeMapKeys(mapKeysDirect)
writeMapKeys(mapKeysSub)
}
func (enc *Encoder) eStruct(key Key, rv reflect.Value) {
// Write keys for fields directly under this key first, because if we write
// a field that creates a new table, then all keys under it will be in that
// table (not the one we're writing here).
rt := rv.Type()
//var fieldsDirect, fieldsSub [][]int
var addFields func(rt reflect.Type, rv reflect.Value)
addFields = func(rt reflect.Type, rv reflect.Value) {
for i := 0; i < rt.NumField(); i++ {
f := rt.Field(i)
// skip unexporded fields
if len(f.PkgPath) > 0 {
continue
}
keyName := f.Tag.Get("confl")
if keyName == "-" {
continue
}
if keyName == "" {
keyName = f.Tag.Get("json")
if keyName == "-" {
continue
}
}
if len(keyName) > 0 {
attrs := strings.SplitN(keyName, `,`, 2)
keyName = attrs[0]
if keyName == "-" {
continue
}
}
frv := rv.Field(i)
if f.Anonymous {
// skip nil field
if !frv.IsValid() {
continue
}
frv = eindirect(frv)
// skip nil field
if !frv.IsValid() {
continue
}
t := frv.Type()
if t.Kind() != reflect.Struct {
encPanic(errAnonNonStruct)
}
addFields(t, frv)
continue
}
if keyName == "" {
keyName = f.Name
}
if keyName != f.Name {
attrs := strings.Split(keyName, `,`)
keyName = attrs[0]
if keyName == "-" {
continue
}
if len(attrs) > 1 {
var omitEmpty bool
for _, attr := range attrs[1:] {
switch attr {
case `omitempty`:
omitEmpty = isZero(frv)
default:
}
}
if omitEmpty {
continue
}
}
}
enc.encode(key.add(keyName), frv)
}
}
addFields(rt, rv)
}
// returns the Confl type name of the Go value's type. It is used to
// determine whether the types of array elements are mixed (which is forbidden).
// If the Go value is nil, then it is illegal for it to be an array element, and
// valueIsNil is returned as true.
// Returns the confl type of a Go value. The type may be `nil`, which means
// no concrete confl type could be found.
func confTypeOfGo(rv reflect.Value) confType {
if isNil(rv) || !rv.IsValid() {
return nil
}
switch rv.Kind() {
case reflect.Bool:
return confBool
case reflect.Int, reflect.Int8, reflect.Int16, reflect.Int32, reflect.Int64,
reflect.Uint, reflect.Uint8, reflect.Uint16, reflect.Uint32,
reflect.Uint64:
return confInteger
case reflect.Float32, reflect.Float64:
return confFloat
case reflect.Array, reflect.Slice:
if typeEqual(confHash, confArrayType(rv)) {
return confArrayHash
}
return confArray
case reflect.Ptr, reflect.Interface:
return confTypeOfGo(rv.Elem())
case reflect.String:
return confString
case reflect.Map:
return confHash
case reflect.Struct:
switch rv.Interface().(type) {
case time.Time:
return confDatetime
case TextMarshaler:
return confString
default:
return confHash
}
default:
panic("unexpected reflect.Kind: " + rv.Kind().String())
}
}
// returns the element type of a array. The type returned
// may be nil if it cannot be determined (e.g., a nil slice or a zero length
// slize). This function may also panic if it finds a type that cannot be
// expressed in (such as nil elements, heterogeneous arrays or directly
// nested arrays of tables).
func confArrayType(rv reflect.Value) confType {
if isNil(rv) || !rv.IsValid() || rv.Len() == 0 {
return nil
}
firstType := confTypeOfGo(rv.Index(0))
if firstType == nil {
encPanic(errArrayNilElement)
}
rvlen := rv.Len()
for i := 1; i < rvlen; i++ {
elem := rv.Index(i)
switch elemType := confTypeOfGo(elem); {
case elemType == nil:
encPanic(errArrayNilElement)
case !typeEqual(firstType, elemType):
encPanic(errArrayMixedElementTypes)
}
}
// If we have a nested array, then we must make sure that the nested
// array contains ONLY primitives.
// This checks arbitrarily nested arrays.
if typeEqual(firstType, confArray) || typeEqual(firstType, confArrayHash) {
nest := confArrayType(eindirect(rv.Index(0)))
if typeEqual(nest, confHash) || typeEqual(nest, confArrayHash) {
encPanic(errArrayNoTable)
}
}
return firstType
}
func (enc *Encoder) newline() {
if enc.hasWritten {
enc.wf("\n")
}
}
func (enc *Encoder) keyEqElement(key Key, val reflect.Value) {
if len(key) == 0 {
encPanic(errNoKey)
}
panicIfInvalidKey(key, false)
enc.wf("%s%s "+enc.KeyEqElement+" ", enc.indentStrDelta(key, -1), SafeKey(key[len(key)-1]))
enc.eElement(val)
enc.newline()
}
func (enc *Encoder) wf(format string, v ...interface{}) {
if _, err := fmt.Fprintf(enc.w, format, v...); err != nil {
encPanic(err)
}
enc.hasWritten = true
}
func (enc *Encoder) indentStr(key Key) string {
return strings.Repeat(enc.Indent, len(key))
}
func (enc *Encoder) indentStrDelta(key Key, delta int) string {
return strings.Repeat(enc.Indent, len(key)+delta)
}
func encPanic(err error) {
panic(encodeError{err})
}
func eindirect(v reflect.Value) reflect.Value {
switch v.Kind() {
case reflect.Ptr, reflect.Interface:
return eindirect(v.Elem())
default:
return v
}
}
func isNil(rv reflect.Value) bool {
switch rv.Kind() {
case reflect.Interface, reflect.Map, reflect.Ptr, reflect.Slice:
return rv.IsNil()
default:
return false
}
}
func panicIfInvalidKey(key Key, hash bool) {
if hash {
for _, k := range key {
if !isValidTableName(k) {
encPanic(e("Key '%s' is not a valid table name. Table names "+
"cannot contain '[', ']' or '.'.", key.String()))
}
}
} else {
if !isValidKeyName(key[len(key)-1]) {
encPanic(e("Key '%s' is not a name. Key names "+
"cannot contain whitespace.", key.String()))
}
}
}
func isValidTableName(s string) bool {
if len(s) == 0 {
return false
}
for _, r := range s {
if r == '[' || r == ']' || r == '.' {
return false
}
}
return true
}
func isValidKeyName(s string) bool {
if len(s) == 0 {
return false
}
return true
}
func isZero(v reflect.Value) bool {
switch v.Kind() {
case reflect.String:
return len(v.String()) == 0
case reflect.Interface, reflect.Ptr:
return v.IsNil()
case reflect.Slice:
return v.Len() == 0
case reflect.Map:
return v.Len() == 0
case reflect.Int, reflect.Int8, reflect.Int16, reflect.Int32, reflect.Int64:
return v.Int() == 0
case reflect.Float32, reflect.Float64:
return v.Float() == 0
case reflect.Uint, reflect.Uint8, reflect.Uint16, reflect.Uint32, reflect.Uint64, reflect.Uintptr:
return v.Uint() == 0
case reflect.Bool:
return !v.Bool()
case reflect.Struct:
vt := v.Type()
for i := v.NumField() - 1; i >= 0; i-- {
if len(vt.Field(i).PkgPath) > 0 {
continue // Private field
}
if !isZero(v.Field(i)) {
return false
}
}
return true
}
return false
}