summaryrefslogtreecommitdiff
path: root/vendor/github.com/ugorji/go/codec/json.base.go
diff options
context:
space:
mode:
Diffstat (limited to 'vendor/github.com/ugorji/go/codec/json.base.go')
-rw-r--r--vendor/github.com/ugorji/go/codec/json.base.go504
1 files changed, 504 insertions, 0 deletions
diff --git a/vendor/github.com/ugorji/go/codec/json.base.go b/vendor/github.com/ugorji/go/codec/json.base.go
new file mode 100644
index 000000000..d87403393
--- /dev/null
+++ b/vendor/github.com/ugorji/go/codec/json.base.go
@@ -0,0 +1,504 @@
+// Copyright (c) 2012-2020 Ugorji Nwoke. All rights reserved.
+// Use of this source code is governed by a MIT license found in the LICENSE file.
+
+package codec
+
+import (
+ "encoding/base32"
+ "encoding/base64"
+ "errors"
+ "math"
+ "reflect"
+ "strings"
+ "time"
+ "unicode"
+)
+
+//--------------------------------
+
+// jsonLits and jsonLitb are defined at the package level,
+// so they are guaranteed to be stored efficiently, making
+// for better append/string comparison/etc.
+//
+// (anecdotal evidence from some benchmarking on go 1.20 devel in 20220104)
+const jsonLits = `"true"false"null"{}[]`
+
+const (
+ jsonLitT = 1
+ jsonLitF = 6
+ jsonLitN = 12
+ jsonLitM = 17
+ jsonLitA = 19
+)
+
+var jsonLitb = []byte(jsonLits)
+var jsonNull = jsonLitb[jsonLitN : jsonLitN+4]
+var jsonArrayEmpty = jsonLitb[jsonLitA : jsonLitA+2]
+var jsonMapEmpty = jsonLitb[jsonLitM : jsonLitM+2]
+
+const jsonEncodeUintSmallsString = "" +
+ "00010203040506070809" +
+ "10111213141516171819" +
+ "20212223242526272829" +
+ "30313233343536373839" +
+ "40414243444546474849" +
+ "50515253545556575859" +
+ "60616263646566676869" +
+ "70717273747576777879" +
+ "80818283848586878889" +
+ "90919293949596979899"
+
+var jsonEncodeUintSmallsStringBytes = (*[len(jsonEncodeUintSmallsString)]byte)([]byte(jsonEncodeUintSmallsString))
+
+const (
+ jsonU4Chk2 = '0'
+ jsonU4Chk1 = 'a' - 10
+ jsonU4Chk0 = 'A' - 10
+)
+
+const (
+ // If !jsonValidateSymbols, decoding will be faster, by skipping some checks:
+ // - If we see first character of null, false or true,
+ // do not validate subsequent characters.
+ // - e.g. if we see a n, assume null and skip next 3 characters,
+ // and do not validate they are ull.
+ // P.S. Do not expect a significant decoding boost from this.
+ jsonValidateSymbols = true
+
+ // jsonEscapeMultiByteUnicodeSep controls whether some unicode characters
+ // that are valid json but may bomb in some contexts are escaped during encoeing.
+ //
+ // U+2028 is LINE SEPARATOR. U+2029 is PARAGRAPH SEPARATOR.
+ // Both technically valid JSON, but bomb on JSONP, so fix here unconditionally.
+ jsonEscapeMultiByteUnicodeSep = true
+
+ // jsonNakedBoolNumInQuotedStr is used during decoding into a blank interface{}
+ // to control whether we detect quoted values of bools and null where a map key is expected,
+ // and treat as nil, true or false.
+ jsonNakedBoolNumInQuotedStr = true
+)
+
+var (
+ // jsonTabs and jsonSpaces are used as caches for indents
+ jsonTabs [32]byte
+ jsonSpaces [128]byte
+
+ jsonHexEncoder hexEncoder
+ // jsonTimeLayout is used to validate time layouts.
+ // Unfortunately, we couldn't compare time.Time effectively, so punted.
+ // jsonTimeLayout time.Time
+)
+
+func init() {
+ for i := 0; i < len(jsonTabs); i++ {
+ jsonTabs[i] = '\t'
+ }
+ for i := 0; i < len(jsonSpaces); i++ {
+ jsonSpaces[i] = ' '
+ }
+ // jsonTimeLayout, err := time.Parse(time.Layout, time.Layout)
+ // halt.onerror(err)
+ // jsonTimeLayout = jsonTimeLayout.Round(time.Second).UTC()
+}
+
+// ----------------
+
+type jsonBytesFmt uint8
+
+const (
+ jsonBytesFmtArray jsonBytesFmt = iota + 1
+ jsonBytesFmtBase64
+ jsonBytesFmtBase64url
+ jsonBytesFmtBase32
+ jsonBytesFmtBase32hex
+ jsonBytesFmtBase16
+
+ jsonBytesFmtHex = jsonBytesFmtBase16
+)
+
+type jsonTimeFmt uint8
+
+const (
+ jsonTimeFmtStringLayout jsonTimeFmt = iota + 1
+ jsonTimeFmtUnix
+ jsonTimeFmtUnixMilli
+ jsonTimeFmtUnixMicro
+ jsonTimeFmtUnixNano
+)
+
+type jsonBytesFmter = bytesEncoder
+
+type jsonHandleOpts struct {
+ rawext bool
+ // bytesFmt used during encode to determine how to encode []byte
+ bytesFmt jsonBytesFmt
+ // timeFmt used during encode to determine how to encode a time.Time
+ timeFmt jsonTimeFmt
+ // timeFmtNum used during decode to decode a time.Time from an int64 in the stream
+ timeFmtNum jsonTimeFmt
+ // timeFmtLayouts used on decode, to try to parse time.Time until successful
+ timeFmtLayouts []string
+ // byteFmters used on decode, to try to parse []byte from a UTF-8 string encoding (e.g. base64)
+ byteFmters []jsonBytesFmter
+}
+
+func jsonCheckTimeLayout(s string) (ok bool) {
+ _, err := time.Parse(s, s)
+ // t...Equal(jsonTimeLayout) always returns false - unsure why
+ // return err == nil && t.Round(time.Second).UTC().Equal(jsonTimeLayout)
+ return err == nil
+}
+
+func (x *jsonHandleOpts) reset(h *JsonHandle) {
+ x.timeFmt = 0
+ x.timeFmtNum = 0
+ x.timeFmtLayouts = x.timeFmtLayouts[:0]
+ if len(h.TimeFormat) != 0 {
+ switch h.TimeFormat[0] {
+ case "unix":
+ x.timeFmt = jsonTimeFmtUnix
+ case "unixmilli":
+ x.timeFmt = jsonTimeFmtUnixMilli
+ case "unixmicro":
+ x.timeFmt = jsonTimeFmtUnixMicro
+ case "unixnano":
+ x.timeFmt = jsonTimeFmtUnixNano
+ }
+ x.timeFmtNum = x.timeFmt
+ for _, v := range h.TimeFormat {
+ if !strings.HasPrefix(v, "unix") && jsonCheckTimeLayout(v) {
+ x.timeFmtLayouts = append(x.timeFmtLayouts, v)
+ }
+ }
+ }
+ if x.timeFmt == 0 { // both timeFmt and timeFmtNum are 0
+ x.timeFmtNum = jsonTimeFmtUnix
+ x.timeFmt = jsonTimeFmtStringLayout
+ if len(x.timeFmtLayouts) == 0 {
+ x.timeFmtLayouts = append(x.timeFmtLayouts, time.RFC3339Nano)
+ }
+ }
+
+ x.bytesFmt = 0
+ x.byteFmters = x.byteFmters[:0]
+ var b64 bool
+ if len(h.BytesFormat) != 0 {
+ switch h.BytesFormat[0] {
+ case "array":
+ x.bytesFmt = jsonBytesFmtArray
+ case "base64":
+ x.bytesFmt = jsonBytesFmtBase64
+ case "base64url":
+ x.bytesFmt = jsonBytesFmtBase64url
+ case "base32":
+ x.bytesFmt = jsonBytesFmtBase32
+ case "base32hex":
+ x.bytesFmt = jsonBytesFmtBase32hex
+ case "base16", "hex":
+ x.bytesFmt = jsonBytesFmtBase16
+ }
+ for _, v := range h.BytesFormat {
+ switch v {
+ // case "array":
+ case "base64":
+ x.byteFmters = append(x.byteFmters, base64.StdEncoding)
+ b64 = true
+ case "base64url":
+ x.byteFmters = append(x.byteFmters, base64.URLEncoding)
+ case "base32":
+ x.byteFmters = append(x.byteFmters, base32.StdEncoding)
+ case "base32hex":
+ x.byteFmters = append(x.byteFmters, base32.HexEncoding)
+ case "base16", "hex":
+ x.byteFmters = append(x.byteFmters, &jsonHexEncoder)
+ }
+ }
+ }
+ if x.bytesFmt == 0 {
+ // either len==0 OR gibberish was in the first element; resolve here
+ x.bytesFmt = jsonBytesFmtBase64
+ if !b64 { // not present - so insert into pos 0
+ x.byteFmters = append(x.byteFmters, nil)
+ copy(x.byteFmters[1:], x.byteFmters[0:])
+ x.byteFmters[0] = base64.StdEncoding
+ }
+ }
+ // ----
+ x.rawext = h.RawBytesExt != nil
+}
+
+var jsonEncBoolStrs = [2][2]string{
+ {jsonLits[jsonLitF : jsonLitF+5], jsonLits[jsonLitT : jsonLitT+4]},
+ {jsonLits[jsonLitF-1 : jsonLitF+6], jsonLits[jsonLitT-1 : jsonLitT+5]},
+}
+
+func jsonEncodeUint(neg, quotes bool, u uint64, b *[48]byte) []byte {
+ // MARKER: use setByteAt/byteAt to elide the bounds-checks
+ // when we are sure that we don't go beyond the bounds.
+
+ // MARKER: copied mostly from std library: strconv/itoa.go
+ // this should only be called on 64bit OS.
+
+ var ss = jsonEncodeUintSmallsStringBytes[:]
+
+ // typically, 19 or 20 bytes sufficient for decimal encoding a uint64
+ var a = b[:24]
+ var i = uint(len(a))
+
+ if quotes {
+ i--
+ setByteAt(a, i, '"')
+ // a[i] = '"'
+ }
+ var is, us uint // use uint, as those fit into a register on the platform
+ if cpu32Bit {
+ for u >= 1e9 {
+ q := u / 1e9
+ us = uint(u - q*1e9) // u % 1e9 fits into a uint
+ for j := 4; j > 0; j-- {
+ is = us % 100 * 2
+ us /= 100
+ i -= 2
+ setByteAt(a, i+1, byteAt(ss, is+1))
+ setByteAt(a, i, byteAt(ss, is))
+ }
+ i--
+ setByteAt(a, i, byteAt(ss, us*2+1))
+ u = q
+ }
+ // u is now < 1e9, so is guaranteed to fit into a uint
+ }
+ us = uint(u)
+ for us >= 100 {
+ is = us % 100 * 2
+ us /= 100
+ i -= 2
+ setByteAt(a, i+1, byteAt(ss, is+1))
+ setByteAt(a, i, byteAt(ss, is))
+ // a[i+1], a[i] = ss[is+1], ss[is]
+ }
+
+ // us < 100
+ is = us * 2
+ i--
+ setByteAt(a, i, byteAt(ss, is+1))
+ // a[i] = ss[is+1]
+ if us >= 10 {
+ i--
+ setByteAt(a, i, byteAt(ss, is))
+ // a[i] = ss[is]
+ }
+ if neg {
+ i--
+ setByteAt(a, i, '-')
+ // a[i] = '-'
+ }
+ if quotes {
+ i--
+ setByteAt(a, i, '"')
+ // a[i] = '"'
+ }
+ return a[i:]
+}
+
+// MARKER: checkLitErr methods to prevent the got/expect parameters from escaping
+
+//go:noinline
+func jsonCheckLitErr3(got, expect [3]byte) {
+ halt.errorf("expecting %s: got %s", expect, got)
+}
+
+//go:noinline
+func jsonCheckLitErr4(got, expect [4]byte) {
+ halt.errorf("expecting %s: got %s", expect, got)
+}
+
+func jsonSlashURune(cs [4]byte) (rr uint32) {
+ for _, c := range cs {
+ // best to use explicit if-else
+ // - not a table, etc which involve memory loads, array lookup with bounds checks, etc
+ if c >= '0' && c <= '9' {
+ rr = rr*16 + uint32(c-jsonU4Chk2)
+ } else if c >= 'a' && c <= 'f' {
+ rr = rr*16 + uint32(c-jsonU4Chk1)
+ } else if c >= 'A' && c <= 'F' {
+ rr = rr*16 + uint32(c-jsonU4Chk0)
+ } else {
+ return unicode.ReplacementChar
+ }
+ }
+ return
+}
+
+func jsonNakedNum(z *fauxUnion, bs []byte, preferFloat, signedInt bool) (err error) {
+ // Note: jsonNakedNum is NEVER called with a zero-length []byte
+ if preferFloat {
+ z.v = valueTypeFloat
+ z.f, err = parseFloat64(bs)
+ } else {
+ err = parseNumber(bs, z, signedInt)
+ }
+ return
+}
+
+//----------------------
+
+// JsonHandle is a handle for JSON encoding format.
+//
+// Json is comprehensively supported:
+// - decodes numbers into interface{} as int, uint or float64
+// based on how the number looks and some config parameters e.g. PreferFloat, SignedInt, etc.
+// - decode integers from float formatted numbers e.g. 1.27e+8
+// - decode any json value (numbers, bool, etc) from quoted strings
+// - configurable way to encode/decode []byte .
+// by default, encodes and decodes []byte using base64 Std Encoding
+// - UTF-8 support for encoding and decoding
+//
+// It has better performance than the json library in the standard library,
+// by leveraging the performance improvements of the codec library.
+//
+// In addition, it doesn't read more bytes than necessary during a decode, which allows
+// reading multiple values from a stream containing json and non-json content.
+// For example, a user can read a json value, then a cbor value, then a msgpack value,
+// all from the same stream in sequence.
+//
+// Note that, when decoding quoted strings, invalid UTF-8 or invalid UTF-16 surrogate pairs are
+// not treated as an error. Instead, they are replaced by the Unicode replacement character U+FFFD.
+//
+// Note also that the float values for NaN, +Inf or -Inf are encoded as null,
+// as suggested by NOTE 4 of the ECMA-262 ECMAScript Language Specification 5.1 edition.
+// see http://www.ecma-international.org/publications/files/ECMA-ST/Ecma-262.pdf .
+//
+// Note the following behaviour differences vs std-library encoding/json package:
+// - struct field names matched in case-sensitive manner
+type JsonHandle struct {
+ textEncodingType
+ BasicHandle
+
+ // Indent indicates how a value is encoded.
+ // - If positive, indent by that number of spaces.
+ // - If negative, indent by that number of tabs.
+ Indent int8
+
+ // IntegerAsString controls how integers (signed and unsigned) are encoded.
+ //
+ // Per the JSON Spec, JSON numbers are 64-bit floating point numbers.
+ // Consequently, integers > 2^53 cannot be represented as a JSON number without losing precision.
+ // This can be mitigated by configuring how to encode integers.
+ //
+ // IntegerAsString interpretes the following values:
+ // - if 'L', then encode integers > 2^53 as a json string.
+ // - if 'A', then encode all integers as a json string
+ // containing the exact integer representation as a decimal.
+ // - else encode all integers as a json number (default)
+ IntegerAsString byte
+
+ // HTMLCharsAsIs controls how to encode some special characters to html: < > &
+ //
+ // By default, we encode them as \uXXX
+ // to prevent security holes when served from some browsers.
+ HTMLCharsAsIs bool
+
+ // PreferFloat says that we will default to decoding a number as a float.
+ // If not set, we will examine the characters of the number and decode as an
+ // integer type if it doesn't have any of the characters [.eE].
+ PreferFloat bool
+
+ // TermWhitespace says that we add a whitespace character
+ // at the end of an encoding.
+ //
+ // The whitespace is important, especially if using numbers in a context
+ // where multiple items are written to a stream.
+ TermWhitespace bool
+
+ // MapKeyAsString says to encode all map keys as strings.
+ //
+ // Use this to enforce strict json output.
+ // The only caveat is that nil value is ALWAYS written as null (never as "null")
+ MapKeyAsString bool
+
+ // _ uint64 // padding (cache line)
+
+ // Note: below, we store hardly-used items e.g. RawBytesExt.
+ // These values below may straddle a cache line, but they are hardly-used,
+ // so shouldn't contribute to false-sharing except in rare cases.
+
+ // RawBytesExt, if configured, is used to encode and decode raw bytes in a custom way.
+ // If not configured, raw bytes are encoded to/from base64 text.
+ RawBytesExt InterfaceExt
+
+ // TimeFormat is an array of strings representing a time.Time format, with each one being either
+ // a layout that honor the time.Time.Format specification.
+ // In addition, at most one of the set below (unix, unixmilli, unixmicro, unixnana) can be specified
+ // supporting encoding and decoding time as a number relative to the time epoch of Jan 1, 1970.
+ //
+ // During encode of a time.Time, the first entry in the array is used (defaults to RFC 3339).
+ //
+ // During decode,
+ // - if a string, then each of the layout formats will be tried in order until a time.Time is decoded.
+ // - if a number, then the sole unix entry is used.
+ TimeFormat []string
+
+ // BytesFormat is an array of strings representing how bytes are encoded.
+ //
+ // Supported values are base64 (default), base64url, base32, base32hex, base16 (synonymous with hex) and array.
+ //
+ // array is a special value configuring that bytes are encoded as a sequence of numbers.
+ //
+ // During encode of a []byte, the first entry is used (defaults to base64 if none specified).
+ //
+ // During decode
+ // - if a string, then attempt decoding using each format in sequence until successful.
+ // - if an array, then decode normally
+ BytesFormat []string
+}
+
+func (h *JsonHandle) isJson() bool { return true }
+
+// Name returns the name of the handle: json
+func (h *JsonHandle) Name() string { return "json" }
+
+// func (h *JsonHandle) desc(bd byte) string { return str4byte(bd) }
+func (h *JsonHandle) desc(bd byte) string { return string(bd) }
+
+func (h *JsonHandle) typical() bool {
+ return h.Indent == 0 && !h.MapKeyAsString && h.IntegerAsString != 'A' && h.IntegerAsString != 'L'
+}
+
+// SetInterfaceExt sets an extension
+func (h *JsonHandle) SetInterfaceExt(rt reflect.Type, tag uint64, ext InterfaceExt) (err error) {
+ return h.SetExt(rt, tag, makeExt(ext))
+}
+
+func jsonFloatStrconvFmtPrec64(f float64) (fmt byte, prec int8) {
+ fmt = 'f'
+ prec = -1
+ fbits := math.Float64bits(f)
+ abs := math.Float64frombits(fbits &^ (1 << 63))
+ if abs == 0 || abs == 1 {
+ prec = 1
+ } else if abs < 1e-6 || abs >= 1e21 {
+ fmt = 'e'
+ } else if noFrac64(fbits) {
+ prec = 1
+ }
+ return
+}
+
+func jsonFloatStrconvFmtPrec32(f float32) (fmt byte, prec int8) {
+ fmt = 'f'
+ prec = -1
+ // directly handle Modf (to get fractions) and Abs (to get absolute)
+ fbits := math.Float32bits(f)
+ abs := math.Float32frombits(fbits &^ (1 << 31))
+ if abs == 0 || abs == 1 {
+ prec = 1
+ } else if abs < 1e-6 || abs >= 1e21 {
+ fmt = 'e'
+ } else if noFrac32(fbits) {
+ prec = 1
+ }
+ return
+}
+
+var errJsonNoBd = errors.New("descBd unsupported in json")