gotosocial/vendor/github.com/ugorji/go/codec/json.base.go
kim 8b0ea56027 [chore] update go dependencies (#4304)
- github.com/KimMachineGun/automemlimit v0.7.2 => v0.7.3
- github.com/gin-contrib/cors v1.7.5 => v1.7.6
- github.com/minio/minio-go/v7 v7.0.92 => v7.0.94
- github.com/spf13/cast v1.8.0 => v1.9.2
- github.com/uptrace/bun{,/*} v1.2.11 => v1.2.14
- golang.org/x/image v0.27.0 => v0.28.0
- golang.org/x/net v0.40.0 => v0.41.0
- code.superseriousbusiness.org/go-swagger v0.31.0-gts-go1.23-fix => v0.32.3-gts-go1.23-fix

Reviewed-on: https://codeberg.org/superseriousbusiness/gotosocial/pulls/4304
Co-authored-by: kim <grufwub@gmail.com>
Co-committed-by: kim <grufwub@gmail.com>
2025-06-30 15:19:09 +02:00

504 lines
15 KiB
Go

// Copyright (c) 2012-2020 Ugorji Nwoke. All rights reserved.
// Use of this source code is governed by a MIT license found in the LICENSE file.
package codec
import (
"encoding/base32"
"encoding/base64"
"errors"
"math"
"reflect"
"strings"
"time"
"unicode"
)
//--------------------------------
// jsonLits and jsonLitb are defined at the package level,
// so they are guaranteed to be stored efficiently, making
// for better append/string comparison/etc.
//
// (anecdotal evidence from some benchmarking on go 1.20 devel in 20220104)
const jsonLits = `"true"false"null"{}[]`
const (
jsonLitT = 1
jsonLitF = 6
jsonLitN = 12
jsonLitM = 17
jsonLitA = 19
)
var jsonLitb = []byte(jsonLits)
var jsonNull = jsonLitb[jsonLitN : jsonLitN+4]
var jsonArrayEmpty = jsonLitb[jsonLitA : jsonLitA+2]
var jsonMapEmpty = jsonLitb[jsonLitM : jsonLitM+2]
const jsonEncodeUintSmallsString = "" +
"00010203040506070809" +
"10111213141516171819" +
"20212223242526272829" +
"30313233343536373839" +
"40414243444546474849" +
"50515253545556575859" +
"60616263646566676869" +
"70717273747576777879" +
"80818283848586878889" +
"90919293949596979899"
var jsonEncodeUintSmallsStringBytes = (*[len(jsonEncodeUintSmallsString)]byte)([]byte(jsonEncodeUintSmallsString))
const (
jsonU4Chk2 = '0'
jsonU4Chk1 = 'a' - 10
jsonU4Chk0 = 'A' - 10
)
const (
// If !jsonValidateSymbols, decoding will be faster, by skipping some checks:
// - If we see first character of null, false or true,
// do not validate subsequent characters.
// - e.g. if we see a n, assume null and skip next 3 characters,
// and do not validate they are ull.
// P.S. Do not expect a significant decoding boost from this.
jsonValidateSymbols = true
// jsonEscapeMultiByteUnicodeSep controls whether some unicode characters
// that are valid json but may bomb in some contexts are escaped during encoeing.
//
// U+2028 is LINE SEPARATOR. U+2029 is PARAGRAPH SEPARATOR.
// Both technically valid JSON, but bomb on JSONP, so fix here unconditionally.
jsonEscapeMultiByteUnicodeSep = true
// jsonNakedBoolNumInQuotedStr is used during decoding into a blank interface{}
// to control whether we detect quoted values of bools and null where a map key is expected,
// and treat as nil, true or false.
jsonNakedBoolNumInQuotedStr = true
)
var (
// jsonTabs and jsonSpaces are used as caches for indents
jsonTabs [32]byte
jsonSpaces [128]byte
jsonHexEncoder hexEncoder
// jsonTimeLayout is used to validate time layouts.
// Unfortunately, we couldn't compare time.Time effectively, so punted.
// jsonTimeLayout time.Time
)
func init() {
for i := 0; i < len(jsonTabs); i++ {
jsonTabs[i] = '\t'
}
for i := 0; i < len(jsonSpaces); i++ {
jsonSpaces[i] = ' '
}
// jsonTimeLayout, err := time.Parse(time.Layout, time.Layout)
// halt.onerror(err)
// jsonTimeLayout = jsonTimeLayout.Round(time.Second).UTC()
}
// ----------------
type jsonBytesFmt uint8
const (
jsonBytesFmtArray jsonBytesFmt = iota + 1
jsonBytesFmtBase64
jsonBytesFmtBase64url
jsonBytesFmtBase32
jsonBytesFmtBase32hex
jsonBytesFmtBase16
jsonBytesFmtHex = jsonBytesFmtBase16
)
type jsonTimeFmt uint8
const (
jsonTimeFmtStringLayout jsonTimeFmt = iota + 1
jsonTimeFmtUnix
jsonTimeFmtUnixMilli
jsonTimeFmtUnixMicro
jsonTimeFmtUnixNano
)
type jsonBytesFmter = bytesEncoder
type jsonHandleOpts struct {
rawext bool
// bytesFmt used during encode to determine how to encode []byte
bytesFmt jsonBytesFmt
// timeFmt used during encode to determine how to encode a time.Time
timeFmt jsonTimeFmt
// timeFmtNum used during decode to decode a time.Time from an int64 in the stream
timeFmtNum jsonTimeFmt
// timeFmtLayouts used on decode, to try to parse time.Time until successful
timeFmtLayouts []string
// byteFmters used on decode, to try to parse []byte from a UTF-8 string encoding (e.g. base64)
byteFmters []jsonBytesFmter
}
func jsonCheckTimeLayout(s string) (ok bool) {
_, err := time.Parse(s, s)
// t...Equal(jsonTimeLayout) always returns false - unsure why
// return err == nil && t.Round(time.Second).UTC().Equal(jsonTimeLayout)
return err == nil
}
func (x *jsonHandleOpts) reset(h *JsonHandle) {
x.timeFmt = 0
x.timeFmtNum = 0
x.timeFmtLayouts = x.timeFmtLayouts[:0]
if len(h.TimeFormat) != 0 {
switch h.TimeFormat[0] {
case "unix":
x.timeFmt = jsonTimeFmtUnix
case "unixmilli":
x.timeFmt = jsonTimeFmtUnixMilli
case "unixmicro":
x.timeFmt = jsonTimeFmtUnixMicro
case "unixnano":
x.timeFmt = jsonTimeFmtUnixNano
}
x.timeFmtNum = x.timeFmt
for _, v := range h.TimeFormat {
if !strings.HasPrefix(v, "unix") && jsonCheckTimeLayout(v) {
x.timeFmtLayouts = append(x.timeFmtLayouts, v)
}
}
}
if x.timeFmt == 0 { // both timeFmt and timeFmtNum are 0
x.timeFmtNum = jsonTimeFmtUnix
x.timeFmt = jsonTimeFmtStringLayout
if len(x.timeFmtLayouts) == 0 {
x.timeFmtLayouts = append(x.timeFmtLayouts, time.RFC3339Nano)
}
}
x.bytesFmt = 0
x.byteFmters = x.byteFmters[:0]
var b64 bool
if len(h.BytesFormat) != 0 {
switch h.BytesFormat[0] {
case "array":
x.bytesFmt = jsonBytesFmtArray
case "base64":
x.bytesFmt = jsonBytesFmtBase64
case "base64url":
x.bytesFmt = jsonBytesFmtBase64url
case "base32":
x.bytesFmt = jsonBytesFmtBase32
case "base32hex":
x.bytesFmt = jsonBytesFmtBase32hex
case "base16", "hex":
x.bytesFmt = jsonBytesFmtBase16
}
for _, v := range h.BytesFormat {
switch v {
// case "array":
case "base64":
x.byteFmters = append(x.byteFmters, base64.StdEncoding)
b64 = true
case "base64url":
x.byteFmters = append(x.byteFmters, base64.URLEncoding)
case "base32":
x.byteFmters = append(x.byteFmters, base32.StdEncoding)
case "base32hex":
x.byteFmters = append(x.byteFmters, base32.HexEncoding)
case "base16", "hex":
x.byteFmters = append(x.byteFmters, &jsonHexEncoder)
}
}
}
if x.bytesFmt == 0 {
// either len==0 OR gibberish was in the first element; resolve here
x.bytesFmt = jsonBytesFmtBase64
if !b64 { // not present - so insert into pos 0
x.byteFmters = append(x.byteFmters, nil)
copy(x.byteFmters[1:], x.byteFmters[0:])
x.byteFmters[0] = base64.StdEncoding
}
}
// ----
x.rawext = h.RawBytesExt != nil
}
var jsonEncBoolStrs = [2][2]string{
{jsonLits[jsonLitF : jsonLitF+5], jsonLits[jsonLitT : jsonLitT+4]},
{jsonLits[jsonLitF-1 : jsonLitF+6], jsonLits[jsonLitT-1 : jsonLitT+5]},
}
func jsonEncodeUint(neg, quotes bool, u uint64, b *[48]byte) []byte {
// MARKER: use setByteAt/byteAt to elide the bounds-checks
// when we are sure that we don't go beyond the bounds.
// MARKER: copied mostly from std library: strconv/itoa.go
// this should only be called on 64bit OS.
var ss = jsonEncodeUintSmallsStringBytes[:]
// typically, 19 or 20 bytes sufficient for decimal encoding a uint64
var a = b[:24]
var i = uint(len(a))
if quotes {
i--
setByteAt(a, i, '"')
// a[i] = '"'
}
var is, us uint // use uint, as those fit into a register on the platform
if cpu32Bit {
for u >= 1e9 {
q := u / 1e9
us = uint(u - q*1e9) // u % 1e9 fits into a uint
for j := 4; j > 0; j-- {
is = us % 100 * 2
us /= 100
i -= 2
setByteAt(a, i+1, byteAt(ss, is+1))
setByteAt(a, i, byteAt(ss, is))
}
i--
setByteAt(a, i, byteAt(ss, us*2+1))
u = q
}
// u is now < 1e9, so is guaranteed to fit into a uint
}
us = uint(u)
for us >= 100 {
is = us % 100 * 2
us /= 100
i -= 2
setByteAt(a, i+1, byteAt(ss, is+1))
setByteAt(a, i, byteAt(ss, is))
// a[i+1], a[i] = ss[is+1], ss[is]
}
// us < 100
is = us * 2
i--
setByteAt(a, i, byteAt(ss, is+1))
// a[i] = ss[is+1]
if us >= 10 {
i--
setByteAt(a, i, byteAt(ss, is))
// a[i] = ss[is]
}
if neg {
i--
setByteAt(a, i, '-')
// a[i] = '-'
}
if quotes {
i--
setByteAt(a, i, '"')
// a[i] = '"'
}
return a[i:]
}
// MARKER: checkLitErr methods to prevent the got/expect parameters from escaping
//go:noinline
func jsonCheckLitErr3(got, expect [3]byte) {
halt.errorf("expecting %s: got %s", expect, got)
}
//go:noinline
func jsonCheckLitErr4(got, expect [4]byte) {
halt.errorf("expecting %s: got %s", expect, got)
}
func jsonSlashURune(cs [4]byte) (rr uint32) {
for _, c := range cs {
// best to use explicit if-else
// - not a table, etc which involve memory loads, array lookup with bounds checks, etc
if c >= '0' && c <= '9' {
rr = rr*16 + uint32(c-jsonU4Chk2)
} else if c >= 'a' && c <= 'f' {
rr = rr*16 + uint32(c-jsonU4Chk1)
} else if c >= 'A' && c <= 'F' {
rr = rr*16 + uint32(c-jsonU4Chk0)
} else {
return unicode.ReplacementChar
}
}
return
}
func jsonNakedNum(z *fauxUnion, bs []byte, preferFloat, signedInt bool) (err error) {
// Note: jsonNakedNum is NEVER called with a zero-length []byte
if preferFloat {
z.v = valueTypeFloat
z.f, err = parseFloat64(bs)
} else {
err = parseNumber(bs, z, signedInt)
}
return
}
//----------------------
// JsonHandle is a handle for JSON encoding format.
//
// Json is comprehensively supported:
// - decodes numbers into interface{} as int, uint or float64
// based on how the number looks and some config parameters e.g. PreferFloat, SignedInt, etc.
// - decode integers from float formatted numbers e.g. 1.27e+8
// - decode any json value (numbers, bool, etc) from quoted strings
// - configurable way to encode/decode []byte .
// by default, encodes and decodes []byte using base64 Std Encoding
// - UTF-8 support for encoding and decoding
//
// It has better performance than the json library in the standard library,
// by leveraging the performance improvements of the codec library.
//
// In addition, it doesn't read more bytes than necessary during a decode, which allows
// reading multiple values from a stream containing json and non-json content.
// For example, a user can read a json value, then a cbor value, then a msgpack value,
// all from the same stream in sequence.
//
// Note that, when decoding quoted strings, invalid UTF-8 or invalid UTF-16 surrogate pairs are
// not treated as an error. Instead, they are replaced by the Unicode replacement character U+FFFD.
//
// Note also that the float values for NaN, +Inf or -Inf are encoded as null,
// as suggested by NOTE 4 of the ECMA-262 ECMAScript Language Specification 5.1 edition.
// see http://www.ecma-international.org/publications/files/ECMA-ST/Ecma-262.pdf .
//
// Note the following behaviour differences vs std-library encoding/json package:
// - struct field names matched in case-sensitive manner
type JsonHandle struct {
textEncodingType
BasicHandle
// Indent indicates how a value is encoded.
// - If positive, indent by that number of spaces.
// - If negative, indent by that number of tabs.
Indent int8
// IntegerAsString controls how integers (signed and unsigned) are encoded.
//
// Per the JSON Spec, JSON numbers are 64-bit floating point numbers.
// Consequently, integers > 2^53 cannot be represented as a JSON number without losing precision.
// This can be mitigated by configuring how to encode integers.
//
// IntegerAsString interpretes the following values:
// - if 'L', then encode integers > 2^53 as a json string.
// - if 'A', then encode all integers as a json string
// containing the exact integer representation as a decimal.
// - else encode all integers as a json number (default)
IntegerAsString byte
// HTMLCharsAsIs controls how to encode some special characters to html: < > &
//
// By default, we encode them as \uXXX
// to prevent security holes when served from some browsers.
HTMLCharsAsIs bool
// PreferFloat says that we will default to decoding a number as a float.
// If not set, we will examine the characters of the number and decode as an
// integer type if it doesn't have any of the characters [.eE].
PreferFloat bool
// TermWhitespace says that we add a whitespace character
// at the end of an encoding.
//
// The whitespace is important, especially if using numbers in a context
// where multiple items are written to a stream.
TermWhitespace bool
// MapKeyAsString says to encode all map keys as strings.
//
// Use this to enforce strict json output.
// The only caveat is that nil value is ALWAYS written as null (never as "null")
MapKeyAsString bool
// _ uint64 // padding (cache line)
// Note: below, we store hardly-used items e.g. RawBytesExt.
// These values below may straddle a cache line, but they are hardly-used,
// so shouldn't contribute to false-sharing except in rare cases.
// RawBytesExt, if configured, is used to encode and decode raw bytes in a custom way.
// If not configured, raw bytes are encoded to/from base64 text.
RawBytesExt InterfaceExt
// TimeFormat is an array of strings representing a time.Time format, with each one being either
// a layout that honor the time.Time.Format specification.
// In addition, at most one of the set below (unix, unixmilli, unixmicro, unixnana) can be specified
// supporting encoding and decoding time as a number relative to the time epoch of Jan 1, 1970.
//
// During encode of a time.Time, the first entry in the array is used (defaults to RFC 3339).
//
// During decode,
// - if a string, then each of the layout formats will be tried in order until a time.Time is decoded.
// - if a number, then the sole unix entry is used.
TimeFormat []string
// BytesFormat is an array of strings representing how bytes are encoded.
//
// Supported values are base64 (default), base64url, base32, base32hex, base16 (synonymous with hex) and array.
//
// array is a special value configuring that bytes are encoded as a sequence of numbers.
//
// During encode of a []byte, the first entry is used (defaults to base64 if none specified).
//
// During decode
// - if a string, then attempt decoding using each format in sequence until successful.
// - if an array, then decode normally
BytesFormat []string
}
func (h *JsonHandle) isJson() bool { return true }
// Name returns the name of the handle: json
func (h *JsonHandle) Name() string { return "json" }
// func (h *JsonHandle) desc(bd byte) string { return str4byte(bd) }
func (h *JsonHandle) desc(bd byte) string { return string(bd) }
func (h *JsonHandle) typical() bool {
return h.Indent == 0 && !h.MapKeyAsString && h.IntegerAsString != 'A' && h.IntegerAsString != 'L'
}
// SetInterfaceExt sets an extension
func (h *JsonHandle) SetInterfaceExt(rt reflect.Type, tag uint64, ext InterfaceExt) (err error) {
return h.SetExt(rt, tag, makeExt(ext))
}
func jsonFloatStrconvFmtPrec64(f float64) (fmt byte, prec int8) {
fmt = 'f'
prec = -1
fbits := math.Float64bits(f)
abs := math.Float64frombits(fbits &^ (1 << 63))
if abs == 0 || abs == 1 {
prec = 1
} else if abs < 1e-6 || abs >= 1e21 {
fmt = 'e'
} else if noFrac64(fbits) {
prec = 1
}
return
}
func jsonFloatStrconvFmtPrec32(f float32) (fmt byte, prec int8) {
fmt = 'f'
prec = -1
// directly handle Modf (to get fractions) and Abs (to get absolute)
fbits := math.Float32bits(f)
abs := math.Float32frombits(fbits &^ (1 << 31))
if abs == 0 || abs == 1 {
prec = 1
} else if abs < 1e-6 || abs >= 1e21 {
fmt = 'e'
} else if noFrac32(fbits) {
prec = 1
}
return
}
var errJsonNoBd = errors.New("descBd unsupported in json")