mirror of
https://github.com/superseriousbusiness/gotosocial.git
synced 2025-10-29 14:32:25 -05:00
- github.com/KimMachineGun/automemlimit v0.7.2 => v0.7.3
- github.com/gin-contrib/cors v1.7.5 => v1.7.6
- github.com/minio/minio-go/v7 v7.0.92 => v7.0.94
- github.com/spf13/cast v1.8.0 => v1.9.2
- github.com/uptrace/bun{,/*} v1.2.11 => v1.2.14
- golang.org/x/image v0.27.0 => v0.28.0
- golang.org/x/net v0.40.0 => v0.41.0
- code.superseriousbusiness.org/go-swagger v0.31.0-gts-go1.23-fix => v0.32.3-gts-go1.23-fix
Reviewed-on: https://codeberg.org/superseriousbusiness/gotosocial/pulls/4304
Co-authored-by: kim <grufwub@gmail.com>
Co-committed-by: kim <grufwub@gmail.com>
504 lines
15 KiB
Go
504 lines
15 KiB
Go
// Copyright (c) 2012-2020 Ugorji Nwoke. All rights reserved.
|
|
// Use of this source code is governed by a MIT license found in the LICENSE file.
|
|
|
|
package codec
|
|
|
|
import (
|
|
"encoding/base32"
|
|
"encoding/base64"
|
|
"errors"
|
|
"math"
|
|
"reflect"
|
|
"strings"
|
|
"time"
|
|
"unicode"
|
|
)
|
|
|
|
//--------------------------------
|
|
|
|
// jsonLits and jsonLitb are defined at the package level,
|
|
// so they are guaranteed to be stored efficiently, making
|
|
// for better append/string comparison/etc.
|
|
//
|
|
// (anecdotal evidence from some benchmarking on go 1.20 devel in 20220104)
|
|
const jsonLits = `"true"false"null"{}[]`
|
|
|
|
const (
|
|
jsonLitT = 1
|
|
jsonLitF = 6
|
|
jsonLitN = 12
|
|
jsonLitM = 17
|
|
jsonLitA = 19
|
|
)
|
|
|
|
var jsonLitb = []byte(jsonLits)
|
|
var jsonNull = jsonLitb[jsonLitN : jsonLitN+4]
|
|
var jsonArrayEmpty = jsonLitb[jsonLitA : jsonLitA+2]
|
|
var jsonMapEmpty = jsonLitb[jsonLitM : jsonLitM+2]
|
|
|
|
const jsonEncodeUintSmallsString = "" +
|
|
"00010203040506070809" +
|
|
"10111213141516171819" +
|
|
"20212223242526272829" +
|
|
"30313233343536373839" +
|
|
"40414243444546474849" +
|
|
"50515253545556575859" +
|
|
"60616263646566676869" +
|
|
"70717273747576777879" +
|
|
"80818283848586878889" +
|
|
"90919293949596979899"
|
|
|
|
var jsonEncodeUintSmallsStringBytes = (*[len(jsonEncodeUintSmallsString)]byte)([]byte(jsonEncodeUintSmallsString))
|
|
|
|
const (
|
|
jsonU4Chk2 = '0'
|
|
jsonU4Chk1 = 'a' - 10
|
|
jsonU4Chk0 = 'A' - 10
|
|
)
|
|
|
|
const (
|
|
// If !jsonValidateSymbols, decoding will be faster, by skipping some checks:
|
|
// - If we see first character of null, false or true,
|
|
// do not validate subsequent characters.
|
|
// - e.g. if we see a n, assume null and skip next 3 characters,
|
|
// and do not validate they are ull.
|
|
// P.S. Do not expect a significant decoding boost from this.
|
|
jsonValidateSymbols = true
|
|
|
|
// jsonEscapeMultiByteUnicodeSep controls whether some unicode characters
|
|
// that are valid json but may bomb in some contexts are escaped during encoeing.
|
|
//
|
|
// U+2028 is LINE SEPARATOR. U+2029 is PARAGRAPH SEPARATOR.
|
|
// Both technically valid JSON, but bomb on JSONP, so fix here unconditionally.
|
|
jsonEscapeMultiByteUnicodeSep = true
|
|
|
|
// jsonNakedBoolNumInQuotedStr is used during decoding into a blank interface{}
|
|
// to control whether we detect quoted values of bools and null where a map key is expected,
|
|
// and treat as nil, true or false.
|
|
jsonNakedBoolNumInQuotedStr = true
|
|
)
|
|
|
|
var (
|
|
// jsonTabs and jsonSpaces are used as caches for indents
|
|
jsonTabs [32]byte
|
|
jsonSpaces [128]byte
|
|
|
|
jsonHexEncoder hexEncoder
|
|
// jsonTimeLayout is used to validate time layouts.
|
|
// Unfortunately, we couldn't compare time.Time effectively, so punted.
|
|
// jsonTimeLayout time.Time
|
|
)
|
|
|
|
func init() {
|
|
for i := 0; i < len(jsonTabs); i++ {
|
|
jsonTabs[i] = '\t'
|
|
}
|
|
for i := 0; i < len(jsonSpaces); i++ {
|
|
jsonSpaces[i] = ' '
|
|
}
|
|
// jsonTimeLayout, err := time.Parse(time.Layout, time.Layout)
|
|
// halt.onerror(err)
|
|
// jsonTimeLayout = jsonTimeLayout.Round(time.Second).UTC()
|
|
}
|
|
|
|
// ----------------
|
|
|
|
type jsonBytesFmt uint8
|
|
|
|
const (
|
|
jsonBytesFmtArray jsonBytesFmt = iota + 1
|
|
jsonBytesFmtBase64
|
|
jsonBytesFmtBase64url
|
|
jsonBytesFmtBase32
|
|
jsonBytesFmtBase32hex
|
|
jsonBytesFmtBase16
|
|
|
|
jsonBytesFmtHex = jsonBytesFmtBase16
|
|
)
|
|
|
|
type jsonTimeFmt uint8
|
|
|
|
const (
|
|
jsonTimeFmtStringLayout jsonTimeFmt = iota + 1
|
|
jsonTimeFmtUnix
|
|
jsonTimeFmtUnixMilli
|
|
jsonTimeFmtUnixMicro
|
|
jsonTimeFmtUnixNano
|
|
)
|
|
|
|
type jsonBytesFmter = bytesEncoder
|
|
|
|
type jsonHandleOpts struct {
|
|
rawext bool
|
|
// bytesFmt used during encode to determine how to encode []byte
|
|
bytesFmt jsonBytesFmt
|
|
// timeFmt used during encode to determine how to encode a time.Time
|
|
timeFmt jsonTimeFmt
|
|
// timeFmtNum used during decode to decode a time.Time from an int64 in the stream
|
|
timeFmtNum jsonTimeFmt
|
|
// timeFmtLayouts used on decode, to try to parse time.Time until successful
|
|
timeFmtLayouts []string
|
|
// byteFmters used on decode, to try to parse []byte from a UTF-8 string encoding (e.g. base64)
|
|
byteFmters []jsonBytesFmter
|
|
}
|
|
|
|
func jsonCheckTimeLayout(s string) (ok bool) {
|
|
_, err := time.Parse(s, s)
|
|
// t...Equal(jsonTimeLayout) always returns false - unsure why
|
|
// return err == nil && t.Round(time.Second).UTC().Equal(jsonTimeLayout)
|
|
return err == nil
|
|
}
|
|
|
|
func (x *jsonHandleOpts) reset(h *JsonHandle) {
|
|
x.timeFmt = 0
|
|
x.timeFmtNum = 0
|
|
x.timeFmtLayouts = x.timeFmtLayouts[:0]
|
|
if len(h.TimeFormat) != 0 {
|
|
switch h.TimeFormat[0] {
|
|
case "unix":
|
|
x.timeFmt = jsonTimeFmtUnix
|
|
case "unixmilli":
|
|
x.timeFmt = jsonTimeFmtUnixMilli
|
|
case "unixmicro":
|
|
x.timeFmt = jsonTimeFmtUnixMicro
|
|
case "unixnano":
|
|
x.timeFmt = jsonTimeFmtUnixNano
|
|
}
|
|
x.timeFmtNum = x.timeFmt
|
|
for _, v := range h.TimeFormat {
|
|
if !strings.HasPrefix(v, "unix") && jsonCheckTimeLayout(v) {
|
|
x.timeFmtLayouts = append(x.timeFmtLayouts, v)
|
|
}
|
|
}
|
|
}
|
|
if x.timeFmt == 0 { // both timeFmt and timeFmtNum are 0
|
|
x.timeFmtNum = jsonTimeFmtUnix
|
|
x.timeFmt = jsonTimeFmtStringLayout
|
|
if len(x.timeFmtLayouts) == 0 {
|
|
x.timeFmtLayouts = append(x.timeFmtLayouts, time.RFC3339Nano)
|
|
}
|
|
}
|
|
|
|
x.bytesFmt = 0
|
|
x.byteFmters = x.byteFmters[:0]
|
|
var b64 bool
|
|
if len(h.BytesFormat) != 0 {
|
|
switch h.BytesFormat[0] {
|
|
case "array":
|
|
x.bytesFmt = jsonBytesFmtArray
|
|
case "base64":
|
|
x.bytesFmt = jsonBytesFmtBase64
|
|
case "base64url":
|
|
x.bytesFmt = jsonBytesFmtBase64url
|
|
case "base32":
|
|
x.bytesFmt = jsonBytesFmtBase32
|
|
case "base32hex":
|
|
x.bytesFmt = jsonBytesFmtBase32hex
|
|
case "base16", "hex":
|
|
x.bytesFmt = jsonBytesFmtBase16
|
|
}
|
|
for _, v := range h.BytesFormat {
|
|
switch v {
|
|
// case "array":
|
|
case "base64":
|
|
x.byteFmters = append(x.byteFmters, base64.StdEncoding)
|
|
b64 = true
|
|
case "base64url":
|
|
x.byteFmters = append(x.byteFmters, base64.URLEncoding)
|
|
case "base32":
|
|
x.byteFmters = append(x.byteFmters, base32.StdEncoding)
|
|
case "base32hex":
|
|
x.byteFmters = append(x.byteFmters, base32.HexEncoding)
|
|
case "base16", "hex":
|
|
x.byteFmters = append(x.byteFmters, &jsonHexEncoder)
|
|
}
|
|
}
|
|
}
|
|
if x.bytesFmt == 0 {
|
|
// either len==0 OR gibberish was in the first element; resolve here
|
|
x.bytesFmt = jsonBytesFmtBase64
|
|
if !b64 { // not present - so insert into pos 0
|
|
x.byteFmters = append(x.byteFmters, nil)
|
|
copy(x.byteFmters[1:], x.byteFmters[0:])
|
|
x.byteFmters[0] = base64.StdEncoding
|
|
}
|
|
}
|
|
// ----
|
|
x.rawext = h.RawBytesExt != nil
|
|
}
|
|
|
|
var jsonEncBoolStrs = [2][2]string{
|
|
{jsonLits[jsonLitF : jsonLitF+5], jsonLits[jsonLitT : jsonLitT+4]},
|
|
{jsonLits[jsonLitF-1 : jsonLitF+6], jsonLits[jsonLitT-1 : jsonLitT+5]},
|
|
}
|
|
|
|
func jsonEncodeUint(neg, quotes bool, u uint64, b *[48]byte) []byte {
|
|
// MARKER: use setByteAt/byteAt to elide the bounds-checks
|
|
// when we are sure that we don't go beyond the bounds.
|
|
|
|
// MARKER: copied mostly from std library: strconv/itoa.go
|
|
// this should only be called on 64bit OS.
|
|
|
|
var ss = jsonEncodeUintSmallsStringBytes[:]
|
|
|
|
// typically, 19 or 20 bytes sufficient for decimal encoding a uint64
|
|
var a = b[:24]
|
|
var i = uint(len(a))
|
|
|
|
if quotes {
|
|
i--
|
|
setByteAt(a, i, '"')
|
|
// a[i] = '"'
|
|
}
|
|
var is, us uint // use uint, as those fit into a register on the platform
|
|
if cpu32Bit {
|
|
for u >= 1e9 {
|
|
q := u / 1e9
|
|
us = uint(u - q*1e9) // u % 1e9 fits into a uint
|
|
for j := 4; j > 0; j-- {
|
|
is = us % 100 * 2
|
|
us /= 100
|
|
i -= 2
|
|
setByteAt(a, i+1, byteAt(ss, is+1))
|
|
setByteAt(a, i, byteAt(ss, is))
|
|
}
|
|
i--
|
|
setByteAt(a, i, byteAt(ss, us*2+1))
|
|
u = q
|
|
}
|
|
// u is now < 1e9, so is guaranteed to fit into a uint
|
|
}
|
|
us = uint(u)
|
|
for us >= 100 {
|
|
is = us % 100 * 2
|
|
us /= 100
|
|
i -= 2
|
|
setByteAt(a, i+1, byteAt(ss, is+1))
|
|
setByteAt(a, i, byteAt(ss, is))
|
|
// a[i+1], a[i] = ss[is+1], ss[is]
|
|
}
|
|
|
|
// us < 100
|
|
is = us * 2
|
|
i--
|
|
setByteAt(a, i, byteAt(ss, is+1))
|
|
// a[i] = ss[is+1]
|
|
if us >= 10 {
|
|
i--
|
|
setByteAt(a, i, byteAt(ss, is))
|
|
// a[i] = ss[is]
|
|
}
|
|
if neg {
|
|
i--
|
|
setByteAt(a, i, '-')
|
|
// a[i] = '-'
|
|
}
|
|
if quotes {
|
|
i--
|
|
setByteAt(a, i, '"')
|
|
// a[i] = '"'
|
|
}
|
|
return a[i:]
|
|
}
|
|
|
|
// MARKER: checkLitErr methods to prevent the got/expect parameters from escaping
|
|
|
|
//go:noinline
|
|
func jsonCheckLitErr3(got, expect [3]byte) {
|
|
halt.errorf("expecting %s: got %s", expect, got)
|
|
}
|
|
|
|
//go:noinline
|
|
func jsonCheckLitErr4(got, expect [4]byte) {
|
|
halt.errorf("expecting %s: got %s", expect, got)
|
|
}
|
|
|
|
func jsonSlashURune(cs [4]byte) (rr uint32) {
|
|
for _, c := range cs {
|
|
// best to use explicit if-else
|
|
// - not a table, etc which involve memory loads, array lookup with bounds checks, etc
|
|
if c >= '0' && c <= '9' {
|
|
rr = rr*16 + uint32(c-jsonU4Chk2)
|
|
} else if c >= 'a' && c <= 'f' {
|
|
rr = rr*16 + uint32(c-jsonU4Chk1)
|
|
} else if c >= 'A' && c <= 'F' {
|
|
rr = rr*16 + uint32(c-jsonU4Chk0)
|
|
} else {
|
|
return unicode.ReplacementChar
|
|
}
|
|
}
|
|
return
|
|
}
|
|
|
|
func jsonNakedNum(z *fauxUnion, bs []byte, preferFloat, signedInt bool) (err error) {
|
|
// Note: jsonNakedNum is NEVER called with a zero-length []byte
|
|
if preferFloat {
|
|
z.v = valueTypeFloat
|
|
z.f, err = parseFloat64(bs)
|
|
} else {
|
|
err = parseNumber(bs, z, signedInt)
|
|
}
|
|
return
|
|
}
|
|
|
|
//----------------------
|
|
|
|
// JsonHandle is a handle for JSON encoding format.
|
|
//
|
|
// Json is comprehensively supported:
|
|
// - decodes numbers into interface{} as int, uint or float64
|
|
// based on how the number looks and some config parameters e.g. PreferFloat, SignedInt, etc.
|
|
// - decode integers from float formatted numbers e.g. 1.27e+8
|
|
// - decode any json value (numbers, bool, etc) from quoted strings
|
|
// - configurable way to encode/decode []byte .
|
|
// by default, encodes and decodes []byte using base64 Std Encoding
|
|
// - UTF-8 support for encoding and decoding
|
|
//
|
|
// It has better performance than the json library in the standard library,
|
|
// by leveraging the performance improvements of the codec library.
|
|
//
|
|
// In addition, it doesn't read more bytes than necessary during a decode, which allows
|
|
// reading multiple values from a stream containing json and non-json content.
|
|
// For example, a user can read a json value, then a cbor value, then a msgpack value,
|
|
// all from the same stream in sequence.
|
|
//
|
|
// Note that, when decoding quoted strings, invalid UTF-8 or invalid UTF-16 surrogate pairs are
|
|
// not treated as an error. Instead, they are replaced by the Unicode replacement character U+FFFD.
|
|
//
|
|
// Note also that the float values for NaN, +Inf or -Inf are encoded as null,
|
|
// as suggested by NOTE 4 of the ECMA-262 ECMAScript Language Specification 5.1 edition.
|
|
// see http://www.ecma-international.org/publications/files/ECMA-ST/Ecma-262.pdf .
|
|
//
|
|
// Note the following behaviour differences vs std-library encoding/json package:
|
|
// - struct field names matched in case-sensitive manner
|
|
type JsonHandle struct {
|
|
textEncodingType
|
|
BasicHandle
|
|
|
|
// Indent indicates how a value is encoded.
|
|
// - If positive, indent by that number of spaces.
|
|
// - If negative, indent by that number of tabs.
|
|
Indent int8
|
|
|
|
// IntegerAsString controls how integers (signed and unsigned) are encoded.
|
|
//
|
|
// Per the JSON Spec, JSON numbers are 64-bit floating point numbers.
|
|
// Consequently, integers > 2^53 cannot be represented as a JSON number without losing precision.
|
|
// This can be mitigated by configuring how to encode integers.
|
|
//
|
|
// IntegerAsString interpretes the following values:
|
|
// - if 'L', then encode integers > 2^53 as a json string.
|
|
// - if 'A', then encode all integers as a json string
|
|
// containing the exact integer representation as a decimal.
|
|
// - else encode all integers as a json number (default)
|
|
IntegerAsString byte
|
|
|
|
// HTMLCharsAsIs controls how to encode some special characters to html: < > &
|
|
//
|
|
// By default, we encode them as \uXXX
|
|
// to prevent security holes when served from some browsers.
|
|
HTMLCharsAsIs bool
|
|
|
|
// PreferFloat says that we will default to decoding a number as a float.
|
|
// If not set, we will examine the characters of the number and decode as an
|
|
// integer type if it doesn't have any of the characters [.eE].
|
|
PreferFloat bool
|
|
|
|
// TermWhitespace says that we add a whitespace character
|
|
// at the end of an encoding.
|
|
//
|
|
// The whitespace is important, especially if using numbers in a context
|
|
// where multiple items are written to a stream.
|
|
TermWhitespace bool
|
|
|
|
// MapKeyAsString says to encode all map keys as strings.
|
|
//
|
|
// Use this to enforce strict json output.
|
|
// The only caveat is that nil value is ALWAYS written as null (never as "null")
|
|
MapKeyAsString bool
|
|
|
|
// _ uint64 // padding (cache line)
|
|
|
|
// Note: below, we store hardly-used items e.g. RawBytesExt.
|
|
// These values below may straddle a cache line, but they are hardly-used,
|
|
// so shouldn't contribute to false-sharing except in rare cases.
|
|
|
|
// RawBytesExt, if configured, is used to encode and decode raw bytes in a custom way.
|
|
// If not configured, raw bytes are encoded to/from base64 text.
|
|
RawBytesExt InterfaceExt
|
|
|
|
// TimeFormat is an array of strings representing a time.Time format, with each one being either
|
|
// a layout that honor the time.Time.Format specification.
|
|
// In addition, at most one of the set below (unix, unixmilli, unixmicro, unixnana) can be specified
|
|
// supporting encoding and decoding time as a number relative to the time epoch of Jan 1, 1970.
|
|
//
|
|
// During encode of a time.Time, the first entry in the array is used (defaults to RFC 3339).
|
|
//
|
|
// During decode,
|
|
// - if a string, then each of the layout formats will be tried in order until a time.Time is decoded.
|
|
// - if a number, then the sole unix entry is used.
|
|
TimeFormat []string
|
|
|
|
// BytesFormat is an array of strings representing how bytes are encoded.
|
|
//
|
|
// Supported values are base64 (default), base64url, base32, base32hex, base16 (synonymous with hex) and array.
|
|
//
|
|
// array is a special value configuring that bytes are encoded as a sequence of numbers.
|
|
//
|
|
// During encode of a []byte, the first entry is used (defaults to base64 if none specified).
|
|
//
|
|
// During decode
|
|
// - if a string, then attempt decoding using each format in sequence until successful.
|
|
// - if an array, then decode normally
|
|
BytesFormat []string
|
|
}
|
|
|
|
func (h *JsonHandle) isJson() bool { return true }
|
|
|
|
// Name returns the name of the handle: json
|
|
func (h *JsonHandle) Name() string { return "json" }
|
|
|
|
// func (h *JsonHandle) desc(bd byte) string { return str4byte(bd) }
|
|
func (h *JsonHandle) desc(bd byte) string { return string(bd) }
|
|
|
|
func (h *JsonHandle) typical() bool {
|
|
return h.Indent == 0 && !h.MapKeyAsString && h.IntegerAsString != 'A' && h.IntegerAsString != 'L'
|
|
}
|
|
|
|
// SetInterfaceExt sets an extension
|
|
func (h *JsonHandle) SetInterfaceExt(rt reflect.Type, tag uint64, ext InterfaceExt) (err error) {
|
|
return h.SetExt(rt, tag, makeExt(ext))
|
|
}
|
|
|
|
func jsonFloatStrconvFmtPrec64(f float64) (fmt byte, prec int8) {
|
|
fmt = 'f'
|
|
prec = -1
|
|
fbits := math.Float64bits(f)
|
|
abs := math.Float64frombits(fbits &^ (1 << 63))
|
|
if abs == 0 || abs == 1 {
|
|
prec = 1
|
|
} else if abs < 1e-6 || abs >= 1e21 {
|
|
fmt = 'e'
|
|
} else if noFrac64(fbits) {
|
|
prec = 1
|
|
}
|
|
return
|
|
}
|
|
|
|
func jsonFloatStrconvFmtPrec32(f float32) (fmt byte, prec int8) {
|
|
fmt = 'f'
|
|
prec = -1
|
|
// directly handle Modf (to get fractions) and Abs (to get absolute)
|
|
fbits := math.Float32bits(f)
|
|
abs := math.Float32frombits(fbits &^ (1 << 31))
|
|
if abs == 0 || abs == 1 {
|
|
prec = 1
|
|
} else if abs < 1e-6 || abs >= 1e21 {
|
|
fmt = 'e'
|
|
} else if noFrac32(fbits) {
|
|
prec = 1
|
|
}
|
|
return
|
|
}
|
|
|
|
var errJsonNoBd = errors.New("descBd unsupported in json")
|