328 lines
9.0 KiB
Go
328 lines
9.0 KiB
Go
/*
|
|
* Copyright 2021 ByteDance Inc.
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
package encoder
|
|
|
|
import (
|
|
`bytes`
|
|
`encoding/json`
|
|
`reflect`
|
|
`runtime`
|
|
`unsafe`
|
|
|
|
`github.com/bytedance/sonic/internal/native`
|
|
`github.com/bytedance/sonic/internal/native/types`
|
|
`github.com/bytedance/sonic/internal/rt`
|
|
`github.com/bytedance/sonic/utf8`
|
|
`github.com/bytedance/sonic/option`
|
|
)
|
|
|
|
// Options is a set of encoding options.
|
|
type Options uint64
|
|
|
|
const (
|
|
bitSortMapKeys = iota
|
|
bitEscapeHTML
|
|
bitCompactMarshaler
|
|
bitNoQuoteTextMarshaler
|
|
bitNoNullSliceOrMap
|
|
bitValidateString
|
|
|
|
// used for recursive compile
|
|
bitPointerValue = 63
|
|
)
|
|
|
|
const (
|
|
// SortMapKeys indicates that the keys of a map needs to be sorted
|
|
// before serializing into JSON.
|
|
// WARNING: This hurts performance A LOT, USE WITH CARE.
|
|
SortMapKeys Options = 1 << bitSortMapKeys
|
|
|
|
// EscapeHTML indicates encoder to escape all HTML characters
|
|
// after serializing into JSON (see https://pkg.go.dev/encoding/json#HTMLEscape).
|
|
// WARNING: This hurts performance A LOT, USE WITH CARE.
|
|
EscapeHTML Options = 1 << bitEscapeHTML
|
|
|
|
// CompactMarshaler indicates that the output JSON from json.Marshaler
|
|
// is always compact and needs no validation
|
|
CompactMarshaler Options = 1 << bitCompactMarshaler
|
|
|
|
// NoQuoteTextMarshaler indicates that the output text from encoding.TextMarshaler
|
|
// is always escaped string and needs no quoting
|
|
NoQuoteTextMarshaler Options = 1 << bitNoQuoteTextMarshaler
|
|
|
|
// NoNullSliceOrMap indicates all empty Array or Object are encoded as '[]' or '{}',
|
|
// instead of 'null'
|
|
NoNullSliceOrMap Options = 1 << bitNoNullSliceOrMap
|
|
|
|
// ValidateString indicates that encoder should validate the input string
|
|
// before encoding it into JSON.
|
|
ValidateString Options = 1 << bitValidateString
|
|
|
|
// CompatibleWithStd is used to be compatible with std encoder.
|
|
CompatibleWithStd Options = SortMapKeys | EscapeHTML | CompactMarshaler
|
|
)
|
|
|
|
// Encoder represents a specific set of encoder configurations.
|
|
type Encoder struct {
|
|
Opts Options
|
|
prefix string
|
|
indent string
|
|
}
|
|
|
|
// Encode returns the JSON encoding of v.
|
|
func (self *Encoder) Encode(v interface{}) ([]byte, error) {
|
|
if self.indent != "" || self.prefix != "" {
|
|
return EncodeIndented(v, self.prefix, self.indent, self.Opts)
|
|
}
|
|
return Encode(v, self.Opts)
|
|
}
|
|
|
|
// SortKeys enables the SortMapKeys option.
|
|
func (self *Encoder) SortKeys() *Encoder {
|
|
self.Opts |= SortMapKeys
|
|
return self
|
|
}
|
|
|
|
// SetEscapeHTML specifies if option EscapeHTML opens
|
|
func (self *Encoder) SetEscapeHTML(f bool) {
|
|
if f {
|
|
self.Opts |= EscapeHTML
|
|
} else {
|
|
self.Opts &= ^EscapeHTML
|
|
}
|
|
}
|
|
|
|
// SetValidateString specifies if option ValidateString opens
|
|
func (self *Encoder) SetValidateString(f bool) {
|
|
if f {
|
|
self.Opts |= ValidateString
|
|
} else {
|
|
self.Opts &= ^ValidateString
|
|
}
|
|
}
|
|
|
|
// SetCompactMarshaler specifies if option CompactMarshaler opens
|
|
func (self *Encoder) SetCompactMarshaler(f bool) {
|
|
if f {
|
|
self.Opts |= CompactMarshaler
|
|
} else {
|
|
self.Opts &= ^CompactMarshaler
|
|
}
|
|
}
|
|
|
|
// SetNoQuoteTextMarshaler specifies if option NoQuoteTextMarshaler opens
|
|
func (self *Encoder) SetNoQuoteTextMarshaler(f bool) {
|
|
if f {
|
|
self.Opts |= NoQuoteTextMarshaler
|
|
} else {
|
|
self.Opts &= ^NoQuoteTextMarshaler
|
|
}
|
|
}
|
|
|
|
// SetIndent instructs the encoder to format each subsequent encoded
|
|
// value as if indented by the package-level function EncodeIndent().
|
|
// Calling SetIndent("", "") disables indentation.
|
|
func (enc *Encoder) SetIndent(prefix, indent string) {
|
|
enc.prefix = prefix
|
|
enc.indent = indent
|
|
}
|
|
|
|
// Quote returns the JSON-quoted version of s.
|
|
func Quote(s string) string {
|
|
var n int
|
|
var p []byte
|
|
|
|
/* check for empty string */
|
|
if s == "" {
|
|
return `""`
|
|
}
|
|
|
|
/* allocate space for result */
|
|
n = len(s) + 2
|
|
p = make([]byte, 0, n)
|
|
|
|
/* call the encoder */
|
|
_ = encodeString(&p, s)
|
|
return rt.Mem2Str(p)
|
|
}
|
|
|
|
// Encode returns the JSON encoding of val, encoded with opts.
|
|
func Encode(val interface{}, opts Options) ([]byte, error) {
|
|
var ret []byte
|
|
|
|
buf := newBytes()
|
|
err := encodeInto(&buf, val, opts)
|
|
|
|
/* check for errors */
|
|
if err != nil {
|
|
freeBytes(buf)
|
|
return nil, err
|
|
}
|
|
|
|
/* htmlescape or correct UTF-8 if opts enable */
|
|
old := buf
|
|
buf = encodeFinish(old, opts)
|
|
pbuf := ((*rt.GoSlice)(unsafe.Pointer(&buf))).Ptr
|
|
pold := ((*rt.GoSlice)(unsafe.Pointer(&old))).Ptr
|
|
|
|
/* return when allocated a new buffer */
|
|
if pbuf != pold {
|
|
freeBytes(old)
|
|
return buf, nil
|
|
}
|
|
|
|
/* make a copy of the result */
|
|
ret = make([]byte, len(buf))
|
|
copy(ret, buf)
|
|
|
|
freeBytes(buf)
|
|
/* return the buffer into pool */
|
|
return ret, nil
|
|
}
|
|
|
|
// EncodeInto is like Encode but uses a user-supplied buffer instead of allocating
|
|
// a new one.
|
|
func EncodeInto(buf *[]byte, val interface{}, opts Options) error {
|
|
err := encodeInto(buf, val, opts)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
*buf = encodeFinish(*buf, opts)
|
|
return err
|
|
}
|
|
|
|
func encodeInto(buf *[]byte, val interface{}, opts Options) error {
|
|
stk := newStack()
|
|
efv := rt.UnpackEface(val)
|
|
err := encodeTypedPointer(buf, efv.Type, &efv.Value, stk, uint64(opts))
|
|
|
|
/* return the stack into pool */
|
|
if err != nil {
|
|
resetStack(stk)
|
|
}
|
|
freeStack(stk)
|
|
|
|
/* avoid GC ahead */
|
|
runtime.KeepAlive(buf)
|
|
runtime.KeepAlive(efv)
|
|
return err
|
|
}
|
|
|
|
func encodeFinish(buf []byte, opts Options) []byte {
|
|
if opts & EscapeHTML != 0 {
|
|
buf = HTMLEscape(nil, buf)
|
|
}
|
|
if opts & ValidateString != 0 && !utf8.Validate(buf) {
|
|
buf = utf8.CorrectWith(nil, buf, `\ufffd`)
|
|
}
|
|
return buf
|
|
}
|
|
|
|
var typeByte = rt.UnpackType(reflect.TypeOf(byte(0)))
|
|
|
|
// HTMLEscape appends to dst the JSON-encoded src with <, >, &, U+2028 and U+2029
|
|
// characters inside string literals changed to \u003c, \u003e, \u0026, \u2028, \u2029
|
|
// so that the JSON will be safe to embed inside HTML <script> tags.
|
|
// For historical reasons, web browsers don't honor standard HTML
|
|
// escaping within <script> tags, so an alternative JSON encoding must
|
|
// be used.
|
|
func HTMLEscape(dst []byte, src []byte) []byte {
|
|
return htmlEscape(dst, src)
|
|
}
|
|
|
|
// EncodeIndented is like Encode but applies Indent to format the output.
|
|
// Each JSON element in the output will begin on a new line beginning with prefix
|
|
// followed by one or more copies of indent according to the indentation nesting.
|
|
func EncodeIndented(val interface{}, prefix string, indent string, opts Options) ([]byte, error) {
|
|
var err error
|
|
var out []byte
|
|
var buf *bytes.Buffer
|
|
|
|
/* encode into the buffer */
|
|
out = newBytes()
|
|
err = EncodeInto(&out, val, opts)
|
|
|
|
/* check for errors */
|
|
if err != nil {
|
|
freeBytes(out)
|
|
return nil, err
|
|
}
|
|
|
|
/* indent the JSON */
|
|
buf = newBuffer()
|
|
err = json.Indent(buf, out, prefix, indent)
|
|
|
|
/* check for errors */
|
|
if err != nil {
|
|
freeBytes(out)
|
|
freeBuffer(buf)
|
|
return nil, err
|
|
}
|
|
|
|
/* copy to the result buffer */
|
|
ret := make([]byte, buf.Len())
|
|
copy(ret, buf.Bytes())
|
|
|
|
/* return the buffers into pool */
|
|
freeBytes(out)
|
|
freeBuffer(buf)
|
|
return ret, nil
|
|
}
|
|
|
|
// Pretouch compiles vt ahead-of-time to avoid JIT compilation on-the-fly, in
|
|
// order to reduce the first-hit latency.
|
|
//
|
|
// Opts are the compile options, for example, "option.WithCompileRecursiveDepth" is
|
|
// a compile option to set the depth of recursive compile for the nested struct type.
|
|
func Pretouch(vt reflect.Type, opts ...option.CompileOption) error {
|
|
cfg := option.DefaultCompileOptions()
|
|
for _, opt := range opts {
|
|
opt(&cfg)
|
|
break
|
|
}
|
|
return pretouchRec(map[reflect.Type]uint8{vt: 0}, cfg)
|
|
}
|
|
|
|
// Valid validates json and returns first non-blank character position,
|
|
// if it is only one valid json value.
|
|
// Otherwise returns invalid character position using start.
|
|
//
|
|
// Note: it does not check for the invalid UTF-8 characters.
|
|
func Valid(data []byte) (ok bool, start int) {
|
|
n := len(data)
|
|
if n == 0 {
|
|
return false, -1
|
|
}
|
|
s := rt.Mem2Str(data)
|
|
p := 0
|
|
m := types.NewStateMachine()
|
|
ret := native.ValidateOne(&s, &p, m)
|
|
types.FreeStateMachine(m)
|
|
|
|
if ret < 0 {
|
|
return false, p-1
|
|
}
|
|
|
|
/* check for trailing spaces */
|
|
for ;p < n; p++ {
|
|
if (types.SPACE_MASK & (1 << data[p])) == 0 {
|
|
return false, p
|
|
}
|
|
}
|
|
|
|
return true, ret
|
|
} |