2
0
Fork 0
mirror of https://github.com/ii64/sonic.git synced 2026-06-20 16:45:22 +08:00
sonic/encoder/encoder_test.go

546 lines
No EOL
15 KiB
Go

/*
* Copyright 2021 ByteDance Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package encoder
import (
`bytes`
`encoding`
`encoding/json`
`runtime`
`runtime/debug`
`strconv`
`sync`
`testing`
`time`
`github.com/bytedance/sonic/internal/rt`
`github.com/stretchr/testify/require`
)
func TestMain(m *testing.M) {
go func () {
if !debugAsyncGC {
return
}
println("Begin GC looping...")
for {
runtime.GC()
debug.FreeOSMemory()
}
println("stop GC looping!")
}()
time.Sleep(time.Millisecond)
m.Run()
}
func TestGC(t *testing.T) {
if debugSyncGC {
return
}
out, err := Encode(_GenericValue, 0)
if err != nil {
t.Fatal(err)
}
n := len(out)
wg := &sync.WaitGroup{}
N := 10000
for i:=0; i<N; i++ {
wg.Add(1)
go func (wg *sync.WaitGroup, size int) {
defer wg.Done()
out, err := Encode(_GenericValue, 0)
if err != nil {
t.Fatal(err)
}
if len(out) != size {
t.Fatal(len(out), size)
}
runtime.GC()
}(wg, n)
}
wg.Wait()
}
type sample struct {
M map[string]interface{}
S []interface{}
A [0]interface{}
MP *map[string]interface{}
SP *[]interface{}
AP *[0]interface{}
}
func BenchmarkOptionSliceOrMapNoNull(b *testing.B) {
b.Run("true", func (b *testing.B) {
obj := sample{}
_, err := Encode(obj, NoNullSliceOrMap)
if err != nil {
b.Fatal(err)
}
b.ResetTimer()
for i:=0;i<b.N;i++{
_, _ = Encode(obj, NoNullSliceOrMap)
}
})
b.Run("false", func (b *testing.B) {
obj2 := sample{}
_, err := Encode(obj2, 0)
if err != nil {
b.Fatal(err)
}
for i:=0;i<b.N;i++{
_, _ = Encode(obj2, 0)
}
})
}
func runEncoderTest(t *testing.T, fn func(string)string, exp string, arg string) {
require.Equal(t, exp, fn(arg))
}
func TestEncoder_String(t *testing.T) {
runEncoderTest(t, Quote, `""` , "")
runEncoderTest(t, Quote, `"hello, world"` , "hello, world")
runEncoderTest(t, Quote, `"hello啊啊啊aa"` , "hello啊啊啊aa")
runEncoderTest(t, Quote, `"hello\\\"world"` , "hello\\\"world")
runEncoderTest(t, Quote, `"hello\n\tworld"` , "hello\n\tworld")
runEncoderTest(t, Quote, `"hello\u0000\u0001world"` , "hello\x00\x01world")
runEncoderTest(t, Quote, `"hello\u0000\u0001world"` , "hello\x00\x01world")
runEncoderTest(t, Quote, `"Cartoonist, Illustrator, and T-Shirt connoisseur"` , "Cartoonist, Illustrator, and T-Shirt connoisseur")
}
type StringStruct struct {
X *int `json:"x,string,omitempty"`
Y []int `json:"y"`
Z json.Number `json:"z,string"`
W string `json:"w,string"`
}
func TestEncoder_FieldStringize(t *testing.T) {
x := 12345
v := StringStruct{X: &x, Y: []int{1, 2, 3}, Z: "4567456", W: "asdf"}
r, e := Encode(v, 0)
require.NoError(t, e)
println(string(r))
}
func TestEncodeErrorAndScratchBuf(t *testing.T) {
var obj = map[string]interface{}{
"a": json.RawMessage(" [} "),
}
buf := make([]byte, 0, 10)
_ = EncodeInto(&buf, obj, 0)
if len(buf) < 0 || len(buf) > 10 {
t.Fatal()
}
}
type MarshalerImpl struct {
X int
}
func (self *MarshalerImpl) MarshalJSON() ([]byte, error) {
ret := []byte(strconv.Itoa(self.X))
return append(ret, " "...), nil
}
type MarshalerStruct struct {
V MarshalerImpl
}
type MarshalerErrorStruct struct {
V MarshalerImpl
}
func (self *MarshalerErrorStruct) MarshalJSON() ([]byte, error) {
return []byte(`[""] {`), nil
}
type RawMessageStruct struct {
X json.RawMessage
}
type TextMarshalerImpl struct {
X string
}
func (self *TextMarshalerImpl) MarshalText() ([]byte, error) {
return []byte(self.X), nil
}
type TextMarshalerImplV struct {
X string
}
func (self TextMarshalerImplV) MarshalText() ([]byte, error) {
return []byte(self.X), nil
}
type TextMarshalerStruct struct {
V TextMarshalerImpl
}
func TestTextMarshalTextKey_SortKeys(t *testing.T) {
v := map[*TextMarshalerImpl]string{
{"b"}: "b",
{"c"}: "c",
{"a"}: "a",
}
ret, err := Encode(v, SortMapKeys)
require.NoError(t, err)
require.Equal(t, `{"a":"a","b":"b","c":"c"}`, string(ret))
v2 := map[TextMarshalerImplV]string{
{"b"}: "b",
{"c"}: "c",
{"a"}: "a",
}
ret, err = Encode(v2, SortMapKeys)
require.NoError(t, err)
require.Equal(t, `{"a":"a","b":"b","c":"c"}`, string(ret))
v3 := map[encoding.TextMarshaler]string{
TextMarshalerImplV{"b"}: "b",
&TextMarshalerImpl{"c"}: "c",
TextMarshalerImplV{"a"}: "a",
}
ret, err = Encode(v3, SortMapKeys)
require.NoError(t, err)
require.Equal(t, `{"a":"a","b":"b","c":"c"}`, string(ret))
}
func TestEncoder_EscapeHTML(t *testing.T) {
// test data from libfuzzer
test := []string{
"&&&&&&&&&&&&&&&&&&&&&&&\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2\xe2&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&",
"{\"\"\u2028\x94\xe2\x00\x00\x00\x00\x00\x00\x00\x00\u2028\x80\u2028\x80\u2028\xe2\u2028\x8a\u2028⑀\xa8\x8a\xa8\xe2\u2028\xe2\u2028\xe2\u2028\xe2\u2000\x8d\xe2\u2028\xe2\u2028\xe2\xe2\xa8\"}",
}
for _, s := range(test) {
data := []byte(s)
sdst := HTMLEscape(nil, data)
var dst bytes.Buffer
json.HTMLEscape(&dst, data)
require.Equal(t, string(sdst), dst.String())
}
}
func TestEncoder_Marshal_EscapeHTML_LargeJson(t *testing.T) {
buf1, err1 := Encode(&_BindingValue, SortMapKeys | EscapeHTML)
require.NoError(t, err1)
buf2, err2 :=json.Marshal(&_BindingValue)
require.NoError(t, err2)
require.Equal(t, buf1, buf2)
}
var _GenericValue interface{}
var _BindingValue TwitterStruct
func init() {
_ = json.Unmarshal([]byte(TwitterJson), &_GenericValue)
_ = json.Unmarshal([]byte(TwitterJson), &_BindingValue)
}
func TestEncoder_Generic(t *testing.T) {
v, e := Encode(_GenericValue, 0)
require.NoError(t, e)
println(string(v))
}
func TestEncoder_Binding(t *testing.T) {
v, e := Encode(_BindingValue, 0)
require.NoError(t, e)
println(string(v))
}
func TestEncoder_MapSortKey(t *testing.T) {
m := map[string]string {
"C": "third",
"D": "forth",
"A": "first",
"F": "sixth",
"E": "fifth",
"B": "second",
}
v, e := Encode(m, SortMapKeys)
require.NoError(t, e)
require.Equal(t, `{"A":"first","B":"second","C":"third","D":"forth","E":"fifth","F":"sixth"}`, string(v))
}
func BenchmarkEncoder_Generic_Sonic(b *testing.B) {
_, _ = Encode(_GenericValue, SortMapKeys | EscapeHTML | CompactMarshaler)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
for i := 0; i < b.N; i++ {
_, _ = Encode(_GenericValue, SortMapKeys | EscapeHTML | CompactMarshaler)
}
}
func BenchmarkEncoder_Generic_Sonic_Fast(b *testing.B) {
_, _ = Encode(_GenericValue, 0)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
for i := 0; i < b.N; i++ {
_, _ = Encode(_GenericValue, 0)
}
}
func BenchmarkEncoder_Generic_StdLib(b *testing.B) {
_, _ = json.Marshal(_GenericValue)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
for i := 0; i < b.N; i++ {
_, _ = json.Marshal(_GenericValue)
}
}
func BenchmarkEncoder_Binding_Sonic(b *testing.B) {
_, _ = Encode(&_BindingValue, SortMapKeys | EscapeHTML | CompactMarshaler)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
for i := 0; i < b.N; i++ {
_, _ = Encode(&_BindingValue, SortMapKeys | EscapeHTML | CompactMarshaler)
}
}
func BenchmarkEncoder_Binding_Sonic_Fast(b *testing.B) {
_, _ = Encode(&_BindingValue, NoQuoteTextMarshaler)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
for i := 0; i < b.N; i++ {
_, _ = Encode(&_BindingValue, NoQuoteTextMarshaler)
}
}
func BenchmarkEncoder_Binding_StdLib(b *testing.B) {
_, _ = json.Marshal(&_BindingValue)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
for i := 0; i < b.N; i++ {
_, _ = json.Marshal(&_BindingValue)
}
}
func BenchmarkEncoder_Parallel_Generic_Sonic(b *testing.B) {
_, _ = Encode(_GenericValue, SortMapKeys | EscapeHTML | CompactMarshaler)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
b.RunParallel(func(pb *testing.PB) {
for pb.Next() {
_, _ = Encode(_GenericValue, SortMapKeys | EscapeHTML | CompactMarshaler)
}
})
}
func BenchmarkEncoder_Parallel_Generic_Sonic_Fast(b *testing.B) {
_, _ = Encode(_GenericValue, NoQuoteTextMarshaler)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
b.RunParallel(func(pb *testing.PB) {
for pb.Next() {
_, _ = Encode(_GenericValue, NoQuoteTextMarshaler)
}
})
}
func BenchmarkEncoder_Parallel_Generic_StdLib(b *testing.B) {
_, _ = json.Marshal(_GenericValue)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
b.RunParallel(func(pb *testing.PB) {
for pb.Next() {
_, _ = json.Marshal(_GenericValue)
}
})
}
func BenchmarkEncoder_Parallel_Binding_Sonic(b *testing.B) {
_, _ = Encode(&_BindingValue, SortMapKeys | EscapeHTML | CompactMarshaler)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
b.RunParallel(func(pb *testing.PB) {
for pb.Next() {
_, _ = Encode(&_BindingValue, SortMapKeys | EscapeHTML | CompactMarshaler)
}
})
}
func BenchmarkEncoder_Parallel_Binding_Sonic_Fast(b *testing.B) {
_, _ = Encode(&_BindingValue, NoQuoteTextMarshaler)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
b.RunParallel(func(pb *testing.PB) {
for pb.Next() {
_, _ = Encode(&_BindingValue, NoQuoteTextMarshaler)
}
})
}
func BenchmarkEncoder_Parallel_Binding_StdLib(b *testing.B) {
_, _ = json.Marshal(&_BindingValue)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
b.RunParallel(func(pb *testing.PB) {
for pb.Next() {
_, _ = json.Marshal(&_BindingValue)
}
})
}
func BenchmarkHTMLEscape_Sonic(b *testing.B) {
jsonByte := []byte(TwitterJson)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
var buf []byte
for i := 0; i < b.N; i++ {
buf = HTMLEscape(nil, jsonByte)
}
_ = buf
}
func BenchmarkHTMLEscape_StdLib(b *testing.B) {
jsonByte := []byte(TwitterJson)
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
var buf []byte
for i := 0; i < b.N; i++ {
out := bytes.NewBuffer(make([]byte, 0, len(TwitterJson) * 6 / 5))
json.HTMLEscape(out, jsonByte)
buf = out.Bytes()
}
_ = buf
}
func BenchmarkValidate_Sonic(b *testing.B) {
var data = rt.Str2Mem(TwitterJson)
ok, s := Valid(data)
if !ok {
b.Fatal(s)
}
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
for i:=0; i<b.N; i++ {
_, _ = Valid(data)
}
}
func BenchmarkValidate_Std(b *testing.B) {
var data = rt.Str2Mem(TwitterJson)
if !json.Valid(data) {
b.Fatal()
}
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
for i:=0; i<b.N; i++ {
_ = json.Valid(data)
}
}
func BenchmarkCompact_Std(b *testing.B) {
var data = rt.Str2Mem(TwitterJson)
var dst = bytes.NewBuffer(nil)
if err := json.Compact(dst, data); err != nil {
b.Fatal(err)
}
b.SetBytes(int64(len(TwitterJson)))
b.ResetTimer()
for i:=0; i<b.N; i++ {
dst.Reset()
_ = json.Compact(dst, data)
}
}
type f64Bench struct {
name string
float float64
}
func BenchmarkEncode_Float64(b *testing.B) {
var bench = []f64Bench{
{"Zero", 0},
{"ShortDecimal", 1000},
{"Decimal", 33909},
{"Float", 339.7784},
{"Exp", -5.09e75},
{"NegExp", -5.11e-95},
{"LongExp", 1.234567890123456e-78},
{"Big", 123456789123456789123456789},
}
maxUint := "18446744073709551615"
for i := 1; i <= len(maxUint); i++ {
name := strconv.FormatInt(int64(i), 10) + "-Digs"
num, _ := strconv.ParseUint(string(maxUint[:i]), 10, 64)
bench = append(bench, f64Bench{name, float64(num)})
}
for _, c := range bench {
libs := []struct {
name string
test func(*testing.B)
}{{
name: "StdLib",
test: func(b *testing.B) { _, _ = json.Marshal(c.float); for i := 0; i < b.N; i++ { _, _ = json.Marshal(c.float) }},
}, {
name: "Sonic",
test: func(b *testing.B) { _, _ = Encode(c.float, 0); for i := 0; i < b.N; i++ { _, _ = Encode(c.float, 0) }},
}}
for _, lib := range libs {
name := lib.name + "_" + c.name
b.Run(name, lib.test)
}
}
}
type f32Bench struct {
name string
float float32
}
func BenchmarkEncode_Float32(b *testing.B) {
var bench = []f32Bench{
{"Zero", 0},
{"ShortDecimal", 1000},
{"Decimal", 33909},
{"ExactFraction", 3.375},
{"Point", 339.7784},
{"Exp", -5.09e25},
{"NegExp", -5.11e-25},
{"Shortest", 1.234567e-8},
}
maxUint := "18446744073709551615"
for i := 1; i <= len(maxUint); i++ {
name := strconv.FormatInt(int64(i), 10) + "-Digs"
num, _ := strconv.ParseUint(string(maxUint[:i]), 10, 64)
bench = append(bench, f32Bench{name, float32(num)})
}
for _, c := range bench {
libs := []struct {
name string
test func(*testing.B)
}{{
name: "StdLib",
test: func(b *testing.B) { _, _ = json.Marshal(c.float); for i := 0; i < b.N; i++ { _, _ = json.Marshal(c.float) }},
}, {
name: "Sonic",
test: func(b *testing.B) { _, _ = Encode(c.float, 0); for i := 0; i < b.N; i++ { _, _ = Encode(c.float, 0) }},
}}
for _, lib := range libs {
name := lib.name + "_" + c.name
b.Run(name, lib.test)
}
}
}