| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761
277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385 |
- // Copyright (c) 2012-2015 Ugorji Nwoke. All rights reserved.
- // Use of this source code is governed by a MIT license found in the LICENSE file.
- package codec
- import (
- "encoding"
- "fmt"
- "io"
- "reflect"
- "sort"
- "sync"
- )
// defEncByteBufSize is the length of the byte buffer that ResetBytes
// allocates when the caller hands it a nil output slice.
// Size reference for the shift amount: 4:16, 6:64, 8:256, 10:1024.
const defEncByteBufSize = 1 << 6
// AsSymbolFlag defines what should be encoded as symbols.
type AsSymbolFlag uint8

// Only AsSymbolDefault is declared with the AsSymbolFlag type; the remaining
// constants in this group are declared without an explicit type.
const (
	// AsSymbolDefault is default.
	// Currently, this means only encode struct field names as symbols.
	// The default is subject to change.
	//
	// Its value is 0 (iota on the first line of the group).
	AsSymbolDefault AsSymbolFlag = iota

	// AsSymbolAll means encode anything which could be a symbol as a symbol.
	AsSymbolAll = 0xfe

	// AsSymbolNone means do not encode anything as a symbol.
	//
	// iota is 2 on this line, so the value is 1<<2 (4). The two flags that
	// follow repeat the same expression and are therefore 8 and 16.
	AsSymbolNone = 1 << iota

	// AsSymbolMapStringKeysFlag means encode keys in map[string]XXX as symbols.
	AsSymbolMapStringKeysFlag

	// AsSymbolStructFieldNameFlag means encode struct field names as symbols.
	AsSymbolStructFieldNameFlag
)
// encWriter abstracts writing to a byte array or to an io.Writer.
//
// None of the methods return an error. The implementations in this file
// either cannot fail (bytesEncWriter) or panic on failure (ioEncWriter).
type encWriter interface {
	// writeb writes all of bs.
	writeb(bs []byte)
	// writestr writes all the bytes of s.
	writestr(s string)
	// writen1, writen2, writen4 and writen5 write a fixed number of
	// bytes, in argument order.
	writen1(b1 byte)
	writen2(b1, b2 byte)
	writen4(b1, b2, b3, b4 byte)
	writen5(b1, b2, b3, b4, b5 byte)
	// atEndOfEncode is a hook that lets the writer publish its output;
	// bytesEncWriter uses it to store the encoded bytes in the caller's slice.
	atEndOfEncode()
}
// encDriver abstracts the actual codec (binc vs msgpack, etc).
//
// The Encoder obtains its driver from Handle.newEncDriver and routes every
// primitive and container-start emission through it.
type encDriver interface {
	// IsBuiltinType(rt uintptr) bool

	// EncodeBuiltin encodes v, whose type id is rt.
	EncodeBuiltin(rt uintptr, v interface{})
	EncodeNil()
	EncodeInt(i int64)
	EncodeUint(i uint64)
	EncodeBool(b bool)
	EncodeFloat32(f float32)
	EncodeFloat64(f float64)
	// encodeExtPreamble(xtag byte, length int)
	EncodeRawExt(re *RawExt, e *Encoder)
	EncodeExt(v interface{}, xtag uint64, ext Ext, e *Encoder)
	// EncodeArrayStart and EncodeMapStart are called with the number of
	// elements (respectively key/value pairs) that will follow.
	EncodeArrayStart(length int)
	EncodeMapStart(length int)
	EncodeString(c charEncoding, v string)
	EncodeSymbol(v string)
	EncodeStringBytes(c charEncoding, v []byte)
	//TODO
	//encBignum(f *big.Int)
	//encStringRunes(c charEncoding, v []rune)

	// reset is called by Encoder.Reset and Encoder.ResetBytes each time the
	// Encoder is pointed at a new output.
	reset()
}
// encDriverAsis is an optional interface for drivers.
//
// newEncoder probes the driver for it with a type assertion and keeps the
// result (nil when the driver does not implement it) in Encoder.as.
type encDriverAsis interface {
	// EncodeAsis receives bytes that are already encoded.
	// NOTE(review): presumably the driver writes v to the stream unchanged — confirm.
	EncodeAsis(v []byte)
}
// encNoSeparator provides a no-op EncodeEnd method.
type encNoSeparator struct{}

// EncodeEnd does nothing.
func (encNoSeparator) EncodeEnd() {}
// ioEncWriterWriter is the set of write methods that ioEncWriter needs from
// its destination: single byte, string and byte-slice writes.
//
// Encoder.Reset uses a writer directly when it already satisfies this
// interface, and otherwise wraps it in a simpleIoEncWriterWriter.
type ioEncWriterWriter interface {
	WriteByte(c byte) error
	WriteString(s string) (n int, err error)
	Write(p []byte) (n int, err error)
}
// ioEncStringWriter is implemented by writers that can write a string
// directly. simpleIoEncWriterWriter delegates WriteString to it when the
// wrapped writer provides it.
type ioEncStringWriter interface {
	WriteString(s string) (n int, err error)
}
// EncodeOptions captures the configuration options that affect encoding.
type EncodeOptions struct {
	// Encode a struct as an array, and not as a map
	StructToArray bool

	// Canonical representation means that encoding a value will always result in the same
	// sequence of bytes.
	//
	// This only affects maps, as the iteration order for maps is random.
	//
	// The implementation MAY use the natural sort order for the map keys if possible:
	//
	//     - If there is a natural sort order (ie for number, bool, string or []byte keys),
	//       then the map keys are first sorted in natural order and then written
	//       with corresponding map values to the stream.
	//     - If there is no natural sort order, then the map keys will first be
	//       encoded into []byte, and then sorted,
	//       before writing the sorted keys and the corresponding map values to the stream.
	//
	Canonical bool

	// CheckCircularRef controls whether we check for circular references
	// and error fast during an encode.
	//
	// If enabled, an error is received if a pointer to a struct
	// references itself either directly or through one of its fields (iteratively).
	//
	// This is opt-in, as there may be a performance hit to checking circular references.
	CheckCircularRef bool

	// RecursiveEmptyCheck controls whether we descend into interfaces, structs and pointers
	// when checking if a value is empty.
	//
	// Note that this may make OmitEmpty more expensive, as it incurs a lot more reflect calls.
	RecursiveEmptyCheck bool

	// Raw controls whether we encode Raw values.
	// This is a "dangerous" option and must be explicitly set.
	// If set, we blindly encode Raw values as-is, without checking
	// if they are a correct representation of a value in that format.
	// If unset, we error out.
	Raw bool

	// AsSymbols defines what should be encoded as symbols.
	//
	// Encoding as symbols can reduce the encoded size significantly.
	//
	// However, during encoding, each string to be encoded as a symbol must
	// be checked to see if it has been seen before. Consequently, encoding time
	// will increase if using symbols, because string comparisons have a clear cost.
	//
	// Sample values:
	//   AsSymbolNone
	//   AsSymbolAll
	//   AsSymbolMapStringKeysFlag
	//   AsSymbolMapStringKeysFlag | AsSymbolStructFieldNameFlag
	AsSymbols AsSymbolFlag
}
- // ---------------------------------------------
- type simpleIoEncWriterWriter struct {
- w io.Writer
- bw io.ByteWriter
- sw ioEncStringWriter
- bs [1]byte
- }
- func (o *simpleIoEncWriterWriter) WriteByte(c byte) (err error) {
- if o.bw != nil {
- return o.bw.WriteByte(c)
- }
- // _, err = o.w.Write([]byte{c})
- o.bs[0] = c
- _, err = o.w.Write(o.bs[:])
- return
- }
- func (o *simpleIoEncWriterWriter) WriteString(s string) (n int, err error) {
- if o.sw != nil {
- return o.sw.WriteString(s)
- }
- // return o.w.Write([]byte(s))
- return o.w.Write(bytesView(s))
- }
- func (o *simpleIoEncWriterWriter) Write(p []byte) (n int, err error) {
- return o.w.Write(p)
- }
- // ----------------------------------------
- // ioEncWriter implements encWriter and can write to an io.Writer implementation
- type ioEncWriter struct {
- w ioEncWriterWriter
- s simpleIoEncWriterWriter
- // x [8]byte // temp byte array re-used internally for efficiency
- }
- func (z *ioEncWriter) writeb(bs []byte) {
- if len(bs) == 0 {
- return
- }
- n, err := z.w.Write(bs)
- if err != nil {
- panic(err)
- }
- if n != len(bs) {
- panic(fmt.Errorf("incorrect num bytes written. Expecting: %v, Wrote: %v", len(bs), n))
- }
- }
- func (z *ioEncWriter) writestr(s string) {
- if len(s) == 0 {
- return
- }
- n, err := z.w.WriteString(s)
- if err != nil {
- panic(err)
- }
- if n != len(s) {
- panic(fmt.Errorf("incorrect num bytes written. Expecting: %v, Wrote: %v", len(s), n))
- }
- }
- func (z *ioEncWriter) writen1(b byte) {
- if err := z.w.WriteByte(b); err != nil {
- panic(err)
- }
- }
- func (z *ioEncWriter) writen2(b1, b2 byte) {
- for _, b := range [...]byte{b1, b2} {
- if err := z.w.WriteByte(b); err != nil {
- panic(err)
- }
- }
- }
- func (z *ioEncWriter) writen4(b1, b2, b3, b4 byte) {
- for _, b := range [...]byte{b1, b2, b3, b4} {
- if err := z.w.WriteByte(b); err != nil {
- panic(err)
- }
- }
- }
- func (z *ioEncWriter) writen5(b1, b2, b3, b4, b5 byte) {
- for _, b := range [...]byte{b1, b2, b3, b4, b5} {
- if err := z.w.WriteByte(b); err != nil {
- panic(err)
- }
- }
- }
- func (z *ioEncWriter) atEndOfEncode() {}
- // ----------------------------------------
- // bytesEncWriter implements encWriter and can write to an byte slice.
- // It is used by Marshal function.
- type bytesEncWriter struct {
- b []byte
- c int // cursor
- out *[]byte // write out on atEndOfEncode
- }
- func (z *bytesEncWriter) writeb(s []byte) {
- slen := len(s)
- if slen == 0 {
- return
- }
- oc, a := z.growNoAlloc(slen)
- if a {
- z.growAlloc(slen, oc)
- }
- copy(z.b[oc:], s)
- }
- func (z *bytesEncWriter) writestr(s string) {
- slen := len(s)
- if slen == 0 {
- return
- }
- oc, a := z.growNoAlloc(slen)
- if a {
- z.growAlloc(slen, oc)
- }
- copy(z.b[oc:], s)
- }
- func (z *bytesEncWriter) writen1(b1 byte) {
- oc, a := z.growNoAlloc(1)
- if a {
- z.growAlloc(1, oc)
- }
- z.b[oc] = b1
- }
- func (z *bytesEncWriter) writen2(b1, b2 byte) {
- oc, a := z.growNoAlloc(2)
- if a {
- z.growAlloc(2, oc)
- }
- z.b[oc+1] = b2
- z.b[oc] = b1
- }
- func (z *bytesEncWriter) writen4(b1, b2, b3, b4 byte) {
- oc, a := z.growNoAlloc(4)
- if a {
- z.growAlloc(4, oc)
- }
- z.b[oc+3] = b4
- z.b[oc+2] = b3
- z.b[oc+1] = b2
- z.b[oc] = b1
- }
- func (z *bytesEncWriter) writen5(b1, b2, b3, b4, b5 byte) {
- oc, a := z.growNoAlloc(5)
- if a {
- z.growAlloc(5, oc)
- }
- z.b[oc+4] = b5
- z.b[oc+3] = b4
- z.b[oc+2] = b3
- z.b[oc+1] = b2
- z.b[oc] = b1
- }
- func (z *bytesEncWriter) atEndOfEncode() {
- *(z.out) = z.b[:z.c]
- }
- // have a growNoalloc(n int), which can be inlined.
- // if allocation is needed, then call growAlloc(n int)
- func (z *bytesEncWriter) growNoAlloc(n int) (oldcursor int, allocNeeded bool) {
- oldcursor = z.c
- z.c = z.c + n
- if z.c > len(z.b) {
- if z.c > cap(z.b) {
- allocNeeded = true
- } else {
- z.b = z.b[:cap(z.b)]
- }
- }
- return
- }
- func (z *bytesEncWriter) growAlloc(n int, oldcursor int) {
- // appendslice logic (if cap < 1024, *2, else *1.25): more expensive. many copy calls.
- // bytes.Buffer model (2*cap + n): much better
- // bs := make([]byte, 2*cap(z.b)+n)
- bs := make([]byte, growCap(cap(z.b), 1, n))
- copy(bs, z.b[:oldcursor])
- z.b = bs
- }
- // ---------------------------------------------
- func (e *Encoder) builtin(f *codecFnInfo, rv reflect.Value) {
- e.e.EncodeBuiltin(f.ti.rtid, rv2i(rv))
- }
- func (e *Encoder) raw(f *codecFnInfo, rv reflect.Value) {
- e.rawBytes(rv2i(rv).(Raw))
- }
- func (e *Encoder) rawExt(f *codecFnInfo, rv reflect.Value) {
- // rev := rv2i(rv).(RawExt)
- // e.e.EncodeRawExt(&rev, e)
- var re *RawExt
- if rv.CanAddr() {
- re = rv2i(rv.Addr()).(*RawExt)
- } else {
- rev := rv2i(rv).(RawExt)
- re = &rev
- }
- e.e.EncodeRawExt(re, e)
- }
- func (e *Encoder) ext(f *codecFnInfo, rv reflect.Value) {
- // if this is a struct|array and it was addressable, then pass the address directly (not the value)
- if k := rv.Kind(); (k == reflect.Struct || k == reflect.Array) && rv.CanAddr() {
- rv = rv.Addr()
- }
- e.e.EncodeExt(rv2i(rv), f.xfTag, f.xfFn, e)
- }
- func (e *Encoder) getValueForMarshalInterface(rv reflect.Value, indir int8) (v interface{}, proceed bool) {
- if indir == 0 {
- v = rv2i(rv)
- } else if indir == -1 {
- // If a non-pointer was passed to Encode(), then that value is not addressable.
- // Take addr if addressable, else copy value to an addressable value.
- if rv.CanAddr() {
- v = rv2i(rv.Addr())
- } else {
- rv2 := reflect.New(rv.Type())
- rv2.Elem().Set(rv)
- v = rv2i(rv2)
- }
- } else {
- for j := int8(0); j < indir; j++ {
- if rv.IsNil() {
- e.e.EncodeNil()
- return
- }
- rv = rv.Elem()
- }
- v = rv2i(rv)
- }
- return v, true
- }
- func (e *Encoder) selferMarshal(f *codecFnInfo, rv reflect.Value) {
- if v, proceed := e.getValueForMarshalInterface(rv, f.ti.csIndir); proceed {
- v.(Selfer).CodecEncodeSelf(e)
- }
- }
- func (e *Encoder) binaryMarshal(f *codecFnInfo, rv reflect.Value) {
- if v, proceed := e.getValueForMarshalInterface(rv, f.ti.bmIndir); proceed {
- bs, fnerr := v.(encoding.BinaryMarshaler).MarshalBinary()
- e.marshal(bs, fnerr, false, c_RAW)
- }
- }
- func (e *Encoder) textMarshal(f *codecFnInfo, rv reflect.Value) {
- if v, proceed := e.getValueForMarshalInterface(rv, f.ti.tmIndir); proceed {
- bs, fnerr := v.(encoding.TextMarshaler).MarshalText()
- e.marshal(bs, fnerr, false, c_UTF8)
- }
- }
- func (e *Encoder) jsonMarshal(f *codecFnInfo, rv reflect.Value) {
- if v, proceed := e.getValueForMarshalInterface(rv, f.ti.jmIndir); proceed {
- bs, fnerr := v.(jsonMarshaler).MarshalJSON()
- e.marshal(bs, fnerr, true, c_UTF8)
- }
- }
- func (e *Encoder) kBool(f *codecFnInfo, rv reflect.Value) {
- e.e.EncodeBool(rv.Bool())
- }
- func (e *Encoder) kString(f *codecFnInfo, rv reflect.Value) {
- e.e.EncodeString(c_UTF8, rv.String())
- }
- func (e *Encoder) kFloat64(f *codecFnInfo, rv reflect.Value) {
- e.e.EncodeFloat64(rv.Float())
- }
- func (e *Encoder) kFloat32(f *codecFnInfo, rv reflect.Value) {
- e.e.EncodeFloat32(float32(rv.Float()))
- }
- func (e *Encoder) kInt(f *codecFnInfo, rv reflect.Value) {
- e.e.EncodeInt(rv.Int())
- }
- func (e *Encoder) kUint(f *codecFnInfo, rv reflect.Value) {
- e.e.EncodeUint(rv.Uint())
- }
- func (e *Encoder) kInvalid(f *codecFnInfo, rv reflect.Value) {
- e.e.EncodeNil()
- }
- func (e *Encoder) kErr(f *codecFnInfo, rv reflect.Value) {
- e.errorf("unsupported kind %s, for %#v", rv.Kind(), rv)
- }
- func (e *Encoder) kSlice(f *codecFnInfo, rv reflect.Value) {
- ti := f.ti
- // array may be non-addressable, so we have to manage with care
- // (don't call rv.Bytes, rv.Slice, etc).
- // E.g. type struct S{B [2]byte};
- // Encode(S{}) will bomb on "panic: slice of unaddressable array".
- if f.seq != seqTypeArray {
- if rv.IsNil() {
- e.e.EncodeNil()
- return
- }
- // If in this method, then there was no extension function defined.
- // So it's okay to treat as []byte.
- if ti.rtid == uint8SliceTypId {
- e.e.EncodeStringBytes(c_RAW, rv.Bytes())
- return
- }
- }
- cr := e.cr
- rtelem := ti.rt.Elem()
- l := rv.Len()
- if ti.rtid == uint8SliceTypId || rtelem.Kind() == reflect.Uint8 {
- switch f.seq {
- case seqTypeArray:
- if rv.CanAddr() {
- e.e.EncodeStringBytes(c_RAW, rv.Slice(0, l).Bytes())
- } else {
- var bs []byte
- if l <= cap(e.b) {
- bs = e.b[:l]
- } else {
- bs = make([]byte, l)
- }
- reflect.Copy(reflect.ValueOf(bs), rv)
- e.e.EncodeStringBytes(c_RAW, bs)
- }
- return
- case seqTypeSlice:
- e.e.EncodeStringBytes(c_RAW, rv.Bytes())
- return
- }
- }
- if ti.rtid == uint8SliceTypId && f.seq == seqTypeChan {
- bs := e.b[:0]
- // do not use range, so that the number of elements encoded
- // does not change, and encoding does not hang waiting on someone to close chan.
- // for b := range rv2i(rv).(<-chan byte) { bs = append(bs, b) }
- ch := rv2i(rv).(<-chan byte)
- for i := 0; i < l; i++ {
- bs = append(bs, <-ch)
- }
- e.e.EncodeStringBytes(c_RAW, bs)
- return
- }
- if ti.mbs {
- if l%2 == 1 {
- e.errorf("mapBySlice requires even slice length, but got %v", l)
- return
- }
- e.e.EncodeMapStart(l / 2)
- } else {
- e.e.EncodeArrayStart(l)
- }
- if l > 0 {
- var fn *codecFn
- var recognizedVtyp = useLookupRecognizedTypes && isRecognizedRtidOrPtr(rt2id(rtelem))
- if !recognizedVtyp {
- for rtelem.Kind() == reflect.Ptr {
- rtelem = rtelem.Elem()
- }
- // if kind is reflect.Interface, do not pre-determine the
- // encoding type, because preEncodeValue may break it down to
- // a concrete type and kInterface will bomb.
- if rtelem.Kind() != reflect.Interface {
- fn = e.cf.get(rtelem, true, true)
- }
- }
- // TODO: Consider perf implication of encoding odd index values as symbols if type is string
- for j := 0; j < l; j++ {
- if cr != nil {
- if ti.mbs {
- if j%2 == 0 {
- cr.sendContainerState(containerMapKey)
- } else {
- cr.sendContainerState(containerMapValue)
- }
- } else {
- cr.sendContainerState(containerArrayElem)
- }
- }
- if f.seq == seqTypeChan {
- if rv2, ok2 := rv.Recv(); ok2 {
- if useLookupRecognizedTypes && recognizedVtyp {
- e.encode(rv2i(rv2))
- } else {
- e.encodeValue(rv2, fn, true)
- }
- } else {
- e.e.EncodeNil() // WE HAVE TO DO SOMETHING, so nil if nothing received.
- }
- } else {
- if useLookupRecognizedTypes && recognizedVtyp {
- e.encode(rv2i(rv.Index(j)))
- } else {
- e.encodeValue(rv.Index(j), fn, true)
- }
- }
- }
- }
- if cr != nil {
- if ti.mbs {
- cr.sendContainerState(containerMapEnd)
- } else {
- cr.sendContainerState(containerArrayEnd)
- }
- }
- }
- func (e *Encoder) kStructNoOmitempty(f *codecFnInfo, rv reflect.Value) {
- fti := f.ti
- cr := e.cr
- tisfi := fti.sfip
- toMap := !(fti.toArray || e.h.StructToArray)
- if toMap {
- tisfi = fti.sfi
- }
- ee := e.e
- sfn := structFieldNode{v: rv, update: false}
- if toMap {
- ee.EncodeMapStart(len(tisfi))
- // asSymbols := e.h.AsSymbols&AsSymbolStructFieldNameFlag != 0
- asSymbols := e.h.AsSymbols == AsSymbolDefault || e.h.AsSymbols&AsSymbolStructFieldNameFlag != 0
- if cr == nil {
- for _, si := range tisfi {
- if asSymbols {
- ee.EncodeSymbol(si.encName)
- } else {
- ee.EncodeString(c_UTF8, si.encName)
- }
- e.encodeValue(sfn.field(si), nil, true)
- }
- } else {
- for _, si := range tisfi {
- cr.sendContainerState(containerMapKey)
- if asSymbols {
- ee.EncodeSymbol(si.encName)
- } else {
- ee.EncodeString(c_UTF8, si.encName)
- }
- cr.sendContainerState(containerMapValue)
- e.encodeValue(sfn.field(si), nil, true)
- }
- cr.sendContainerState(containerMapEnd)
- }
- } else {
- ee.EncodeArrayStart(len(tisfi))
- if cr == nil {
- for _, si := range tisfi {
- e.encodeValue(sfn.field(si), nil, true)
- }
- } else {
- for _, si := range tisfi {
- cr.sendContainerState(containerArrayElem)
- e.encodeValue(sfn.field(si), nil, true)
- }
- cr.sendContainerState(containerArrayEnd)
- }
- }
- }
- func (e *Encoder) kStruct(f *codecFnInfo, rv reflect.Value) {
- fti := f.ti
- cr := e.cr
- tisfi := fti.sfip
- toMap := !(fti.toArray || e.h.StructToArray)
- // if toMap, use the sorted array. If toArray, use unsorted array (to match sequence in struct)
- if toMap {
- tisfi = fti.sfi
- }
- newlen := len(fti.sfi)
- ee := e.e
- // Use sync.Pool to reduce allocating slices unnecessarily.
- // The cost of sync.Pool is less than the cost of new allocation.
- //
- // Each element of the array pools one of encStructPool(8|16|32|64).
- // It allows the re-use of slices up to 64 in length.
- // A performance cost of encoding structs was collecting
- // which values were empty and should be omitted.
- // We needed slices of reflect.Value and string to collect them.
- // This shared pool reduces the amount of unnecessary creation we do.
- // The cost is that of locking sometimes, but sync.Pool is efficient
- // enough to reduce thread contention.
- var spool *sync.Pool
- var poolv interface{}
- var fkvs []stringRv
- if newlen <= 8 {
- spool, poolv = pool.stringRv8()
- fkvs = poolv.(*[8]stringRv)[:newlen]
- } else if newlen <= 16 {
- spool, poolv = pool.stringRv16()
- fkvs = poolv.(*[16]stringRv)[:newlen]
- } else if newlen <= 32 {
- spool, poolv = pool.stringRv32()
- fkvs = poolv.(*[32]stringRv)[:newlen]
- } else if newlen <= 64 {
- spool, poolv = pool.stringRv64()
- fkvs = poolv.(*[64]stringRv)[:newlen]
- } else if newlen <= 128 {
- spool, poolv = pool.stringRv128()
- fkvs = poolv.(*[128]stringRv)[:newlen]
- } else {
- fkvs = make([]stringRv, newlen)
- }
- newlen = 0
- var kv stringRv
- recur := e.h.RecursiveEmptyCheck
- sfn := structFieldNode{v: rv, update: false}
- for _, si := range tisfi {
- // kv.r = si.field(rv, false)
- kv.r = sfn.field(si)
- if toMap {
- if si.omitEmpty && isEmptyValue(kv.r, recur, recur) {
- continue
- }
- kv.v = si.encName
- } else {
- // use the zero value.
- // if a reference or struct, set to nil (so you do not output too much)
- if si.omitEmpty && isEmptyValue(kv.r, recur, recur) {
- switch kv.r.Kind() {
- case reflect.Struct, reflect.Interface, reflect.Ptr, reflect.Array, reflect.Map, reflect.Slice:
- kv.r = reflect.Value{} //encode as nil
- }
- }
- }
- fkvs[newlen] = kv
- newlen++
- }
- if toMap {
- ee.EncodeMapStart(newlen)
- // asSymbols := e.h.AsSymbols&AsSymbolStructFieldNameFlag != 0
- asSymbols := e.h.AsSymbols == AsSymbolDefault || e.h.AsSymbols&AsSymbolStructFieldNameFlag != 0
- if cr == nil {
- for j := 0; j < newlen; j++ {
- kv = fkvs[j]
- if asSymbols {
- ee.EncodeSymbol(kv.v)
- } else {
- ee.EncodeString(c_UTF8, kv.v)
- }
- e.encodeValue(kv.r, nil, true)
- }
- } else {
- for j := 0; j < newlen; j++ {
- kv = fkvs[j]
- cr.sendContainerState(containerMapKey)
- if asSymbols {
- ee.EncodeSymbol(kv.v)
- } else {
- ee.EncodeString(c_UTF8, kv.v)
- }
- cr.sendContainerState(containerMapValue)
- e.encodeValue(kv.r, nil, true)
- }
- cr.sendContainerState(containerMapEnd)
- }
- } else {
- ee.EncodeArrayStart(newlen)
- if cr == nil {
- for j := 0; j < newlen; j++ {
- e.encodeValue(fkvs[j].r, nil, true)
- }
- } else {
- for j := 0; j < newlen; j++ {
- cr.sendContainerState(containerArrayElem)
- e.encodeValue(fkvs[j].r, nil, true)
- }
- cr.sendContainerState(containerArrayEnd)
- }
- }
- // do not use defer. Instead, use explicit pool return at end of function.
- // defer has a cost we are trying to avoid.
- // If there is a panic and these slices are not returned, it is ok.
- if spool != nil {
- spool.Put(poolv)
- }
- }
- func (e *Encoder) kMap(f *codecFnInfo, rv reflect.Value) {
- ee := e.e
- if rv.IsNil() {
- ee.EncodeNil()
- return
- }
- l := rv.Len()
- ee.EncodeMapStart(l)
- cr := e.cr
- if l == 0 {
- if cr != nil {
- cr.sendContainerState(containerMapEnd)
- }
- return
- }
- var asSymbols bool
- // determine the underlying key and val encFn's for the map.
- // This eliminates some work which is done for each loop iteration i.e.
- // rv.Type(), ref.ValueOf(rt).Pointer(), then check map/list for fn.
- //
- // However, if kind is reflect.Interface, do not pre-determine the
- // encoding type, because preEncodeValue may break it down to
- // a concrete type and kInterface will bomb.
- var keyFn, valFn *codecFn
- ti := f.ti
- rtkey0 := ti.rt.Key()
- rtkey := rtkey0
- rtval0 := ti.rt.Elem()
- rtval := rtval0
- rtkeyid := rt2id(rtkey0)
- rtvalid := rt2id(rtval0)
- for rtval.Kind() == reflect.Ptr {
- rtval = rtval.Elem()
- }
- if rtval.Kind() != reflect.Interface {
- valFn = e.cf.get(rtval, true, true)
- }
- mks := rv.MapKeys()
- if e.h.Canonical {
- e.kMapCanonical(rtkey, rv, mks, valFn, asSymbols)
- if cr != nil {
- cr.sendContainerState(containerMapEnd)
- }
- return
- }
- var recognizedKtyp, recognizedVtyp bool
- var keyTypeIsString = rtkeyid == stringTypId
- if keyTypeIsString {
- asSymbols = e.h.AsSymbols&AsSymbolMapStringKeysFlag != 0
- } else {
- if useLookupRecognizedTypes {
- if recognizedKtyp = isRecognizedRtidOrPtr(rtkeyid); recognizedKtyp {
- goto LABEL1
- }
- }
- for rtkey.Kind() == reflect.Ptr {
- rtkey = rtkey.Elem()
- }
- if rtkey.Kind() != reflect.Interface {
- rtkeyid = rt2id(rtkey)
- keyFn = e.cf.get(rtkey, true, true)
- }
- }
- // for j, lmks := 0, len(mks); j < lmks; j++ {
- LABEL1:
- recognizedVtyp = useLookupRecognizedTypes && isRecognizedRtidOrPtr(rtvalid)
- for j := range mks {
- if cr != nil {
- cr.sendContainerState(containerMapKey)
- }
- if keyTypeIsString {
- if asSymbols {
- ee.EncodeSymbol(mks[j].String())
- } else {
- ee.EncodeString(c_UTF8, mks[j].String())
- }
- } else if useLookupRecognizedTypes && recognizedKtyp {
- e.encode(rv2i(mks[j]))
- } else {
- e.encodeValue(mks[j], keyFn, true)
- }
- if cr != nil {
- cr.sendContainerState(containerMapValue)
- }
- if useLookupRecognizedTypes && recognizedVtyp {
- e.encode(rv2i(rv.MapIndex(mks[j])))
- } else {
- e.encodeValue(rv.MapIndex(mks[j]), valFn, true)
- }
- }
- if cr != nil {
- cr.sendContainerState(containerMapEnd)
- }
- }
- func (e *Encoder) kMapCanonical(rtkey reflect.Type, rv reflect.Value, mks []reflect.Value, valFn *codecFn, asSymbols bool) {
- ee := e.e
- cr := e.cr
- // we previously did out-of-band if an extension was registered.
- // This is not necessary, as the natural kind is sufficient for ordering.
- // WHAT IS THIS? rtkeyid can never be a []uint8, per spec
- // if rtkeyid == uint8SliceTypId {
- // mksv := make([]bytesRv, len(mks))
- // for i, k := range mks {
- // v := &mksv[i]
- // v.r = k
- // v.v = k.Bytes()
- // }
- // sort.Sort(bytesRvSlice(mksv))
- // for i := range mksv {
- // if cr != nil {
- // cr.sendContainerState(containerMapKey)
- // }
- // ee.EncodeStringBytes(c_RAW, mksv[i].v)
- // if cr != nil {
- // cr.sendContainerState(containerMapValue)
- // }
- // e.encodeValue(rv.MapIndex(mksv[i].r), valFn, true)
- // }
- // return
- // }
- switch rtkey.Kind() {
- case reflect.Bool:
- mksv := make([]boolRv, len(mks))
- for i, k := range mks {
- v := &mksv[i]
- v.r = k
- v.v = k.Bool()
- }
- sort.Sort(boolRvSlice(mksv))
- for i := range mksv {
- if cr != nil {
- cr.sendContainerState(containerMapKey)
- }
- ee.EncodeBool(mksv[i].v)
- if cr != nil {
- cr.sendContainerState(containerMapValue)
- }
- e.encodeValue(rv.MapIndex(mksv[i].r), valFn, true)
- }
- case reflect.String:
- mksv := make([]stringRv, len(mks))
- for i, k := range mks {
- v := &mksv[i]
- v.r = k
- v.v = k.String()
- }
- sort.Sort(stringRvSlice(mksv))
- for i := range mksv {
- if cr != nil {
- cr.sendContainerState(containerMapKey)
- }
- if asSymbols {
- ee.EncodeSymbol(mksv[i].v)
- } else {
- ee.EncodeString(c_UTF8, mksv[i].v)
- }
- if cr != nil {
- cr.sendContainerState(containerMapValue)
- }
- e.encodeValue(rv.MapIndex(mksv[i].r), valFn, true)
- }
- case reflect.Uint8, reflect.Uint16, reflect.Uint32, reflect.Uint64, reflect.Uint, reflect.Uintptr:
- mksv := make([]uintRv, len(mks))
- for i, k := range mks {
- v := &mksv[i]
- v.r = k
- v.v = k.Uint()
- }
- sort.Sort(uintRvSlice(mksv))
- for i := range mksv {
- if cr != nil {
- cr.sendContainerState(containerMapKey)
- }
- ee.EncodeUint(mksv[i].v)
- if cr != nil {
- cr.sendContainerState(containerMapValue)
- }
- e.encodeValue(rv.MapIndex(mksv[i].r), valFn, true)
- }
- case reflect.Int8, reflect.Int16, reflect.Int32, reflect.Int64, reflect.Int:
- mksv := make([]intRv, len(mks))
- for i, k := range mks {
- v := &mksv[i]
- v.r = k
- v.v = k.Int()
- }
- sort.Sort(intRvSlice(mksv))
- for i := range mksv {
- if cr != nil {
- cr.sendContainerState(containerMapKey)
- }
- ee.EncodeInt(mksv[i].v)
- if cr != nil {
- cr.sendContainerState(containerMapValue)
- }
- e.encodeValue(rv.MapIndex(mksv[i].r), valFn, true)
- }
- case reflect.Float32:
- mksv := make([]floatRv, len(mks))
- for i, k := range mks {
- v := &mksv[i]
- v.r = k
- v.v = k.Float()
- }
- sort.Sort(floatRvSlice(mksv))
- for i := range mksv {
- if cr != nil {
- cr.sendContainerState(containerMapKey)
- }
- ee.EncodeFloat32(float32(mksv[i].v))
- if cr != nil {
- cr.sendContainerState(containerMapValue)
- }
- e.encodeValue(rv.MapIndex(mksv[i].r), valFn, true)
- }
- case reflect.Float64:
- mksv := make([]floatRv, len(mks))
- for i, k := range mks {
- v := &mksv[i]
- v.r = k
- v.v = k.Float()
- }
- sort.Sort(floatRvSlice(mksv))
- for i := range mksv {
- if cr != nil {
- cr.sendContainerState(containerMapKey)
- }
- ee.EncodeFloat64(mksv[i].v)
- if cr != nil {
- cr.sendContainerState(containerMapValue)
- }
- e.encodeValue(rv.MapIndex(mksv[i].r), valFn, true)
- }
- default:
- // out-of-band
- // first encode each key to a []byte first, then sort them, then record
- var mksv []byte = make([]byte, 0, len(mks)*16) // temporary byte slice for the encoding
- e2 := NewEncoderBytes(&mksv, e.hh)
- mksbv := make([]bytesRv, len(mks))
- for i, k := range mks {
- v := &mksbv[i]
- l := len(mksv)
- e2.MustEncode(k)
- v.r = k
- v.v = mksv[l:]
- }
- sort.Sort(bytesRvSlice(mksbv))
- for j := range mksbv {
- if cr != nil {
- cr.sendContainerState(containerMapKey)
- }
- e.asis(mksbv[j].v)
- if cr != nil {
- cr.sendContainerState(containerMapValue)
- }
- e.encodeValue(rv.MapIndex(mksbv[j].r), valFn, true)
- }
- }
- }
- // // --------------------------------------------------
// An Encoder writes an object to an output stream in the codec format.
//
// Create one with NewEncoder or NewEncoderBytes. It can be pointed at a new
// output with Reset or ResetBytes.
type Encoder struct {
	// hopefully, reduce derefencing cost by laying the encWriter inside the Encoder

	// e is the format-specific driver, obtained from the Handle in newEncoder.
	e encDriver
	// NOTE: Encoder shouldn't call it's write methods,
	// as the handler MAY need to do some coordination.
	//
	// w points at either wi or wb below, depending on whether the Encoder
	// was last reset with an io.Writer or with a byte slice.
	w  encWriter
	hh Handle
	// h is the result of hh.getBasicHandle(); the encode options are read through it.
	h *BasicHandle
	// ---- cpu cache line boundary?
	wi ioEncWriter
	wb bytesEncWriter
	// cr and as hold the driver viewed as containerStateRecv / encDriverAsis.
	// Each is nil when the driver does not implement that interface.
	cr containerStateRecv
	as encDriverAsis
	// ---- cpu cache line boundary?

	// NOTE(review): presumably the set used for circular reference checks — confirm.
	ci set
	// err is cleared by Reset and ResetBytes.
	err error
	// b is scratch space, e.g. used by kSlice when copying byte arrays.
	b  [scratchByteArrayLen]byte
	cf codecFner
}
- // NewEncoder returns an Encoder for encoding into an io.Writer.
- //
- // For efficiency, Users are encouraged to pass in a memory buffered writer
- // (eg bufio.Writer, bytes.Buffer).
- func NewEncoder(w io.Writer, h Handle) *Encoder {
- e := newEncoder(h)
- e.Reset(w)
- return e
- }
- // NewEncoderBytes returns an encoder for encoding directly and efficiently
- // into a byte slice, using zero-copying to temporary slices.
- //
- // It will potentially replace the output byte slice pointed to.
- // After encoding, the out parameter contains the encoded contents.
- func NewEncoderBytes(out *[]byte, h Handle) *Encoder {
- e := newEncoder(h)
- e.ResetBytes(out)
- return e
- }
- func newEncoder(h Handle) *Encoder {
- e := &Encoder{hh: h, h: h.getBasicHandle()}
- e.e = h.newEncDriver(e)
- e.as, _ = e.e.(encDriverAsis)
- e.cr, _ = e.e.(containerStateRecv)
- return e
- }
- // Reset the Encoder with a new output stream.
- //
- // This accommodates using the state of the Encoder,
- // where it has "cached" information about sub-engines.
- func (e *Encoder) Reset(w io.Writer) {
- ww, ok := w.(ioEncWriterWriter)
- if ok {
- e.wi.w = ww
- } else {
- sww := &e.wi.s
- sww.w = w
- sww.bw, _ = w.(io.ByteWriter)
- sww.sw, _ = w.(ioEncStringWriter)
- e.wi.w = sww
- //ww = bufio.NewWriterSize(w, defEncByteBufSize)
- }
- e.w = &e.wi
- e.e.reset()
- e.cf.reset(e.hh)
- e.err = nil
- }
- func (e *Encoder) ResetBytes(out *[]byte) {
- in := *out
- if in == nil {
- in = make([]byte, defEncByteBufSize)
- }
- e.wb.b, e.wb.out, e.wb.c = in, out, 0
- e.w = &e.wb
- e.e.reset()
- e.cf.reset(e.hh)
- e.err = nil
- }
- // Encode writes an object into a stream.
- //
- // Encoding can be configured via the struct tag for the fields.
- // The "codec" key in struct field's tag value is the key name,
- // followed by an optional comma and options.
- // Note that the "json" key is used in the absence of the "codec" key.
- //
- // To set an option on all fields (e.g. omitempty on all fields), you
- // can create a field called _struct, and set flags on it.
- //
- // Struct values "usually" encode as maps. Each exported struct field is encoded unless:
- // - the field's tag is "-", OR
- // - the field is empty (empty or the zero value) and its tag specifies the "omitempty" option.
- //
- // When encoding as a map, the first string in the tag (before the comma)
- // is the map key string to use when encoding.
- //
- // However, struct values may encode as arrays. This happens when:
- // - StructToArray Encode option is set, OR
- // - the tag on the _struct field sets the "toarray" option
- // Note that omitempty is ignored when encoding struct values as arrays,
- // as an entry must be encoded for each field, to maintain its position.
- //
- // Values with types that implement MapBySlice are encoded as stream maps.
- //
- // The empty values (for omitempty option) are false, 0, any nil pointer
- // or interface value, and any array, slice, map, or string of length zero.
- //
- // Anonymous fields are encoded inline except:
- // - the struct tag specifies a replacement name (first value)
- // - the field is of an interface type
- //
- // Examples:
- //
- // // NOTE: 'json:' can be used as struct tag key, in place 'codec:' below.
- // type MyStruct struct {
- // _struct bool `codec:",omitempty"` //set omitempty for every field
- // Field1 string `codec:"-"` //skip this field
- // Field2 int `codec:"myName"` //Use key "myName" in encode stream
- // Field3 int32 `codec:",omitempty"` //use key "Field3". Omit if empty.
- // Field4 bool `codec:"f4,omitempty"` //use key "f4". Omit if empty.
- // io.Reader //use key "Reader".
- // MyStruct `codec:"my1" //use key "my1".
- // MyStruct //inline it
- // ...
- // }
- //
- // type MyStruct struct {
- // _struct bool `codec:",toarray"` //encode struct as an array
- // }
- //
- // The mode of encoding is based on the type of the value. When a value is seen:
- // - If a Selfer, call its CodecEncodeSelf method
- // - If an extension is registered for it, call that extension function
- // - If it implements encoding.(Binary|Text|JSON)Marshaler, call its Marshal(Binary|Text|JSON) method
- // - Else encode it based on its reflect.Kind
- //
- // Note that struct field names and keys in map[string]XXX will be treated as symbols.
- // Some formats support symbols (e.g. binc) and will properly encode the string
- // only once in the stream, and use a tag to refer to it thereafter.
- func (e *Encoder) Encode(v interface{}) (err error) {
- defer panicToErrs2(&e.err, &err)
- e.MustEncode(v)
- return
- }
- // MustEncode is like Encode, but panics if unable to Encode.
- // This provides insight to the code location that triggered the error.
- func (e *Encoder) MustEncode(v interface{}) {
- if e.err != nil {
- panic(e.err)
- }
- e.encode(v)
- e.w.atEndOfEncode()
- }
- func (e *Encoder) encode(iv interface{}) {
- if iv == nil || definitelyNil(iv) {
- e.e.EncodeNil()
- return
- }
- if v, ok := iv.(Selfer); ok {
- v.CodecEncodeSelf(e)
- return
- }
- switch v := iv.(type) {
- // case nil:
- // e.e.EncodeNil()
- // case Selfer:
- // v.CodecEncodeSelf(e)
- case Raw:
- e.rawBytes(v)
- case reflect.Value:
- e.encodeValue(v, nil, true)
- case string:
- e.e.EncodeString(c_UTF8, v)
- case bool:
- e.e.EncodeBool(v)
- case int:
- e.e.EncodeInt(int64(v))
- case int8:
- e.e.EncodeInt(int64(v))
- case int16:
- e.e.EncodeInt(int64(v))
- case int32:
- e.e.EncodeInt(int64(v))
- case int64:
- e.e.EncodeInt(v)
- case uint:
- e.e.EncodeUint(uint64(v))
- case uint8:
- e.e.EncodeUint(uint64(v))
- case uint16:
- e.e.EncodeUint(uint64(v))
- case uint32:
- e.e.EncodeUint(uint64(v))
- case uint64:
- e.e.EncodeUint(v)
- case uintptr:
- e.e.EncodeUint(uint64(v))
- case float32:
- e.e.EncodeFloat32(v)
- case float64:
- e.e.EncodeFloat64(v)
- case []uint8:
- e.e.EncodeStringBytes(c_RAW, v)
- case *string:
- e.e.EncodeString(c_UTF8, *v)
- case *bool:
- e.e.EncodeBool(*v)
- case *int:
- e.e.EncodeInt(int64(*v))
- case *int8:
- e.e.EncodeInt(int64(*v))
- case *int16:
- e.e.EncodeInt(int64(*v))
- case *int32:
- e.e.EncodeInt(int64(*v))
- case *int64:
- e.e.EncodeInt(*v)
- case *uint:
- e.e.EncodeUint(uint64(*v))
- case *uint8:
- e.e.EncodeUint(uint64(*v))
- case *uint16:
- e.e.EncodeUint(uint64(*v))
- case *uint32:
- e.e.EncodeUint(uint64(*v))
- case *uint64:
- e.e.EncodeUint(*v)
- case *uintptr:
- e.e.EncodeUint(uint64(*v))
- case *float32:
- e.e.EncodeFloat32(*v)
- case *float64:
- e.e.EncodeFloat64(*v)
- case *[]uint8:
- e.e.EncodeStringBytes(c_RAW, *v)
- default:
- if !fastpathEncodeTypeSwitch(iv, e) {
- e.encodeValue(reflect.ValueOf(iv), nil, false)
- }
- }
- }
- func (e *Encoder) encodeValue(rv reflect.Value, fn *codecFn, checkFastpath bool) {
- // if a valid fn is passed, it MUST BE for the dereferenced type of rv
- var sptr uintptr
- TOP:
- switch rv.Kind() {
- case reflect.Ptr:
- if rv.IsNil() {
- e.e.EncodeNil()
- return
- }
- rv = rv.Elem()
- if e.h.CheckCircularRef && rv.Kind() == reflect.Struct {
- // TODO: Movable pointers will be an issue here. Future problem.
- sptr = rv.UnsafeAddr()
- break TOP
- }
- goto TOP
- case reflect.Interface:
- if rv.IsNil() {
- e.e.EncodeNil()
- return
- }
- rv = rv.Elem()
- goto TOP
- case reflect.Slice, reflect.Map:
- if rv.IsNil() {
- e.e.EncodeNil()
- return
- }
- case reflect.Invalid, reflect.Func:
- e.e.EncodeNil()
- return
- }
- if sptr != 0 && (&e.ci).add(sptr) {
- e.errorf("circular reference found: # %d", sptr)
- }
- if fn == nil {
- rt := rv.Type()
- // TODO: calling isRecognizedRtid here is a major slowdown
- if false && useLookupRecognizedTypes && isRecognizedRtidOrPtr(rt2id(rt)) {
- e.encode(rv2i(rv))
- return
- }
- // always pass checkCodecSelfer=true, in case T or ****T is passed, where *T is a Selfer
- fn = e.cf.get(rt, checkFastpath, true)
- }
- fn.fe(e, &fn.i, rv)
- if sptr != 0 {
- (&e.ci).remove(sptr)
- }
- }
- func (e *Encoder) marshal(bs []byte, fnerr error, asis bool, c charEncoding) {
- if fnerr != nil {
- panic(fnerr)
- }
- if bs == nil {
- e.e.EncodeNil()
- } else if asis {
- e.asis(bs)
- } else {
- e.e.EncodeStringBytes(c, bs)
- }
- }
- func (e *Encoder) asis(v []byte) {
- if e.as == nil {
- e.w.writeb(v)
- } else {
- e.as.EncodeAsis(v)
- }
- }
- func (e *Encoder) rawBytes(vv Raw) {
- v := []byte(vv)
- if !e.h.Raw {
- e.errorf("Raw values cannot be encoded: %v", v)
- }
- if e.as == nil {
- e.w.writeb(v)
- } else {
- e.as.EncodeAsis(v)
- }
- }
- func (e *Encoder) errorf(format string, params ...interface{}) {
- err := fmt.Errorf(format, params...)
- panic(err)
- }
|