cbor.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566
  1. // Copyright (c) 2012-2015 Ugorji Nwoke. All rights reserved.
  2. // Use of this source code is governed by a MIT license found in the LICENSE file.
  3. package codec
  4. import "math"
  // CBOR major types. The major type is the value held in the top three
  // bits of an item's initial byte (this file extracts it with bd >> 5).
  const (
  	cborMajorUint   byte = 0 // unsigned integer
  	cborMajorNegInt byte = 1 // negative integer
  	cborMajorBytes  byte = 2 // byte string
  	cborMajorText   byte = 3 // text string
  	cborMajorArray  byte = 4 // array
  	cborMajorMap    byte = 5 // map
  	cborMajorTag    byte = 6 // tag
  	cborMajorOther  byte = 7 // everything else (simple values, floats, break)
  )
  // Single-byte descriptors for the simple values and float markers that
  // this codec recognizes. The values are consecutive, 0xf4 through 0xfb.
  const (
  	cborBdFalse     byte = 0xf4
  	cborBdTrue      byte = 0xf5
  	cborBdNil       byte = 0xf6
  	cborBdUndefined byte = 0xf7
  	cborBdExt       byte = 0xf8
  	cborBdFloat16   byte = 0xf9 // followed by 2 bytes
  	cborBdFloat32   byte = 0xfa // followed by 4 bytes
  	cborBdFloat64   byte = 0xfb // followed by 8 bytes
  )
  // Descriptors for indefinite-length items. Each is a major type shifted
  // into the top three bits, combined with the low five bits all set (0x1f).
  // Only the first constant is typed; the rest are untyped integer constants.
  const (
  	cborBdIndefiniteBytes  byte = 2<<5 | 0x1f // 0x5f
  	cborBdIndefiniteString      = 3<<5 | 0x1f // 0x7f
  	cborBdIndefiniteArray       = 4<<5 | 0x1f // 0x9f
  	cborBdIndefiniteMap         = 5<<5 | 0x1f // 0xbf
  	cborBdBreak                 = 7<<5 | 0x1f // 0xff, ends an indefinite-length item
  )
  // CborStreamXXX are the descriptor bytes that open an indefinite-length
  // (streamed) byte string, text string, array or map, plus the break byte
  // that closes one. Callers write them directly to the output around
  // Encode calls. Only CborStreamBytes is typed; the others are untyped
  // integer constants.
  const (
  	CborStreamBytes  byte = 2<<5 | 0x1f // 0x5f
  	CborStreamString      = 3<<5 | 0x1f // 0x7f
  	CborStreamArray       = 4<<5 | 0x1f // 0x9f
  	CborStreamMap         = 5<<5 | 0x1f // 0xbf
  	CborStreamBreak       = 7<<5 | 0x1f // 0xff
  )
  // Base descriptor of each major type: the major type number shifted into
  // the top three bits with the low five bits zero. Only cborBaseUint is
  // typed; the rest are untyped integer constants.
  const (
  	cborBaseUint   byte = 0 << 5 // 0x00
  	cborBaseNegInt      = 1 << 5 // 0x20
  	cborBaseBytes       = 2 << 5 // 0x40
  	cborBaseString      = 3 << 5 // 0x60
  	cborBaseArray       = 4 << 5 // 0x80
  	cborBaseMap         = 5 << 5 // 0xa0
  	cborBaseTag         = 6 << 5 // 0xc0
  	cborBaseSimple      = 7 << 5 // 0xe0
  )
  49. // -------------------
  50. type cborEncDriver struct {
  51. e *Encoder
  52. w encWriter
  53. h *CborHandle
  54. noBuiltInTypes
  55. encNoSeparator
  56. x [8]byte
  57. }
  58. func (e *cborEncDriver) EncodeNil() {
  59. e.w.writen1(cborBdNil)
  60. }
  61. func (e *cborEncDriver) EncodeBool(b bool) {
  62. if b {
  63. e.w.writen1(cborBdTrue)
  64. } else {
  65. e.w.writen1(cborBdFalse)
  66. }
  67. }
  68. func (e *cborEncDriver) EncodeFloat32(f float32) {
  69. e.w.writen1(cborBdFloat32)
  70. bigenHelper{e.x[:4], e.w}.writeUint32(math.Float32bits(f))
  71. }
  72. func (e *cborEncDriver) EncodeFloat64(f float64) {
  73. e.w.writen1(cborBdFloat64)
  74. bigenHelper{e.x[:8], e.w}.writeUint64(math.Float64bits(f))
  75. }
  76. func (e *cborEncDriver) encUint(v uint64, bd byte) {
  77. if v <= 0x17 {
  78. e.w.writen1(byte(v) + bd)
  79. } else if v <= math.MaxUint8 {
  80. e.w.writen2(bd+0x18, uint8(v))
  81. } else if v <= math.MaxUint16 {
  82. e.w.writen1(bd + 0x19)
  83. bigenHelper{e.x[:2], e.w}.writeUint16(uint16(v))
  84. } else if v <= math.MaxUint32 {
  85. e.w.writen1(bd + 0x1a)
  86. bigenHelper{e.x[:4], e.w}.writeUint32(uint32(v))
  87. } else { // if v <= math.MaxUint64 {
  88. e.w.writen1(bd + 0x1b)
  89. bigenHelper{e.x[:8], e.w}.writeUint64(v)
  90. }
  91. }
  92. func (e *cborEncDriver) EncodeInt(v int64) {
  93. if v < 0 {
  94. e.encUint(uint64(-1-v), cborBaseNegInt)
  95. } else {
  96. e.encUint(uint64(v), cborBaseUint)
  97. }
  98. }
  99. func (e *cborEncDriver) EncodeUint(v uint64) {
  100. e.encUint(v, cborBaseUint)
  101. }
  102. func (e *cborEncDriver) encLen(bd byte, length int) {
  103. e.encUint(uint64(length), bd)
  104. }
  105. func (e *cborEncDriver) EncodeExt(rv interface{}, xtag uint64, ext Ext, en *Encoder) {
  106. e.encUint(uint64(xtag), cborBaseTag)
  107. if v := ext.ConvertExt(rv); v == nil {
  108. e.EncodeNil()
  109. } else {
  110. en.encode(v)
  111. }
  112. }
  113. func (e *cborEncDriver) EncodeRawExt(re *RawExt, en *Encoder) {
  114. e.encUint(uint64(re.Tag), cborBaseTag)
  115. if re.Data != nil {
  116. en.encode(re.Data)
  117. } else if re.Value == nil {
  118. e.EncodeNil()
  119. } else {
  120. en.encode(re.Value)
  121. }
  122. }
  123. func (e *cborEncDriver) EncodeArrayStart(length int) {
  124. e.encLen(cborBaseArray, length)
  125. }
  126. func (e *cborEncDriver) EncodeMapStart(length int) {
  127. e.encLen(cborBaseMap, length)
  128. }
  129. func (e *cborEncDriver) EncodeString(c charEncoding, v string) {
  130. e.encLen(cborBaseString, len(v))
  131. e.w.writestr(v)
  132. }
  133. func (e *cborEncDriver) EncodeSymbol(v string) {
  134. e.EncodeString(c_UTF8, v)
  135. }
  136. func (e *cborEncDriver) EncodeStringBytes(c charEncoding, v []byte) {
  137. e.encLen(cborBaseBytes, len(v))
  138. e.w.writeb(v)
  139. }
  140. // ----------------------
  141. type cborDecDriver struct {
  142. d *Decoder
  143. h *CborHandle
  144. r decReader
  145. br bool // bytes reader
  146. bdRead bool
  147. bdType valueType
  148. bd byte
  149. b [scratchByteArrayLen]byte
  150. noBuiltInTypes
  151. decNoSeparator
  152. }
  153. func (d *cborDecDriver) readNextBd() {
  154. d.bd = d.r.readn1()
  155. d.bdRead = true
  156. d.bdType = valueTypeUnset
  157. }
  158. func (d *cborDecDriver) IsContainerType(vt valueType) (bv bool) {
  159. switch vt {
  160. case valueTypeNil:
  161. return d.bd == cborBdNil
  162. case valueTypeBytes:
  163. return d.bd == cborBdIndefiniteBytes || (d.bd >= cborBaseBytes && d.bd < cborBaseString)
  164. case valueTypeString:
  165. return d.bd == cborBdIndefiniteString || (d.bd >= cborBaseString && d.bd < cborBaseArray)
  166. case valueTypeArray:
  167. return d.bd == cborBdIndefiniteArray || (d.bd >= cborBaseArray && d.bd < cborBaseMap)
  168. case valueTypeMap:
  169. return d.bd == cborBdIndefiniteMap || (d.bd >= cborBaseMap && d.bd < cborBaseTag)
  170. }
  171. d.d.errorf("isContainerType: unsupported parameter: %v", vt)
  172. return // "unreachable"
  173. }
  174. func (d *cborDecDriver) TryDecodeAsNil() bool {
  175. if !d.bdRead {
  176. d.readNextBd()
  177. }
  178. // treat Nil and Undefined as nil values
  179. if d.bd == cborBdNil || d.bd == cborBdUndefined {
  180. d.bdRead = false
  181. return true
  182. }
  183. return false
  184. }
  185. func (d *cborDecDriver) CheckBreak() bool {
  186. if !d.bdRead {
  187. d.readNextBd()
  188. }
  189. if d.bd == cborBdBreak {
  190. d.bdRead = false
  191. return true
  192. }
  193. return false
  194. }
  195. func (d *cborDecDriver) decUint() (ui uint64) {
  196. v := d.bd & 0x1f
  197. if v <= 0x17 {
  198. ui = uint64(v)
  199. } else {
  200. if v == 0x18 {
  201. ui = uint64(d.r.readn1())
  202. } else if v == 0x19 {
  203. ui = uint64(bigen.Uint16(d.r.readx(2)))
  204. } else if v == 0x1a {
  205. ui = uint64(bigen.Uint32(d.r.readx(4)))
  206. } else if v == 0x1b {
  207. ui = uint64(bigen.Uint64(d.r.readx(8)))
  208. } else {
  209. d.d.errorf("decUint: Invalid descriptor: %v", d.bd)
  210. return
  211. }
  212. }
  213. return
  214. }
  215. func (d *cborDecDriver) decCheckInteger() (neg bool) {
  216. if !d.bdRead {
  217. d.readNextBd()
  218. }
  219. major := d.bd >> 5
  220. if major == cborMajorUint {
  221. } else if major == cborMajorNegInt {
  222. neg = true
  223. } else {
  224. d.d.errorf("invalid major: %v (bd: %v)", major, d.bd)
  225. return
  226. }
  227. return
  228. }
  229. func (d *cborDecDriver) DecodeInt(bitsize uint8) (i int64) {
  230. neg := d.decCheckInteger()
  231. ui := d.decUint()
  232. // check if this number can be converted to an int without overflow
  233. var overflow bool
  234. if neg {
  235. if i, overflow = chkOvf.SignedInt(ui + 1); overflow {
  236. d.d.errorf("cbor: overflow converting %v to signed integer", ui+1)
  237. return
  238. }
  239. i = -i
  240. } else {
  241. if i, overflow = chkOvf.SignedInt(ui); overflow {
  242. d.d.errorf("cbor: overflow converting %v to signed integer", ui)
  243. return
  244. }
  245. }
  246. if chkOvf.Int(i, bitsize) {
  247. d.d.errorf("cbor: overflow integer: %v", i)
  248. return
  249. }
  250. d.bdRead = false
  251. return
  252. }
  253. func (d *cborDecDriver) DecodeUint(bitsize uint8) (ui uint64) {
  254. if d.decCheckInteger() {
  255. d.d.errorf("Assigning negative signed value to unsigned type")
  256. return
  257. }
  258. ui = d.decUint()
  259. if chkOvf.Uint(ui, bitsize) {
  260. d.d.errorf("cbor: overflow integer: %v", ui)
  261. return
  262. }
  263. d.bdRead = false
  264. return
  265. }
  266. func (d *cborDecDriver) DecodeFloat(chkOverflow32 bool) (f float64) {
  267. if !d.bdRead {
  268. d.readNextBd()
  269. }
  270. if bd := d.bd; bd == cborBdFloat16 {
  271. f = float64(math.Float32frombits(halfFloatToFloatBits(bigen.Uint16(d.r.readx(2)))))
  272. } else if bd == cborBdFloat32 {
  273. f = float64(math.Float32frombits(bigen.Uint32(d.r.readx(4))))
  274. } else if bd == cborBdFloat64 {
  275. f = math.Float64frombits(bigen.Uint64(d.r.readx(8)))
  276. } else if bd >= cborBaseUint && bd < cborBaseBytes {
  277. f = float64(d.DecodeInt(64))
  278. } else {
  279. d.d.errorf("Float only valid from float16/32/64: Invalid descriptor: %v", bd)
  280. return
  281. }
  282. if chkOverflow32 && chkOvf.Float32(f) {
  283. d.d.errorf("cbor: float32 overflow: %v", f)
  284. return
  285. }
  286. d.bdRead = false
  287. return
  288. }
  289. // bool can be decoded from bool only (single byte).
  290. func (d *cborDecDriver) DecodeBool() (b bool) {
  291. if !d.bdRead {
  292. d.readNextBd()
  293. }
  294. if bd := d.bd; bd == cborBdTrue {
  295. b = true
  296. } else if bd == cborBdFalse {
  297. } else {
  298. d.d.errorf("Invalid single-byte value for bool: %s: %x", msgBadDesc, d.bd)
  299. return
  300. }
  301. d.bdRead = false
  302. return
  303. }
  304. func (d *cborDecDriver) ReadMapStart() (length int) {
  305. d.bdRead = false
  306. if d.bd == cborBdIndefiniteMap {
  307. return -1
  308. }
  309. return d.decLen()
  310. }
  311. func (d *cborDecDriver) ReadArrayStart() (length int) {
  312. d.bdRead = false
  313. if d.bd == cborBdIndefiniteArray {
  314. return -1
  315. }
  316. return d.decLen()
  317. }
  318. func (d *cborDecDriver) decLen() int {
  319. return int(d.decUint())
  320. }
  321. func (d *cborDecDriver) decAppendIndefiniteBytes(bs []byte) []byte {
  322. d.bdRead = false
  323. for {
  324. if d.CheckBreak() {
  325. break
  326. }
  327. if major := d.bd >> 5; major != cborMajorBytes && major != cborMajorText {
  328. d.d.errorf("cbor: expect bytes or string major type in indefinite string/bytes; got: %v, byte: %v", major, d.bd)
  329. return nil
  330. }
  331. n := d.decLen()
  332. oldLen := len(bs)
  333. newLen := oldLen + n
  334. if newLen > cap(bs) {
  335. bs2 := make([]byte, newLen, 2*cap(bs)+n)
  336. copy(bs2, bs)
  337. bs = bs2
  338. } else {
  339. bs = bs[:newLen]
  340. }
  341. d.r.readb(bs[oldLen:newLen])
  342. // bs = append(bs, d.r.readn()...)
  343. d.bdRead = false
  344. }
  345. d.bdRead = false
  346. return bs
  347. }
  348. func (d *cborDecDriver) DecodeBytes(bs []byte, isstring, zerocopy bool) (bsOut []byte) {
  349. if !d.bdRead {
  350. d.readNextBd()
  351. }
  352. if d.bd == cborBdNil || d.bd == cborBdUndefined {
  353. d.bdRead = false
  354. return nil
  355. }
  356. if d.bd == cborBdIndefiniteBytes || d.bd == cborBdIndefiniteString {
  357. if bs == nil {
  358. return d.decAppendIndefiniteBytes(nil)
  359. }
  360. return d.decAppendIndefiniteBytes(bs[:0])
  361. }
  362. clen := d.decLen()
  363. d.bdRead = false
  364. if zerocopy {
  365. if d.br {
  366. return d.r.readx(clen)
  367. } else if len(bs) == 0 {
  368. bs = d.b[:]
  369. }
  370. }
  371. return decByteSlice(d.r, clen, bs)
  372. }
  373. func (d *cborDecDriver) DecodeString() (s string) {
  374. return string(d.DecodeBytes(d.b[:], true, true))
  375. }
  376. func (d *cborDecDriver) DecodeExt(rv interface{}, xtag uint64, ext Ext) (realxtag uint64) {
  377. if !d.bdRead {
  378. d.readNextBd()
  379. }
  380. u := d.decUint()
  381. d.bdRead = false
  382. realxtag = u
  383. if ext == nil {
  384. re := rv.(*RawExt)
  385. re.Tag = realxtag
  386. d.d.decode(&re.Value)
  387. } else if xtag != realxtag {
  388. d.d.errorf("Wrong extension tag. Got %b. Expecting: %v", realxtag, xtag)
  389. return
  390. } else {
  391. var v interface{}
  392. d.d.decode(&v)
  393. ext.UpdateExt(rv, v)
  394. }
  395. d.bdRead = false
  396. return
  397. }
  398. func (d *cborDecDriver) DecodeNaked() (v interface{}, vt valueType, decodeFurther bool) {
  399. if !d.bdRead {
  400. d.readNextBd()
  401. }
  402. switch d.bd {
  403. case cborBdNil:
  404. vt = valueTypeNil
  405. case cborBdFalse:
  406. vt = valueTypeBool
  407. v = false
  408. case cborBdTrue:
  409. vt = valueTypeBool
  410. v = true
  411. case cborBdFloat16, cborBdFloat32:
  412. vt = valueTypeFloat
  413. v = d.DecodeFloat(true)
  414. case cborBdFloat64:
  415. vt = valueTypeFloat
  416. v = d.DecodeFloat(false)
  417. case cborBdIndefiniteBytes:
  418. vt = valueTypeBytes
  419. v = d.DecodeBytes(nil, false, false)
  420. case cborBdIndefiniteString:
  421. vt = valueTypeString
  422. v = d.DecodeString()
  423. case cborBdIndefiniteArray:
  424. vt = valueTypeArray
  425. decodeFurther = true
  426. case cborBdIndefiniteMap:
  427. vt = valueTypeMap
  428. decodeFurther = true
  429. default:
  430. switch {
  431. case d.bd >= cborBaseUint && d.bd < cborBaseNegInt:
  432. if d.h.SignedInteger {
  433. vt = valueTypeInt
  434. v = d.DecodeInt(64)
  435. } else {
  436. vt = valueTypeUint
  437. v = d.DecodeUint(64)
  438. }
  439. case d.bd >= cborBaseNegInt && d.bd < cborBaseBytes:
  440. vt = valueTypeInt
  441. v = d.DecodeInt(64)
  442. case d.bd >= cborBaseBytes && d.bd < cborBaseString:
  443. vt = valueTypeBytes
  444. v = d.DecodeBytes(nil, false, false)
  445. case d.bd >= cborBaseString && d.bd < cborBaseArray:
  446. vt = valueTypeString
  447. v = d.DecodeString()
  448. case d.bd >= cborBaseArray && d.bd < cborBaseMap:
  449. vt = valueTypeArray
  450. decodeFurther = true
  451. case d.bd >= cborBaseMap && d.bd < cborBaseTag:
  452. vt = valueTypeMap
  453. decodeFurther = true
  454. case d.bd >= cborBaseTag && d.bd < cborBaseSimple:
  455. vt = valueTypeExt
  456. var re RawExt
  457. ui := d.decUint()
  458. d.bdRead = false
  459. re.Tag = ui
  460. d.d.decode(&re.Value)
  461. v = &re
  462. // decodeFurther = true
  463. default:
  464. d.d.errorf("decodeNaked: Unrecognized d.bd: 0x%x", d.bd)
  465. return
  466. }
  467. }
  468. if !decodeFurther {
  469. d.bdRead = false
  470. }
  471. return
  472. }
  473. // -------------------------
  474. // CborHandle is a Handle for the CBOR encoding format,
  475. // defined at http://tools.ietf.org/html/rfc7049 and documented further at http://cbor.io .
  476. //
  477. // CBOR is comprehensively supported, including support for:
  478. // - indefinite-length arrays/maps/bytes/strings
  479. // - (extension) tags in range 0..0xffff (0 .. 65535)
  480. // - half, single and double-precision floats
  481. // - all numbers (1, 2, 4 and 8-byte signed and unsigned integers)
  482. // - nil, true, false, ...
  483. // - arrays and maps, bytes and text strings
  484. //
  485. // None of the optional extensions (with tags) defined in the spec are supported out-of-the-box.
  486. // Users can implement them as needed (using SetExt), including spec-documented ones:
  487. // - timestamp, BigNum, BigFloat, Decimals, Encoded Text (e.g. URL, regexp, base64, MIME Message), etc.
  488. //
  489. // To encode with indefinite lengths (streaming), users will use
  490. // (Must)Encode methods of *Encoder, along with writing CborStreamXXX constants.
  491. //
  492. // For example, to encode "one-byte" as an indefinite length string:
  493. // var buf bytes.Buffer
  494. // e := NewEncoder(&buf, new(CborHandle))
  495. // buf.WriteByte(CborStreamString)
  496. // e.MustEncode("one-")
  497. // e.MustEncode("byte")
  498. // buf.WriteByte(CborStreamBreak)
  499. // encodedBytes := buf.Bytes()
  500. // var vv interface{}
  501. // NewDecoderBytes(buf.Bytes(), new(CborHandle)).MustDecode(&vv)
  502. // // Now, vv contains the same string "one-byte"
  503. //
  504. type CborHandle struct {
  505. BasicHandle
  506. binaryEncodingType
  507. }
  508. func (h *CborHandle) newEncDriver(e *Encoder) encDriver {
  509. return &cborEncDriver{e: e, w: e.w, h: h}
  510. }
  511. func (h *CborHandle) newDecDriver(d *Decoder) decDriver {
  512. return &cborDecDriver{d: d, r: d.r, h: h, br: d.bytes}
  513. }
  514. var _ decDriver = (*cborDecDriver)(nil)
  515. var _ encDriver = (*cborEncDriver)(nil)