decode.go 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687
  1. // Copyright 2019 The Go Authors. All rights reserved.
  2. // Use of this source code is governed by a BSD-style
  3. // license that can be found in the LICENSE file.
  4. package protojson
  5. import (
  6. "encoding/base64"
  7. "fmt"
  8. "math"
  9. "strconv"
  10. "strings"
  11. "google.golang.org/protobuf/internal/encoding/json"
  12. "google.golang.org/protobuf/internal/encoding/messageset"
  13. "google.golang.org/protobuf/internal/errors"
  14. "google.golang.org/protobuf/internal/flags"
  15. "google.golang.org/protobuf/internal/pragma"
  16. "google.golang.org/protobuf/internal/set"
  17. "google.golang.org/protobuf/proto"
  18. pref "google.golang.org/protobuf/reflect/protoreflect"
  19. "google.golang.org/protobuf/reflect/protoregistry"
  20. )
  21. // Unmarshal reads the given []byte into the given proto.Message.
  22. func Unmarshal(b []byte, m proto.Message) error {
  23. return UnmarshalOptions{}.Unmarshal(b, m)
  24. }
  25. // UnmarshalOptions is a configurable JSON format parser.
  26. type UnmarshalOptions struct {
  27. pragma.NoUnkeyedLiterals
  28. // If AllowPartial is set, input for messages that will result in missing
  29. // required fields will not return an error.
  30. AllowPartial bool
  31. // If DiscardUnknown is set, unknown fields are ignored.
  32. DiscardUnknown bool
  33. // Resolver is used for looking up types when unmarshaling
  34. // google.protobuf.Any messages or extension fields.
  35. // If nil, this defaults to using protoregistry.GlobalTypes.
  36. Resolver interface {
  37. protoregistry.MessageTypeResolver
  38. protoregistry.ExtensionTypeResolver
  39. }
  40. decoder *json.Decoder
  41. }
  42. // Unmarshal reads the given []byte and populates the given proto.Message using
  43. // options in UnmarshalOptions object. It will clear the message first before
  44. // setting the fields. If it returns an error, the given message may be
  45. // partially set.
  46. func (o UnmarshalOptions) Unmarshal(b []byte, m proto.Message) error {
  47. // TODO: Determine if we would like to have an option for merging or only
  48. // have merging behavior. We should at least be consistent with textproto
  49. // marshaling.
  50. proto.Reset(m)
  51. if o.Resolver == nil {
  52. o.Resolver = protoregistry.GlobalTypes
  53. }
  54. o.decoder = json.NewDecoder(b)
  55. if err := o.unmarshalMessage(m.ProtoReflect(), false); err != nil {
  56. return err
  57. }
  58. // Check for EOF.
  59. val, err := o.decoder.Read()
  60. if err != nil {
  61. return err
  62. }
  63. if val.Type() != json.EOF {
  64. return unexpectedJSONError{val}
  65. }
  66. if o.AllowPartial {
  67. return nil
  68. }
  69. return proto.IsInitialized(m)
  70. }
  71. // unexpectedJSONError is an error that contains the unexpected json.Value. This
  72. // is returned by methods to provide callers the read json.Value that it did not
  73. // expect.
  74. // TODO: Consider moving this to internal/encoding/json for consistency with
  75. // errors that package returns.
  76. type unexpectedJSONError struct {
  77. value json.Value
  78. }
  79. func (e unexpectedJSONError) Error() string {
  80. return newError("unexpected value %s", e.value).Error()
  81. }
  82. // newError returns an error object. If one of the values passed in is of
  83. // json.Value type, it produces an error with position info.
  84. func newError(f string, x ...interface{}) error {
  85. var hasValue bool
  86. var line, column int
  87. for i := 0; i < len(x); i++ {
  88. if val, ok := x[i].(json.Value); ok {
  89. line, column = val.Position()
  90. hasValue = true
  91. break
  92. }
  93. }
  94. e := errors.New(f, x...)
  95. if hasValue {
  96. return errors.New("(line %d:%d): %v", line, column, e)
  97. }
  98. return e
  99. }
  100. // unmarshalMessage unmarshals a message into the given protoreflect.Message.
  101. func (o UnmarshalOptions) unmarshalMessage(m pref.Message, skipTypeURL bool) error {
  102. if isCustomType(m.Descriptor().FullName()) {
  103. return o.unmarshalCustomType(m)
  104. }
  105. jval, err := o.decoder.Read()
  106. if err != nil {
  107. return err
  108. }
  109. if jval.Type() != json.StartObject {
  110. return unexpectedJSONError{jval}
  111. }
  112. if err := o.unmarshalFields(m, skipTypeURL); err != nil {
  113. return err
  114. }
  115. return nil
  116. }
  117. // unmarshalFields unmarshals the fields into the given protoreflect.Message.
  118. func (o UnmarshalOptions) unmarshalFields(m pref.Message, skipTypeURL bool) error {
  119. messageDesc := m.Descriptor()
  120. if !flags.ProtoLegacy && messageset.IsMessageSet(messageDesc) {
  121. return errors.New("no support for proto1 MessageSets")
  122. }
  123. var seenNums set.Ints
  124. var seenOneofs set.Ints
  125. fieldDescs := messageDesc.Fields()
  126. for {
  127. // Read field name.
  128. jval, err := o.decoder.Read()
  129. if err != nil {
  130. return err
  131. }
  132. switch jval.Type() {
  133. default:
  134. return unexpectedJSONError{jval}
  135. case json.EndObject:
  136. return nil
  137. case json.Name:
  138. // Continue below.
  139. }
  140. name, err := jval.Name()
  141. if err != nil {
  142. return err
  143. }
  144. // Unmarshaling a non-custom embedded message in Any will contain the
  145. // JSON field "@type" which should be skipped because it is not a field
  146. // of the embedded message, but simply an artifact of the Any format.
  147. if skipTypeURL && name == "@type" {
  148. o.decoder.Read()
  149. continue
  150. }
  151. // Get the FieldDescriptor.
  152. var fd pref.FieldDescriptor
  153. if strings.HasPrefix(name, "[") && strings.HasSuffix(name, "]") {
  154. // Only extension names are in [name] format.
  155. extName := pref.FullName(name[1 : len(name)-1])
  156. extType, err := o.findExtension(extName)
  157. if err != nil && err != protoregistry.NotFound {
  158. return errors.New("unable to resolve [%v]: %v", extName, err)
  159. }
  160. if extType != nil {
  161. fd = extType.TypeDescriptor()
  162. if !messageDesc.ExtensionRanges().Has(fd.Number()) || fd.ContainingMessage().FullName() != messageDesc.FullName() {
  163. return errors.New("message %v cannot be extended by %v", messageDesc.FullName(), fd.FullName())
  164. }
  165. }
  166. } else {
  167. // The name can either be the JSON name or the proto field name.
  168. fd = fieldDescs.ByJSONName(name)
  169. if fd == nil {
  170. fd = fieldDescs.ByName(pref.Name(name))
  171. }
  172. if fd != nil && fd.IsWeak() && fd.Message().IsPlaceholder() {
  173. fd = nil // reset since the weak reference is not linked in
  174. }
  175. }
  176. if fd == nil {
  177. // Field is unknown.
  178. if o.DiscardUnknown {
  179. if err := skipJSONValue(o.decoder); err != nil {
  180. return err
  181. }
  182. continue
  183. }
  184. return newError("%v contains unknown field %s", messageDesc.FullName(), jval)
  185. }
  186. // Do not allow duplicate fields.
  187. num := uint64(fd.Number())
  188. if seenNums.Has(num) {
  189. return newError("%v contains repeated field %s", messageDesc.FullName(), jval)
  190. }
  191. seenNums.Set(num)
  192. // No need to set values for JSON null unless the field type is
  193. // google.protobuf.Value or google.protobuf.NullValue.
  194. if o.decoder.Peek() == json.Null && !isKnownValue(fd) && !isNullValue(fd) {
  195. o.decoder.Read()
  196. continue
  197. }
  198. switch {
  199. case fd.IsList():
  200. list := m.Mutable(fd).List()
  201. if err := o.unmarshalList(list, fd); err != nil {
  202. return errors.New("%v|%q: %v", fd.FullName(), name, err)
  203. }
  204. case fd.IsMap():
  205. mmap := m.Mutable(fd).Map()
  206. if err := o.unmarshalMap(mmap, fd); err != nil {
  207. return errors.New("%v|%q: %v", fd.FullName(), name, err)
  208. }
  209. default:
  210. // If field is a oneof, check if it has already been set.
  211. if od := fd.ContainingOneof(); od != nil {
  212. idx := uint64(od.Index())
  213. if seenOneofs.Has(idx) {
  214. return errors.New("%v: oneof is already set", od.FullName())
  215. }
  216. seenOneofs.Set(idx)
  217. }
  218. // Required or optional fields.
  219. if err := o.unmarshalSingular(m, fd); err != nil {
  220. return errors.New("%v|%q: %v", fd.FullName(), name, err)
  221. }
  222. }
  223. }
  224. }
  225. // findExtension returns protoreflect.ExtensionType from the resolver if found.
  226. func (o UnmarshalOptions) findExtension(xtName pref.FullName) (pref.ExtensionType, error) {
  227. xt, err := o.Resolver.FindExtensionByName(xtName)
  228. if err == nil {
  229. return xt, nil
  230. }
  231. return messageset.FindMessageSetExtension(o.Resolver, xtName)
  232. }
  233. func isKnownValue(fd pref.FieldDescriptor) bool {
  234. md := fd.Message()
  235. return md != nil && md.FullName() == "google.protobuf.Value"
  236. }
  237. func isNullValue(fd pref.FieldDescriptor) bool {
  238. ed := fd.Enum()
  239. return ed != nil && ed.FullName() == "google.protobuf.NullValue"
  240. }
  241. // unmarshalSingular unmarshals to the non-repeated field specified by the given
  242. // FieldDescriptor.
  243. func (o UnmarshalOptions) unmarshalSingular(m pref.Message, fd pref.FieldDescriptor) error {
  244. var val pref.Value
  245. var err error
  246. switch fd.Kind() {
  247. case pref.MessageKind, pref.GroupKind:
  248. val = m.NewField(fd)
  249. err = o.unmarshalMessage(val.Message(), false)
  250. default:
  251. val, err = o.unmarshalScalar(fd)
  252. }
  253. if err != nil {
  254. return err
  255. }
  256. m.Set(fd, val)
  257. return nil
  258. }
  259. // unmarshalScalar unmarshals to a scalar/enum protoreflect.Value specified by
  260. // the given FieldDescriptor.
  261. func (o UnmarshalOptions) unmarshalScalar(fd pref.FieldDescriptor) (pref.Value, error) {
  262. const b32 int = 32
  263. const b64 int = 64
  264. jval, err := o.decoder.Read()
  265. if err != nil {
  266. return pref.Value{}, err
  267. }
  268. kind := fd.Kind()
  269. switch kind {
  270. case pref.BoolKind:
  271. return unmarshalBool(jval)
  272. case pref.Int32Kind, pref.Sint32Kind, pref.Sfixed32Kind:
  273. return unmarshalInt(jval, b32)
  274. case pref.Int64Kind, pref.Sint64Kind, pref.Sfixed64Kind:
  275. return unmarshalInt(jval, b64)
  276. case pref.Uint32Kind, pref.Fixed32Kind:
  277. return unmarshalUint(jval, b32)
  278. case pref.Uint64Kind, pref.Fixed64Kind:
  279. return unmarshalUint(jval, b64)
  280. case pref.FloatKind:
  281. return unmarshalFloat(jval, b32)
  282. case pref.DoubleKind:
  283. return unmarshalFloat(jval, b64)
  284. case pref.StringKind:
  285. pval, err := unmarshalString(jval)
  286. if err != nil {
  287. return pval, err
  288. }
  289. return pval, nil
  290. case pref.BytesKind:
  291. return unmarshalBytes(jval)
  292. case pref.EnumKind:
  293. return unmarshalEnum(jval, fd)
  294. }
  295. panic(fmt.Sprintf("invalid scalar kind %v", kind))
  296. }
  297. func unmarshalBool(jval json.Value) (pref.Value, error) {
  298. if jval.Type() != json.Bool {
  299. return pref.Value{}, unexpectedJSONError{jval}
  300. }
  301. b, err := jval.Bool()
  302. return pref.ValueOf(b), err
  303. }
  304. func unmarshalInt(jval json.Value, bitSize int) (pref.Value, error) {
  305. switch jval.Type() {
  306. case json.Number:
  307. return getInt(jval, bitSize)
  308. case json.String:
  309. // Decode number from string.
  310. s := strings.TrimSpace(jval.String())
  311. if len(s) != len(jval.String()) {
  312. return pref.Value{}, errors.New("invalid number %v", jval.Raw())
  313. }
  314. dec := json.NewDecoder([]byte(s))
  315. jval, err := dec.Read()
  316. if err != nil {
  317. return pref.Value{}, err
  318. }
  319. return getInt(jval, bitSize)
  320. }
  321. return pref.Value{}, unexpectedJSONError{jval}
  322. }
  323. func getInt(jval json.Value, bitSize int) (pref.Value, error) {
  324. n, err := jval.Int(bitSize)
  325. if err != nil {
  326. return pref.Value{}, err
  327. }
  328. if bitSize == 32 {
  329. return pref.ValueOf(int32(n)), nil
  330. }
  331. return pref.ValueOf(n), nil
  332. }
  333. func unmarshalUint(jval json.Value, bitSize int) (pref.Value, error) {
  334. switch jval.Type() {
  335. case json.Number:
  336. return getUint(jval, bitSize)
  337. case json.String:
  338. // Decode number from string.
  339. s := strings.TrimSpace(jval.String())
  340. if len(s) != len(jval.String()) {
  341. return pref.Value{}, errors.New("invalid number %v", jval.Raw())
  342. }
  343. dec := json.NewDecoder([]byte(s))
  344. jval, err := dec.Read()
  345. if err != nil {
  346. return pref.Value{}, err
  347. }
  348. return getUint(jval, bitSize)
  349. }
  350. return pref.Value{}, unexpectedJSONError{jval}
  351. }
  352. func getUint(jval json.Value, bitSize int) (pref.Value, error) {
  353. n, err := jval.Uint(bitSize)
  354. if err != nil {
  355. return pref.Value{}, err
  356. }
  357. if bitSize == 32 {
  358. return pref.ValueOf(uint32(n)), nil
  359. }
  360. return pref.ValueOf(n), nil
  361. }
  362. func unmarshalFloat(jval json.Value, bitSize int) (pref.Value, error) {
  363. switch jval.Type() {
  364. case json.Number:
  365. return getFloat(jval, bitSize)
  366. case json.String:
  367. s := jval.String()
  368. switch s {
  369. case "NaN":
  370. if bitSize == 32 {
  371. return pref.ValueOf(float32(math.NaN())), nil
  372. }
  373. return pref.ValueOf(math.NaN()), nil
  374. case "Infinity":
  375. if bitSize == 32 {
  376. return pref.ValueOf(float32(math.Inf(+1))), nil
  377. }
  378. return pref.ValueOf(math.Inf(+1)), nil
  379. case "-Infinity":
  380. if bitSize == 32 {
  381. return pref.ValueOf(float32(math.Inf(-1))), nil
  382. }
  383. return pref.ValueOf(math.Inf(-1)), nil
  384. }
  385. // Decode number from string.
  386. if len(s) != len(strings.TrimSpace(s)) {
  387. return pref.Value{}, errors.New("invalid number %v", jval.Raw())
  388. }
  389. dec := json.NewDecoder([]byte(s))
  390. jval, err := dec.Read()
  391. if err != nil {
  392. return pref.Value{}, err
  393. }
  394. return getFloat(jval, bitSize)
  395. }
  396. return pref.Value{}, unexpectedJSONError{jval}
  397. }
  398. func getFloat(jval json.Value, bitSize int) (pref.Value, error) {
  399. n, err := jval.Float(bitSize)
  400. if err != nil {
  401. return pref.Value{}, err
  402. }
  403. if bitSize == 32 {
  404. return pref.ValueOf(float32(n)), nil
  405. }
  406. return pref.ValueOf(n), nil
  407. }
  408. func unmarshalString(jval json.Value) (pref.Value, error) {
  409. if jval.Type() != json.String {
  410. return pref.Value{}, unexpectedJSONError{jval}
  411. }
  412. return pref.ValueOf(jval.String()), nil
  413. }
  414. func unmarshalBytes(jval json.Value) (pref.Value, error) {
  415. if jval.Type() != json.String {
  416. return pref.Value{}, unexpectedJSONError{jval}
  417. }
  418. s := jval.String()
  419. enc := base64.StdEncoding
  420. if strings.ContainsAny(s, "-_") {
  421. enc = base64.URLEncoding
  422. }
  423. if len(s)%4 != 0 {
  424. enc = enc.WithPadding(base64.NoPadding)
  425. }
  426. b, err := enc.DecodeString(s)
  427. if err != nil {
  428. return pref.Value{}, err
  429. }
  430. return pref.ValueOf(b), nil
  431. }
  432. func unmarshalEnum(jval json.Value, fd pref.FieldDescriptor) (pref.Value, error) {
  433. switch jval.Type() {
  434. case json.String:
  435. // Lookup EnumNumber based on name.
  436. s := jval.String()
  437. if enumVal := fd.Enum().Values().ByName(pref.Name(s)); enumVal != nil {
  438. return pref.ValueOf(enumVal.Number()), nil
  439. }
  440. return pref.Value{}, newError("invalid enum value %q", jval)
  441. case json.Number:
  442. n, err := jval.Int(32)
  443. if err != nil {
  444. return pref.Value{}, err
  445. }
  446. return pref.ValueOf(pref.EnumNumber(n)), nil
  447. case json.Null:
  448. // This is only valid for google.protobuf.NullValue.
  449. if isNullValue(fd) {
  450. return pref.ValueOf(pref.EnumNumber(0)), nil
  451. }
  452. }
  453. return pref.Value{}, unexpectedJSONError{jval}
  454. }
  455. func (o UnmarshalOptions) unmarshalList(list pref.List, fd pref.FieldDescriptor) error {
  456. jval, err := o.decoder.Read()
  457. if err != nil {
  458. return err
  459. }
  460. if jval.Type() != json.StartArray {
  461. return unexpectedJSONError{jval}
  462. }
  463. switch fd.Kind() {
  464. case pref.MessageKind, pref.GroupKind:
  465. for {
  466. val := list.NewElement()
  467. err := o.unmarshalMessage(val.Message(), false)
  468. if err != nil {
  469. if e, ok := err.(unexpectedJSONError); ok {
  470. if e.value.Type() == json.EndArray {
  471. // Done with list.
  472. return nil
  473. }
  474. }
  475. return err
  476. }
  477. list.Append(val)
  478. }
  479. default:
  480. for {
  481. val, err := o.unmarshalScalar(fd)
  482. if err != nil {
  483. if e, ok := err.(unexpectedJSONError); ok {
  484. if e.value.Type() == json.EndArray {
  485. // Done with list.
  486. return nil
  487. }
  488. }
  489. return err
  490. }
  491. list.Append(val)
  492. }
  493. }
  494. return nil
  495. }
  496. func (o UnmarshalOptions) unmarshalMap(mmap pref.Map, fd pref.FieldDescriptor) error {
  497. jval, err := o.decoder.Read()
  498. if err != nil {
  499. return err
  500. }
  501. if jval.Type() != json.StartObject {
  502. return unexpectedJSONError{jval}
  503. }
  504. // Determine ahead whether map entry is a scalar type or a message type in
  505. // order to call the appropriate unmarshalMapValue func inside the for loop
  506. // below.
  507. var unmarshalMapValue func() (pref.Value, error)
  508. switch fd.MapValue().Kind() {
  509. case pref.MessageKind, pref.GroupKind:
  510. unmarshalMapValue = func() (pref.Value, error) {
  511. val := mmap.NewValue()
  512. if err := o.unmarshalMessage(val.Message(), false); err != nil {
  513. return pref.Value{}, err
  514. }
  515. return val, nil
  516. }
  517. default:
  518. unmarshalMapValue = func() (pref.Value, error) {
  519. return o.unmarshalScalar(fd.MapValue())
  520. }
  521. }
  522. Loop:
  523. for {
  524. // Read field name.
  525. jval, err := o.decoder.Read()
  526. if err != nil {
  527. return err
  528. }
  529. switch jval.Type() {
  530. default:
  531. return unexpectedJSONError{jval}
  532. case json.EndObject:
  533. break Loop
  534. case json.Name:
  535. // Continue.
  536. }
  537. name, err := jval.Name()
  538. if err != nil {
  539. return err
  540. }
  541. // Unmarshal field name.
  542. pkey, err := unmarshalMapKey(name, fd.MapKey())
  543. if err != nil {
  544. return err
  545. }
  546. // Check for duplicate field name.
  547. if mmap.Has(pkey) {
  548. return newError("duplicate map key %q", jval)
  549. }
  550. // Read and unmarshal field value.
  551. pval, err := unmarshalMapValue()
  552. if err != nil {
  553. return err
  554. }
  555. mmap.Set(pkey, pval)
  556. }
  557. return nil
  558. }
  559. // unmarshalMapKey converts given string into a protoreflect.MapKey. A map key type is any
  560. // integral or string type.
  561. func unmarshalMapKey(name string, fd pref.FieldDescriptor) (pref.MapKey, error) {
  562. const b32 = 32
  563. const b64 = 64
  564. const base10 = 10
  565. kind := fd.Kind()
  566. switch kind {
  567. case pref.StringKind:
  568. return pref.ValueOf(name).MapKey(), nil
  569. case pref.BoolKind:
  570. switch name {
  571. case "true":
  572. return pref.ValueOf(true).MapKey(), nil
  573. case "false":
  574. return pref.ValueOf(false).MapKey(), nil
  575. }
  576. return pref.MapKey{}, errors.New("invalid value for boolean key %q", name)
  577. case pref.Int32Kind, pref.Sint32Kind, pref.Sfixed32Kind:
  578. n, err := strconv.ParseInt(name, base10, b32)
  579. if err != nil {
  580. return pref.MapKey{}, err
  581. }
  582. return pref.ValueOf(int32(n)).MapKey(), nil
  583. case pref.Int64Kind, pref.Sint64Kind, pref.Sfixed64Kind:
  584. n, err := strconv.ParseInt(name, base10, b64)
  585. if err != nil {
  586. return pref.MapKey{}, err
  587. }
  588. return pref.ValueOf(int64(n)).MapKey(), nil
  589. case pref.Uint32Kind, pref.Fixed32Kind:
  590. n, err := strconv.ParseUint(name, base10, b32)
  591. if err != nil {
  592. return pref.MapKey{}, err
  593. }
  594. return pref.ValueOf(uint32(n)).MapKey(), nil
  595. case pref.Uint64Kind, pref.Fixed64Kind:
  596. n, err := strconv.ParseUint(name, base10, b64)
  597. if err != nil {
  598. return pref.MapKey{}, err
  599. }
  600. return pref.ValueOf(uint64(n)).MapKey(), nil
  601. }
  602. panic(fmt.Sprintf("%s: invalid kind %s for map key", fd.FullName(), kind))
  603. }