text_parser.go 20 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853
  // Copyright 2010 The Go Authors. All rights reserved.
  // Use of this source code is governed by a BSD-style
  // license that can be found in the LICENSE file.
  4. package proto
  // Functions for parsing the Text protocol buffer format.
  // TODO: message sets.
  7. import (
  8. "encoding"
  9. "errors"
  10. "fmt"
  11. "reflect"
  12. "strconv"
  13. "strings"
  14. "unicode/utf8"
  15. )
  // anyRepeatedlyUnpacked is the format string of the error emitted while
  // deserializing an expanded Any when one of its fields is already set.
  // The single %q verb receives the name of the field that was already set.
  const anyRepeatedlyUnpacked = "Any message unpacked multiple times, or %q already set"
  // ParseError describes a failure encountered while parsing text-format
  // input, together with the position at which it was detected.
  type ParseError struct {
  	Message string
  	Line    int // 1-based line number
  	Offset  int // 0-based byte offset from start of input
  }

  // Error implements the error interface.
  //
  // Offset is counted from the start of the whole input rather than from the
  // start of a line, so it is only included for errors on the first line,
  // where the two coincide.
  func (p *ParseError) Error() string {
  	if p.Line == 1 {
  		// show offset only for first line
  		return fmt.Sprintf("line 1.%d: %v", p.Offset, p.Message)
  	}
  	return fmt.Sprintf("line %d: %v", p.Line, p.Message)
  }
  30. type token struct {
  31. value string
  32. err *ParseError
  33. line int // line number
  34. offset int // byte number from start of input, not start of line
  35. unquoted string // the unquoted version of value, if it was a quoted string
  36. }
  37. func (t *token) String() string {
  38. if t.err == nil {
  39. return fmt.Sprintf("%q (line=%d, offset=%d)", t.value, t.line, t.offset)
  40. }
  41. return fmt.Sprintf("parse error: %v", t.err)
  42. }
  43. type textParser struct {
  44. s string // remaining input
  45. done bool // whether the parsing is finished (success or error)
  46. backed bool // whether back() was called
  47. offset, line int
  48. cur token
  49. }
  50. func newTextParser(s string) *textParser {
  51. p := new(textParser)
  52. p.s = s
  53. p.line = 1
  54. p.cur.line = 1
  55. return p
  56. }
  57. func (p *textParser) errorf(format string, a ...interface{}) *ParseError {
  58. pe := &ParseError{fmt.Sprintf(format, a...), p.cur.line, p.cur.offset}
  59. p.cur.err = pe
  60. p.done = true
  61. return pe
  62. }
  // isIdentOrNumberChar reports whether c may appear in an identifier or a
  // number. Both are matched by the character class [-+._A-Za-z0-9].
  func isIdentOrNumberChar(c byte) bool {
  	switch {
  	case 'A' <= c && c <= 'Z', 'a' <= c && c <= 'z':
  		return true
  	case '0' <= c && c <= '9':
  		return true
  	case c == '-', c == '+', c == '.', c == '_':
  		return true
  	}
  	return false
  }
  // isWhitespace reports whether c is a space, tab, newline or carriage return.
  func isWhitespace(c byte) bool {
  	return c == ' ' || c == '\t' || c == '\n' || c == '\r'
  }
  // isQuote reports whether c is a double or single quote character.
  func isQuote(c byte) bool {
  	return c == '"' || c == '\''
  }
  91. func (p *textParser) skipWhitespace() {
  92. i := 0
  93. for i < len(p.s) && (isWhitespace(p.s[i]) || p.s[i] == '#') {
  94. if p.s[i] == '#' {
  95. // comment; skip to end of line or input
  96. for i < len(p.s) && p.s[i] != '\n' {
  97. i++
  98. }
  99. if i == len(p.s) {
  100. break
  101. }
  102. }
  103. if p.s[i] == '\n' {
  104. p.line++
  105. }
  106. i++
  107. }
  108. p.offset += i
  109. p.s = p.s[i:len(p.s)]
  110. if len(p.s) == 0 {
  111. p.done = true
  112. }
  113. }
  114. func (p *textParser) advance() {
  115. // Skip whitespace
  116. p.skipWhitespace()
  117. if p.done {
  118. return
  119. }
  120. // Start of non-whitespace
  121. p.cur.err = nil
  122. p.cur.offset, p.cur.line = p.offset, p.line
  123. p.cur.unquoted = ""
  124. switch p.s[0] {
  125. case '<', '>', '{', '}', ':', '[', ']', ';', ',', '/':
  126. // Single symbol
  127. p.cur.value, p.s = p.s[0:1], p.s[1:len(p.s)]
  128. case '"', '\'':
  129. // Quoted string
  130. i := 1
  131. for i < len(p.s) && p.s[i] != p.s[0] && p.s[i] != '\n' {
  132. if p.s[i] == '\\' && i+1 < len(p.s) {
  133. // skip escaped char
  134. i++
  135. }
  136. i++
  137. }
  138. if i >= len(p.s) || p.s[i] != p.s[0] {
  139. p.errorf("unmatched quote")
  140. return
  141. }
  142. unq, err := unquoteC(p.s[1:i], rune(p.s[0]))
  143. if err != nil {
  144. p.errorf("invalid quoted string %s: %v", p.s[0:i+1], err)
  145. return
  146. }
  147. p.cur.value, p.s = p.s[0:i+1], p.s[i+1:len(p.s)]
  148. p.cur.unquoted = unq
  149. default:
  150. i := 0
  151. for i < len(p.s) && isIdentOrNumberChar(p.s[i]) {
  152. i++
  153. }
  154. if i == 0 {
  155. p.errorf("unexpected byte %#x", p.s[0])
  156. return
  157. }
  158. p.cur.value, p.s = p.s[0:i], p.s[i:len(p.s)]
  159. }
  160. p.offset += len(p.cur.value)
  161. }
  var (
  	// errBadUTF8 is returned when a quoted string contains a byte sequence
  	// that is not valid UTF-8.
  	errBadUTF8 = errors.New("proto: bad UTF-8")
  )
  165. func unquoteC(s string, quote rune) (string, error) {
  166. // This is based on C++'s tokenizer.cc.
  167. // Despite its name, this is *not* parsing C syntax.
  168. // For instance, "\0" is an invalid quoted string.
  169. // Avoid allocation in trivial cases.
  170. simple := true
  171. for _, r := range s {
  172. if r == '\\' || r == quote {
  173. simple = false
  174. break
  175. }
  176. }
  177. if simple {
  178. return s, nil
  179. }
  180. buf := make([]byte, 0, 3*len(s)/2)
  181. for len(s) > 0 {
  182. r, n := utf8.DecodeRuneInString(s)
  183. if r == utf8.RuneError && n == 1 {
  184. return "", errBadUTF8
  185. }
  186. s = s[n:]
  187. if r != '\\' {
  188. if r < utf8.RuneSelf {
  189. buf = append(buf, byte(r))
  190. } else {
  191. buf = append(buf, string(r)...)
  192. }
  193. continue
  194. }
  195. ch, tail, err := unescape(s)
  196. if err != nil {
  197. return "", err
  198. }
  199. buf = append(buf, ch...)
  200. s = tail
  201. }
  202. return string(buf), nil
  203. }
  204. func unescape(s string) (ch string, tail string, err error) {
  205. r, n := utf8.DecodeRuneInString(s)
  206. if r == utf8.RuneError && n == 1 {
  207. return "", "", errBadUTF8
  208. }
  209. s = s[n:]
  210. switch r {
  211. case 'a':
  212. return "\a", s, nil
  213. case 'b':
  214. return "\b", s, nil
  215. case 'f':
  216. return "\f", s, nil
  217. case 'n':
  218. return "\n", s, nil
  219. case 'r':
  220. return "\r", s, nil
  221. case 't':
  222. return "\t", s, nil
  223. case 'v':
  224. return "\v", s, nil
  225. case '?':
  226. return "?", s, nil // trigraph workaround
  227. case '\'', '"', '\\':
  228. return string(r), s, nil
  229. case '0', '1', '2', '3', '4', '5', '6', '7':
  230. if len(s) < 2 {
  231. return "", "", fmt.Errorf(`\%c requires 2 following digits`, r)
  232. }
  233. ss := string(r) + s[:2]
  234. s = s[2:]
  235. i, err := strconv.ParseUint(ss, 8, 8)
  236. if err != nil {
  237. return "", "", fmt.Errorf(`\%s contains non-octal digits`, ss)
  238. }
  239. return string([]byte{byte(i)}), s, nil
  240. case 'x', 'X', 'u', 'U':
  241. var n int
  242. switch r {
  243. case 'x', 'X':
  244. n = 2
  245. case 'u':
  246. n = 4
  247. case 'U':
  248. n = 8
  249. }
  250. if len(s) < n {
  251. return "", "", fmt.Errorf(`\%c requires %d following digits`, r, n)
  252. }
  253. ss := s[:n]
  254. s = s[n:]
  255. i, err := strconv.ParseUint(ss, 16, 64)
  256. if err != nil {
  257. return "", "", fmt.Errorf(`\%c%s contains non-hexadecimal digits`, r, ss)
  258. }
  259. if r == 'x' || r == 'X' {
  260. return string([]byte{byte(i)}), s, nil
  261. }
  262. if i > utf8.MaxRune {
  263. return "", "", fmt.Errorf(`\%c%s is not a valid Unicode code point`, r, ss)
  264. }
  265. return string(i), s, nil
  266. }
  267. return "", "", fmt.Errorf(`unknown escape \%c`, r)
  268. }
  269. // Back off the parser by one token. Can only be done between calls to next().
  270. // It makes the next advance() a no-op.
  271. func (p *textParser) back() { p.backed = true }
  272. // Advances the parser and returns the new current token.
  273. func (p *textParser) next() *token {
  274. if p.backed || p.done {
  275. p.backed = false
  276. return &p.cur
  277. }
  278. p.advance()
  279. if p.done {
  280. p.cur.value = ""
  281. } else if len(p.cur.value) > 0 && isQuote(p.cur.value[0]) {
  282. // Look for multiple quoted strings separated by whitespace,
  283. // and concatenate them.
  284. cat := p.cur
  285. for {
  286. p.skipWhitespace()
  287. if p.done || !isQuote(p.s[0]) {
  288. break
  289. }
  290. p.advance()
  291. if p.cur.err != nil {
  292. return &p.cur
  293. }
  294. cat.value += " " + p.cur.value
  295. cat.unquoted += p.cur.unquoted
  296. }
  297. p.done = false // parser may have seen EOF, but we want to return cat
  298. p.cur = cat
  299. }
  300. return &p.cur
  301. }
  302. func (p *textParser) consumeToken(s string) error {
  303. tok := p.next()
  304. if tok.err != nil {
  305. return tok.err
  306. }
  307. if tok.value != s {
  308. p.back()
  309. return p.errorf("expected %q, found %q", s, tok.value)
  310. }
  311. return nil
  312. }
  313. // Return a RequiredNotSetError indicating which required field was not set.
  314. func (p *textParser) missingRequiredFieldError(sv reflect.Value) *RequiredNotSetError {
  315. st := sv.Type()
  316. sprops := GetProperties(st)
  317. for i := 0; i < st.NumField(); i++ {
  318. if !isNil(sv.Field(i)) {
  319. continue
  320. }
  321. props := sprops.Prop[i]
  322. if props.Required {
  323. return &RequiredNotSetError{fmt.Sprintf("%v.%v", st, props.OrigName)}
  324. }
  325. }
  326. return &RequiredNotSetError{fmt.Sprintf("%v.<unknown field name>", st)} // should not happen
  327. }
  328. // Returns the index in the struct for the named field, as well as the parsed tag properties.
  329. func structFieldByName(sprops *StructProperties, name string) (int, *Properties, bool) {
  330. i, ok := sprops.decoderOrigNames[name]
  331. if ok {
  332. return i, sprops.Prop[i], true
  333. }
  334. return -1, nil, false
  335. }
  336. // Consume a ':' from the input stream (if the next token is a colon),
  337. // returning an error if a colon is needed but not present.
  338. func (p *textParser) checkForColon(props *Properties, typ reflect.Type) *ParseError {
  339. tok := p.next()
  340. if tok.err != nil {
  341. return tok.err
  342. }
  343. if tok.value != ":" {
  344. // Colon is optional when the field is a group or message.
  345. needColon := true
  346. switch props.Wire {
  347. case "group":
  348. needColon = false
  349. case "bytes":
  350. // A "bytes" field is either a message, a string, or a repeated field;
  351. // those three become *T, *string and []T respectively, so we can check for
  352. // this field being a pointer to a non-string.
  353. if typ.Kind() == reflect.Ptr {
  354. // *T or *string
  355. if typ.Elem().Kind() == reflect.String {
  356. break
  357. }
  358. } else if typ.Kind() == reflect.Slice {
  359. // []T or []*T
  360. if typ.Elem().Kind() != reflect.Ptr {
  361. break
  362. }
  363. } else if typ.Kind() == reflect.String {
  364. // The proto3 exception is for a string field,
  365. // which requires a colon.
  366. break
  367. }
  368. needColon = false
  369. }
  370. if needColon {
  371. return p.errorf("expected ':', found %q", tok.value)
  372. }
  373. p.back()
  374. }
  375. return nil
  376. }
  377. func (p *textParser) readStruct(sv reflect.Value, terminator string) error {
  378. st := sv.Type()
  379. sprops := GetProperties(st)
  380. reqCount := sprops.reqCount
  381. var reqFieldErr error
  382. fieldSet := make(map[string]bool)
  383. // A struct is a sequence of "name: value", terminated by one of
  384. // '>' or '}', or the end of the input. A name may also be
  385. // "[extension]" or "[type/url]".
  386. //
  387. // The whole struct can also be an expanded Any message, like:
  388. // [type/url] < ... struct contents ... >
  389. for {
  390. tok := p.next()
  391. if tok.err != nil {
  392. return tok.err
  393. }
  394. if tok.value == terminator {
  395. break
  396. }
  397. if tok.value == "[" {
  398. // Looks like an extension or an Any.
  399. //
  400. // TODO: Check whether we need to handle
  401. // namespace rooted names (e.g. ".something.Foo").
  402. extName, err := p.consumeExtName()
  403. if err != nil {
  404. return err
  405. }
  406. if s := strings.LastIndex(extName, "/"); s >= 0 {
  407. // If it contains a slash, it's an Any type URL.
  408. messageName := extName[s+1:]
  409. mt := MessageType(messageName)
  410. if mt == nil {
  411. return p.errorf("unrecognized message %q in google.protobuf.Any", messageName)
  412. }
  413. tok = p.next()
  414. if tok.err != nil {
  415. return tok.err
  416. }
  417. // consume an optional colon
  418. if tok.value == ":" {
  419. tok = p.next()
  420. if tok.err != nil {
  421. return tok.err
  422. }
  423. }
  424. var terminator string
  425. switch tok.value {
  426. case "<":
  427. terminator = ">"
  428. case "{":
  429. terminator = "}"
  430. default:
  431. return p.errorf("expected '{' or '<', found %q", tok.value)
  432. }
  433. v := reflect.New(mt.Elem())
  434. if pe := p.readStruct(v.Elem(), terminator); pe != nil {
  435. return pe
  436. }
  437. b, err := Marshal(v.Interface().(Message))
  438. if err != nil {
  439. return p.errorf("failed to marshal message of type %q: %v", messageName, err)
  440. }
  441. if fieldSet["type_url"] {
  442. return p.errorf(anyRepeatedlyUnpacked, "type_url")
  443. }
  444. if fieldSet["value"] {
  445. return p.errorf(anyRepeatedlyUnpacked, "value")
  446. }
  447. sv.FieldByName("TypeUrl").SetString(extName)
  448. sv.FieldByName("Value").SetBytes(b)
  449. fieldSet["type_url"] = true
  450. fieldSet["value"] = true
  451. continue
  452. }
  453. var desc *ExtensionDesc
  454. // This could be faster, but it's functional.
  455. // TODO: Do something smarter than a linear scan.
  456. for _, d := range RegisteredExtensions(reflect.New(st).Interface().(Message)) {
  457. if d.Name == extName {
  458. desc = d
  459. break
  460. }
  461. }
  462. if desc == nil {
  463. return p.errorf("unrecognized extension %q", extName)
  464. }
  465. props := &Properties{}
  466. props.Parse(desc.Tag)
  467. typ := reflect.TypeOf(desc.ExtensionType)
  468. if err := p.checkForColon(props, typ); err != nil {
  469. return err
  470. }
  471. rep := desc.repeated()
  472. // Read the extension structure, and set it in
  473. // the value we're constructing.
  474. var ext reflect.Value
  475. if !rep {
  476. ext = reflect.New(typ).Elem()
  477. } else {
  478. ext = reflect.New(typ.Elem()).Elem()
  479. }
  480. if err := p.readAny(ext, props); err != nil {
  481. if _, ok := err.(*RequiredNotSetError); !ok {
  482. return err
  483. }
  484. reqFieldErr = err
  485. }
  486. ep := sv.Addr().Interface().(Message)
  487. if !rep {
  488. SetExtension(ep, desc, ext.Interface())
  489. } else {
  490. old, err := GetExtension(ep, desc)
  491. var sl reflect.Value
  492. if err == nil {
  493. sl = reflect.ValueOf(old) // existing slice
  494. } else {
  495. sl = reflect.MakeSlice(typ, 0, 1)
  496. }
  497. sl = reflect.Append(sl, ext)
  498. SetExtension(ep, desc, sl.Interface())
  499. }
  500. if err := p.consumeOptionalSeparator(); err != nil {
  501. return err
  502. }
  503. continue
  504. }
  505. // This is a normal, non-extension field.
  506. name := tok.value
  507. var dst reflect.Value
  508. fi, props, ok := structFieldByName(sprops, name)
  509. if ok {
  510. dst = sv.Field(fi)
  511. } else if oop, ok := sprops.OneofTypes[name]; ok {
  512. // It is a oneof.
  513. props = oop.Prop
  514. nv := reflect.New(oop.Type.Elem())
  515. dst = nv.Elem().Field(0)
  516. field := sv.Field(oop.Field)
  517. if !field.IsNil() {
  518. return p.errorf("field '%s' would overwrite already parsed oneof '%s'", name, sv.Type().Field(oop.Field).Name)
  519. }
  520. field.Set(nv)
  521. }
  522. if !dst.IsValid() {
  523. return p.errorf("unknown field name %q in %v", name, st)
  524. }
  525. if dst.Kind() == reflect.Map {
  526. // Consume any colon.
  527. if err := p.checkForColon(props, dst.Type()); err != nil {
  528. return err
  529. }
  530. // Construct the map if it doesn't already exist.
  531. if dst.IsNil() {
  532. dst.Set(reflect.MakeMap(dst.Type()))
  533. }
  534. key := reflect.New(dst.Type().Key()).Elem()
  535. val := reflect.New(dst.Type().Elem()).Elem()
  536. // The map entry should be this sequence of tokens:
  537. // < key : KEY value : VALUE >
  538. // However, implementations may omit key or value, and technically
  539. // we should support them in any order. See b/28924776 for a time
  540. // this went wrong.
  541. tok := p.next()
  542. var terminator string
  543. switch tok.value {
  544. case "<":
  545. terminator = ">"
  546. case "{":
  547. terminator = "}"
  548. default:
  549. return p.errorf("expected '{' or '<', found %q", tok.value)
  550. }
  551. for {
  552. tok := p.next()
  553. if tok.err != nil {
  554. return tok.err
  555. }
  556. if tok.value == terminator {
  557. break
  558. }
  559. switch tok.value {
  560. case "key":
  561. if err := p.consumeToken(":"); err != nil {
  562. return err
  563. }
  564. if err := p.readAny(key, props.MapKeyProp); err != nil {
  565. return err
  566. }
  567. if err := p.consumeOptionalSeparator(); err != nil {
  568. return err
  569. }
  570. case "value":
  571. if err := p.checkForColon(props.MapValProp, dst.Type().Elem()); err != nil {
  572. return err
  573. }
  574. if err := p.readAny(val, props.MapValProp); err != nil {
  575. return err
  576. }
  577. if err := p.consumeOptionalSeparator(); err != nil {
  578. return err
  579. }
  580. default:
  581. p.back()
  582. return p.errorf(`expected "key", "value", or %q, found %q`, terminator, tok.value)
  583. }
  584. }
  585. dst.SetMapIndex(key, val)
  586. continue
  587. }
  588. // Check that it's not already set if it's not a repeated field.
  589. if !props.Repeated && fieldSet[name] {
  590. return p.errorf("non-repeated field %q was repeated", name)
  591. }
  592. if err := p.checkForColon(props, dst.Type()); err != nil {
  593. return err
  594. }
  595. // Parse into the field.
  596. fieldSet[name] = true
  597. if err := p.readAny(dst, props); err != nil {
  598. if _, ok := err.(*RequiredNotSetError); !ok {
  599. return err
  600. }
  601. reqFieldErr = err
  602. }
  603. if props.Required {
  604. reqCount--
  605. }
  606. if err := p.consumeOptionalSeparator(); err != nil {
  607. return err
  608. }
  609. }
  610. if reqCount > 0 {
  611. return p.missingRequiredFieldError(sv)
  612. }
  613. return reqFieldErr
  614. }
  615. // consumeExtName consumes extension name or expanded Any type URL and the
  616. // following ']'. It returns the name or URL consumed.
  617. func (p *textParser) consumeExtName() (string, error) {
  618. tok := p.next()
  619. if tok.err != nil {
  620. return "", tok.err
  621. }
  622. // If extension name or type url is quoted, it's a single token.
  623. if len(tok.value) > 2 && isQuote(tok.value[0]) && tok.value[len(tok.value)-1] == tok.value[0] {
  624. name, err := unquoteC(tok.value[1:len(tok.value)-1], rune(tok.value[0]))
  625. if err != nil {
  626. return "", err
  627. }
  628. return name, p.consumeToken("]")
  629. }
  630. // Consume everything up to "]"
  631. var parts []string
  632. for tok.value != "]" {
  633. parts = append(parts, tok.value)
  634. tok = p.next()
  635. if tok.err != nil {
  636. return "", p.errorf("unrecognized type_url or extension name: %s", tok.err)
  637. }
  638. if p.done && tok.value != "]" {
  639. return "", p.errorf("unclosed type_url or extension name")
  640. }
  641. }
  642. return strings.Join(parts, ""), nil
  643. }
  644. // consumeOptionalSeparator consumes an optional semicolon or comma.
  645. // It is used in readStruct to provide backward compatibility.
  646. func (p *textParser) consumeOptionalSeparator() error {
  647. tok := p.next()
  648. if tok.err != nil {
  649. return tok.err
  650. }
  651. if tok.value != ";" && tok.value != "," {
  652. p.back()
  653. }
  654. return nil
  655. }
  656. func (p *textParser) readAny(v reflect.Value, props *Properties) error {
  657. tok := p.next()
  658. if tok.err != nil {
  659. return tok.err
  660. }
  661. if tok.value == "" {
  662. return p.errorf("unexpected EOF")
  663. }
  664. switch fv := v; fv.Kind() {
  665. case reflect.Slice:
  666. at := v.Type()
  667. if at.Elem().Kind() == reflect.Uint8 {
  668. // Special case for []byte
  669. if tok.value[0] != '"' && tok.value[0] != '\'' {
  670. // Deliberately written out here, as the error after
  671. // this switch statement would write "invalid []byte: ...",
  672. // which is not as user-friendly.
  673. return p.errorf("invalid string: %v", tok.value)
  674. }
  675. bytes := []byte(tok.unquoted)
  676. fv.Set(reflect.ValueOf(bytes))
  677. return nil
  678. }
  679. // Repeated field.
  680. if tok.value == "[" {
  681. // Repeated field with list notation, like [1,2,3].
  682. for {
  683. fv.Set(reflect.Append(fv, reflect.New(at.Elem()).Elem()))
  684. err := p.readAny(fv.Index(fv.Len()-1), props)
  685. if err != nil {
  686. return err
  687. }
  688. tok := p.next()
  689. if tok.err != nil {
  690. return tok.err
  691. }
  692. if tok.value == "]" {
  693. break
  694. }
  695. if tok.value != "," {
  696. return p.errorf("Expected ']' or ',' found %q", tok.value)
  697. }
  698. }
  699. return nil
  700. }
  701. // One value of the repeated field.
  702. p.back()
  703. fv.Set(reflect.Append(fv, reflect.New(at.Elem()).Elem()))
  704. return p.readAny(fv.Index(fv.Len()-1), props)
  705. case reflect.Bool:
  706. // true/1/t/True or false/f/0/False.
  707. switch tok.value {
  708. case "true", "1", "t", "True":
  709. fv.SetBool(true)
  710. return nil
  711. case "false", "0", "f", "False":
  712. fv.SetBool(false)
  713. return nil
  714. }
  715. case reflect.Float32, reflect.Float64:
  716. v := tok.value
  717. // Ignore 'f' for compatibility with output generated by C++, but don't
  718. // remove 'f' when the value is "-inf" or "inf".
  719. if strings.HasSuffix(v, "f") && tok.value != "-inf" && tok.value != "inf" {
  720. v = v[:len(v)-1]
  721. }
  722. if f, err := strconv.ParseFloat(v, fv.Type().Bits()); err == nil {
  723. fv.SetFloat(f)
  724. return nil
  725. }
  726. case reflect.Int32:
  727. if x, err := strconv.ParseInt(tok.value, 0, 32); err == nil {
  728. fv.SetInt(x)
  729. return nil
  730. }
  731. if len(props.Enum) == 0 {
  732. break
  733. }
  734. m, ok := enumValueMaps[props.Enum]
  735. if !ok {
  736. break
  737. }
  738. x, ok := m[tok.value]
  739. if !ok {
  740. break
  741. }
  742. fv.SetInt(int64(x))
  743. return nil
  744. case reflect.Int64:
  745. if x, err := strconv.ParseInt(tok.value, 0, 64); err == nil {
  746. fv.SetInt(x)
  747. return nil
  748. }
  749. case reflect.Ptr:
  750. // A basic field (indirected through pointer), or a repeated message/group
  751. p.back()
  752. fv.Set(reflect.New(fv.Type().Elem()))
  753. return p.readAny(fv.Elem(), props)
  754. case reflect.String:
  755. if tok.value[0] == '"' || tok.value[0] == '\'' {
  756. fv.SetString(tok.unquoted)
  757. return nil
  758. }
  759. case reflect.Struct:
  760. var terminator string
  761. switch tok.value {
  762. case "{":
  763. terminator = "}"
  764. case "<":
  765. terminator = ">"
  766. default:
  767. return p.errorf("expected '{' or '<', found %q", tok.value)
  768. }
  769. // TODO: Handle nested messages which implement encoding.TextUnmarshaler.
  770. return p.readStruct(fv, terminator)
  771. case reflect.Uint32:
  772. if x, err := strconv.ParseUint(tok.value, 0, 32); err == nil {
  773. fv.SetUint(uint64(x))
  774. return nil
  775. }
  776. case reflect.Uint64:
  777. if x, err := strconv.ParseUint(tok.value, 0, 64); err == nil {
  778. fv.SetUint(x)
  779. return nil
  780. }
  781. }
  782. return p.errorf("invalid %v: %v", v.Type(), tok.value)
  783. }
  784. // UnmarshalText reads a protocol buffer in Text format. UnmarshalText resets pb
  785. // before starting to unmarshal, so any existing data in pb is always removed.
  786. // If a required field is not set and no other error occurs,
  787. // UnmarshalText returns *RequiredNotSetError.
  788. func UnmarshalText(s string, pb Message) error {
  789. if um, ok := pb.(encoding.TextUnmarshaler); ok {
  790. return um.UnmarshalText([]byte(s))
  791. }
  792. pb.Reset()
  793. v := reflect.ValueOf(pb)
  794. return newTextParser(s).readStruct(v.Elem(), "")
  795. }