message.go 3.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170
  1. package sarama
  2. import (
  3. "bytes"
  4. "compress/gzip"
  5. "fmt"
  6. "io/ioutil"
  7. "time"
  8. "github.com/eapache/go-xerial-snappy"
  9. )
  10. // CompressionCodec represents the various compression codecs recognized by Kafka in messages.
  11. type CompressionCodec int8
  12. // only the last two bits are really used
  13. const compressionCodecMask int8 = 0x03
  14. const (
  15. CompressionNone CompressionCodec = 0
  16. CompressionGZIP CompressionCodec = 1
  17. CompressionSnappy CompressionCodec = 2
  18. )
// Message is a single Kafka message as written by encode and read by decode.
// When Codec is not CompressionNone and Value is non-nil, decode decompresses
// Value and additionally parses it into Set.
type Message struct {
	Codec     CompressionCodec // codec used to compress the message contents
	Key       []byte           // the message key, may be nil
	Value     []byte           // the message contents
	Set       *MessageSet      // the message set a message might wrap
	Version   int8             // v1 requires Kafka 0.10
	Timestamp time.Time        // the timestamp of the message (version 1+ only)

	// compressedCache holds the compressed payload produced by one encode
	// call; the next encode call reuses it and then resets it to nil.
	compressedCache []byte
	compressedSize  int // used for computing the compression ratio metrics
}
  29. func (m *Message) encode(pe packetEncoder) error {
  30. pe.push(&crc32Field{})
  31. pe.putInt8(m.Version)
  32. attributes := int8(m.Codec) & compressionCodecMask
  33. pe.putInt8(attributes)
  34. if m.Version >= 1 {
  35. pe.putInt64(m.Timestamp.UnixNano() / int64(time.Millisecond))
  36. }
  37. err := pe.putBytes(m.Key)
  38. if err != nil {
  39. return err
  40. }
  41. var payload []byte
  42. if m.compressedCache != nil {
  43. payload = m.compressedCache
  44. m.compressedCache = nil
  45. } else if m.Value != nil {
  46. switch m.Codec {
  47. case CompressionNone:
  48. payload = m.Value
  49. case CompressionGZIP:
  50. var buf bytes.Buffer
  51. writer := gzip.NewWriter(&buf)
  52. if _, err = writer.Write(m.Value); err != nil {
  53. return err
  54. }
  55. if err = writer.Close(); err != nil {
  56. return err
  57. }
  58. m.compressedCache = buf.Bytes()
  59. payload = m.compressedCache
  60. case CompressionSnappy:
  61. tmp := snappy.Encode(m.Value)
  62. m.compressedCache = tmp
  63. payload = m.compressedCache
  64. default:
  65. return PacketEncodingError{fmt.Sprintf("unsupported compression codec (%d)", m.Codec)}
  66. }
  67. // Keep in mind the compressed payload size for metric gathering
  68. m.compressedSize = len(payload)
  69. }
  70. if err = pe.putBytes(payload); err != nil {
  71. return err
  72. }
  73. return pe.pop()
  74. }
  75. func (m *Message) decode(pd packetDecoder) (err error) {
  76. err = pd.push(&crc32Field{})
  77. if err != nil {
  78. return err
  79. }
  80. m.Version, err = pd.getInt8()
  81. if err != nil {
  82. return err
  83. }
  84. attribute, err := pd.getInt8()
  85. if err != nil {
  86. return err
  87. }
  88. m.Codec = CompressionCodec(attribute & compressionCodecMask)
  89. if m.Version >= 1 {
  90. millis, err := pd.getInt64()
  91. if err != nil {
  92. return err
  93. }
  94. m.Timestamp = time.Unix(millis/1000, (millis%1000)*int64(time.Millisecond))
  95. }
  96. m.Key, err = pd.getBytes()
  97. if err != nil {
  98. return err
  99. }
  100. m.Value, err = pd.getBytes()
  101. if err != nil {
  102. return err
  103. }
  104. // Required for deep equal assertion during tests but might be useful
  105. // for future metrics about the compression ratio in fetch requests
  106. m.compressedSize = len(m.Value)
  107. switch m.Codec {
  108. case CompressionNone:
  109. // nothing to do
  110. case CompressionGZIP:
  111. if m.Value == nil {
  112. break
  113. }
  114. reader, err := gzip.NewReader(bytes.NewReader(m.Value))
  115. if err != nil {
  116. return err
  117. }
  118. if m.Value, err = ioutil.ReadAll(reader); err != nil {
  119. return err
  120. }
  121. if err := m.decodeSet(); err != nil {
  122. return err
  123. }
  124. case CompressionSnappy:
  125. if m.Value == nil {
  126. break
  127. }
  128. if m.Value, err = snappy.Decode(m.Value); err != nil {
  129. return err
  130. }
  131. if err := m.decodeSet(); err != nil {
  132. return err
  133. }
  134. default:
  135. return PacketDecodingError{fmt.Sprintf("invalid compression specified (%d)", m.Codec)}
  136. }
  137. return pd.pop()
  138. }
  139. // decodes a message set from a previousy encoded bulk-message
  140. func (m *Message) decodeSet() (err error) {
  141. pd := realDecoder{raw: m.Value}
  142. m.Set = &MessageSet{}
  143. return m.Set.decode(&pd)
  144. }