message.go 4.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200
  1. package sarama
  2. import (
  3. "bytes"
  4. "compress/gzip"
  5. "fmt"
  6. "io/ioutil"
  7. "time"
  8. "github.com/eapache/go-xerial-snappy"
  9. "github.com/pierrec/lz4"
  10. )
  // CompressionCodec represents the various compression codecs recognized by
  // Kafka in messages. The numeric value of a codec is what gets stored in the
  // message attributes byte.
  type CompressionCodec int8

  // compressionCodecMask selects the codec from a message attributes byte:
  // only the two lowest bits are used for it.
  const compressionCodecMask int8 = 0x03

  const (
  	// CompressionNone (0) leaves the message value uncompressed.
  	CompressionNone CompressionCodec = iota
  	// CompressionGZIP (1) compresses the message value with gzip.
  	CompressionGZIP
  	// CompressionSnappy (2) compresses the message value with snappy.
  	CompressionSnappy
  	// CompressionLZ4 (3) compresses the message value with LZ4.
  	CompressionLZ4
  )
  21. type Message struct {
  22. Codec CompressionCodec // codec used to compress the message contents
  23. Key []byte // the message key, may be nil
  24. Value []byte // the message contents
  25. Set *MessageSet // the message set a message might wrap
  26. Version int8 // v1 requires Kafka 0.10
  27. Timestamp time.Time // the timestamp of the message (version 1+ only)
  28. compressedCache []byte
  29. compressedSize int // used for computing the compression ratio metrics
  30. }
  31. func (m *Message) encode(pe packetEncoder) error {
  32. pe.push(newCRC32Field(crcIEEE))
  33. pe.putInt8(m.Version)
  34. attributes := int8(m.Codec) & compressionCodecMask
  35. pe.putInt8(attributes)
  36. if m.Version >= 1 {
  37. if err := (Timestamp{&m.Timestamp}).encode(pe); err != nil {
  38. return err
  39. }
  40. }
  41. err := pe.putBytes(m.Key)
  42. if err != nil {
  43. return err
  44. }
  45. var payload []byte
  46. if m.compressedCache != nil {
  47. payload = m.compressedCache
  48. m.compressedCache = nil
  49. } else if m.Value != nil {
  50. switch m.Codec {
  51. case CompressionNone:
  52. payload = m.Value
  53. case CompressionGZIP:
  54. var buf bytes.Buffer
  55. writer := gzip.NewWriter(&buf)
  56. if _, err = writer.Write(m.Value); err != nil {
  57. return err
  58. }
  59. if err = writer.Close(); err != nil {
  60. return err
  61. }
  62. m.compressedCache = buf.Bytes()
  63. payload = m.compressedCache
  64. case CompressionSnappy:
  65. tmp := snappy.Encode(m.Value)
  66. m.compressedCache = tmp
  67. payload = m.compressedCache
  68. case CompressionLZ4:
  69. var buf bytes.Buffer
  70. writer := lz4.NewWriter(&buf)
  71. if _, err = writer.Write(m.Value); err != nil {
  72. return err
  73. }
  74. if err = writer.Close(); err != nil {
  75. return err
  76. }
  77. m.compressedCache = buf.Bytes()
  78. payload = m.compressedCache
  79. default:
  80. return PacketEncodingError{fmt.Sprintf("unsupported compression codec (%d)", m.Codec)}
  81. }
  82. // Keep in mind the compressed payload size for metric gathering
  83. m.compressedSize = len(payload)
  84. }
  85. if err = pe.putBytes(payload); err != nil {
  86. return err
  87. }
  88. return pe.pop()
  89. }
  90. func (m *Message) decode(pd packetDecoder) (err error) {
  91. err = pd.push(newCRC32Field(crcIEEE))
  92. if err != nil {
  93. return err
  94. }
  95. m.Version, err = pd.getInt8()
  96. if err != nil {
  97. return err
  98. }
  99. if m.Version > 1 {
  100. return PacketDecodingError{fmt.Sprintf("unknown magic byte (%v)", m.Version)}
  101. }
  102. attribute, err := pd.getInt8()
  103. if err != nil {
  104. return err
  105. }
  106. m.Codec = CompressionCodec(attribute & compressionCodecMask)
  107. if m.Version == 1 {
  108. if err := (Timestamp{&m.Timestamp}).decode(pd); err != nil {
  109. return err
  110. }
  111. }
  112. m.Key, err = pd.getBytes()
  113. if err != nil {
  114. return err
  115. }
  116. m.Value, err = pd.getBytes()
  117. if err != nil {
  118. return err
  119. }
  120. // Required for deep equal assertion during tests but might be useful
  121. // for future metrics about the compression ratio in fetch requests
  122. m.compressedSize = len(m.Value)
  123. switch m.Codec {
  124. case CompressionNone:
  125. // nothing to do
  126. case CompressionGZIP:
  127. if m.Value == nil {
  128. break
  129. }
  130. reader, err := gzip.NewReader(bytes.NewReader(m.Value))
  131. if err != nil {
  132. return err
  133. }
  134. if m.Value, err = ioutil.ReadAll(reader); err != nil {
  135. return err
  136. }
  137. if err := m.decodeSet(); err != nil {
  138. return err
  139. }
  140. case CompressionSnappy:
  141. if m.Value == nil {
  142. break
  143. }
  144. if m.Value, err = snappy.Decode(m.Value); err != nil {
  145. return err
  146. }
  147. if err := m.decodeSet(); err != nil {
  148. return err
  149. }
  150. case CompressionLZ4:
  151. if m.Value == nil {
  152. break
  153. }
  154. reader := lz4.NewReader(bytes.NewReader(m.Value))
  155. if m.Value, err = ioutil.ReadAll(reader); err != nil {
  156. return err
  157. }
  158. if err := m.decodeSet(); err != nil {
  159. return err
  160. }
  161. default:
  162. return PacketDecodingError{fmt.Sprintf("invalid compression specified (%d)", m.Codec)}
  163. }
  164. return pd.pop()
  165. }
  166. // decodes a message set from a previousy encoded bulk-message
  167. func (m *Message) decodeSet() (err error) {
  168. pd := realDecoder{raw: m.Value}
  169. m.Set = &MessageSet{}
  170. return m.Set.decode(&pd)
  171. }