message.go 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216
  1. package sarama
  2. import (
  3. "bytes"
  4. "compress/gzip"
  5. "fmt"
  6. "io/ioutil"
  7. "time"
  8. "github.com/eapache/go-xerial-snappy"
  9. "github.com/pierrec/lz4"
  10. )
  11. // CompressionCodec represents the various compression codecs recognized by Kafka in messages.
  12. type CompressionCodec int8
  13. // only the last two bits are really used
  14. const compressionCodecMask int8 = 0x03
  15. const (
  16. CompressionNone CompressionCodec = 0
  17. CompressionGZIP CompressionCodec = 1
  18. CompressionSnappy CompressionCodec = 2
  19. CompressionLZ4 CompressionCodec = 3
  20. )
  21. type Message struct {
  22. Codec CompressionCodec // codec used to compress the message contents
  23. Key []byte // the message key, may be nil
  24. Value []byte // the message contents
  25. Set *MessageSet // the message set a message might wrap
  26. Version int8 // v1 requires Kafka 0.10
  27. Timestamp time.Time // the timestamp of the message (version 1+ only)
  28. compressedCache []byte
  29. compressedSize int // used for computing the compression ratio metrics
  30. }
  31. func (m *Message) encode(pe packetEncoder) error {
  32. pe.push(&crc32Field{})
  33. pe.putInt8(m.Version)
  34. attributes := int8(m.Codec) & compressionCodecMask
  35. pe.putInt8(attributes)
  36. if m.Version >= 1 {
  37. timestamp := int64(-1)
  38. if !m.Timestamp.Before(time.Unix(0, 0)) {
  39. timestamp = m.Timestamp.UnixNano() / int64(time.Millisecond)
  40. } else if !m.Timestamp.IsZero() {
  41. return PacketEncodingError{fmt.Sprintf("invalid timestamp (%v)", m.Timestamp)}
  42. }
  43. pe.putInt64(timestamp)
  44. }
  45. err := pe.putBytes(m.Key)
  46. if err != nil {
  47. return err
  48. }
  49. var payload []byte
  50. if m.compressedCache != nil {
  51. payload = m.compressedCache
  52. m.compressedCache = nil
  53. } else if m.Value != nil {
  54. switch m.Codec {
  55. case CompressionNone:
  56. payload = m.Value
  57. case CompressionGZIP:
  58. var buf bytes.Buffer
  59. writer := gzip.NewWriter(&buf)
  60. if _, err = writer.Write(m.Value); err != nil {
  61. return err
  62. }
  63. if err = writer.Close(); err != nil {
  64. return err
  65. }
  66. m.compressedCache = buf.Bytes()
  67. payload = m.compressedCache
  68. case CompressionSnappy:
  69. tmp := snappy.Encode(m.Value)
  70. m.compressedCache = tmp
  71. payload = m.compressedCache
  72. case CompressionLZ4:
  73. var buf bytes.Buffer
  74. writer := lz4.NewWriter(&buf)
  75. if _, err = writer.Write(m.Value); err != nil {
  76. return err
  77. }
  78. if err = writer.Close(); err != nil {
  79. return err
  80. }
  81. m.compressedCache = buf.Bytes()
  82. payload = m.compressedCache
  83. default:
  84. return PacketEncodingError{fmt.Sprintf("unsupported compression codec (%d)", m.Codec)}
  85. }
  86. // Keep in mind the compressed payload size for metric gathering
  87. m.compressedSize = len(payload)
  88. }
  89. if err = pe.putBytes(payload); err != nil {
  90. return err
  91. }
  92. return pe.pop()
  93. }
  94. func (m *Message) decode(pd packetDecoder) (err error) {
  95. err = pd.push(&crc32Field{})
  96. if err != nil {
  97. return err
  98. }
  99. m.Version, err = pd.getInt8()
  100. if err != nil {
  101. return err
  102. }
  103. if m.Version > 1 {
  104. return PacketDecodingError{fmt.Sprintf("unknown magic byte (%v)", m.Version)}
  105. }
  106. attribute, err := pd.getInt8()
  107. if err != nil {
  108. return err
  109. }
  110. m.Codec = CompressionCodec(attribute & compressionCodecMask)
  111. if m.Version == 1 {
  112. millis, err := pd.getInt64()
  113. if err != nil {
  114. return err
  115. }
  116. // negative timestamps are invalid, in these cases we should return
  117. // a zero time
  118. timestamp := time.Time{}
  119. if millis >= 0 {
  120. timestamp = time.Unix(millis/1000, (millis%1000)*int64(time.Millisecond))
  121. }
  122. m.Timestamp = timestamp
  123. }
  124. m.Key, err = pd.getBytes()
  125. if err != nil {
  126. return err
  127. }
  128. m.Value, err = pd.getBytes()
  129. if err != nil {
  130. return err
  131. }
  132. // Required for deep equal assertion during tests but might be useful
  133. // for future metrics about the compression ratio in fetch requests
  134. m.compressedSize = len(m.Value)
  135. switch m.Codec {
  136. case CompressionNone:
  137. // nothing to do
  138. case CompressionGZIP:
  139. if m.Value == nil {
  140. break
  141. }
  142. reader, err := gzip.NewReader(bytes.NewReader(m.Value))
  143. if err != nil {
  144. return err
  145. }
  146. if m.Value, err = ioutil.ReadAll(reader); err != nil {
  147. return err
  148. }
  149. if err := m.decodeSet(); err != nil {
  150. return err
  151. }
  152. case CompressionSnappy:
  153. if m.Value == nil {
  154. break
  155. }
  156. if m.Value, err = snappy.Decode(m.Value); err != nil {
  157. return err
  158. }
  159. if err := m.decodeSet(); err != nil {
  160. return err
  161. }
  162. case CompressionLZ4:
  163. if m.Value == nil {
  164. break
  165. }
  166. reader := lz4.NewReader(bytes.NewReader(m.Value))
  167. if m.Value, err = ioutil.ReadAll(reader); err != nil {
  168. return err
  169. }
  170. if err := m.decodeSet(); err != nil {
  171. return err
  172. }
  173. default:
  174. return PacketDecodingError{fmt.Sprintf("invalid compression specified (%d)", m.Codec)}
  175. }
  176. return pd.pop()
  177. }
  178. // decodes a message set from a previousy encoded bulk-message
  179. func (m *Message) decodeSet() (err error) {
  180. pd := realDecoder{raw: m.Value}
  181. m.Set = &MessageSet{}
  182. return m.Set.decode(&pd)
  183. }