message.go 4.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189
  1. package sarama
  2. import (
  3. "bytes"
  4. "compress/gzip"
  5. "fmt"
  6. "io/ioutil"
  7. "time"
  8. "github.com/eapache/go-xerial-snappy"
  9. "github.com/pierrec/lz4"
  10. )
  11. // CompressionCodec represents the various compression codecs recognized by Kafka in messages.
  12. type CompressionCodec int8
  13. // only the last two bits are really used
  14. const compressionCodecMask int8 = 0x03
  15. const (
  16. CompressionNone CompressionCodec = 0
  17. CompressionGZIP CompressionCodec = 1
  18. CompressionSnappy CompressionCodec = 2
  19. CompressionLZ4 CompressionCodec = 3
  20. )
  21. type Message struct {
  22. Codec CompressionCodec // codec used to compress the message contents
  23. Key []byte // the message key, may be nil
  24. Value []byte // the message contents
  25. Set *MessageSet // the message set a message might wrap
  26. Version int8 // v1 requires Kafka 0.10
  27. Timestamp time.Time // the timestamp of the message (version 1+ only)
  28. compressedCache []byte
  29. }
  30. func (m *Message) encode(pe packetEncoder) error {
  31. pe.push(&crc32Field{})
  32. pe.putInt8(m.Version)
  33. attributes := int8(m.Codec) & compressionCodecMask
  34. pe.putInt8(attributes)
  35. if m.Version >= 1 {
  36. pe.putInt64(m.Timestamp.UnixNano() / int64(time.Millisecond))
  37. }
  38. err := pe.putBytes(m.Key)
  39. if err != nil {
  40. return err
  41. }
  42. var payload []byte
  43. if m.compressedCache != nil {
  44. payload = m.compressedCache
  45. m.compressedCache = nil
  46. } else if m.Value != nil {
  47. switch m.Codec {
  48. case CompressionNone:
  49. payload = m.Value
  50. case CompressionGZIP:
  51. var buf bytes.Buffer
  52. writer := gzip.NewWriter(&buf)
  53. if _, err = writer.Write(m.Value); err != nil {
  54. return err
  55. }
  56. if err = writer.Close(); err != nil {
  57. return err
  58. }
  59. m.compressedCache = buf.Bytes()
  60. payload = m.compressedCache
  61. case CompressionSnappy:
  62. tmp := snappy.Encode(m.Value)
  63. m.compressedCache = tmp
  64. payload = m.compressedCache
  65. case CompressionLZ4:
  66. var buf bytes.Buffer
  67. writer := lz4.NewWriter(&buf)
  68. if _, err = writer.Write(m.Value); err != nil {
  69. return err
  70. }
  71. if err = writer.Close(); err != nil {
  72. return err
  73. }
  74. m.compressedCache = buf.Bytes()
  75. payload = m.compressedCache
  76. default:
  77. return PacketEncodingError{fmt.Sprintf("unsupported compression codec (%d)", m.Codec)}
  78. }
  79. }
  80. if err = pe.putBytes(payload); err != nil {
  81. return err
  82. }
  83. return pe.pop()
  84. }
  85. func (m *Message) decode(pd packetDecoder) (err error) {
  86. err = pd.push(&crc32Field{})
  87. if err != nil {
  88. return err
  89. }
  90. m.Version, err = pd.getInt8()
  91. if err != nil {
  92. return err
  93. }
  94. attribute, err := pd.getInt8()
  95. if err != nil {
  96. return err
  97. }
  98. m.Codec = CompressionCodec(attribute & compressionCodecMask)
  99. if m.Version >= 1 {
  100. millis, err := pd.getInt64()
  101. if err != nil {
  102. return err
  103. }
  104. m.Timestamp = time.Unix(millis/1000, (millis%1000)*int64(time.Millisecond))
  105. }
  106. m.Key, err = pd.getBytes()
  107. if err != nil {
  108. return err
  109. }
  110. m.Value, err = pd.getBytes()
  111. if err != nil {
  112. return err
  113. }
  114. switch m.Codec {
  115. case CompressionNone:
  116. // nothing to do
  117. case CompressionGZIP:
  118. if m.Value == nil {
  119. break
  120. }
  121. reader, err := gzip.NewReader(bytes.NewReader(m.Value))
  122. if err != nil {
  123. return err
  124. }
  125. if m.Value, err = ioutil.ReadAll(reader); err != nil {
  126. return err
  127. }
  128. if err := m.decodeSet(); err != nil {
  129. return err
  130. }
  131. case CompressionSnappy:
  132. if m.Value == nil {
  133. break
  134. }
  135. if m.Value, err = snappy.Decode(m.Value); err != nil {
  136. return err
  137. }
  138. if err := m.decodeSet(); err != nil {
  139. return err
  140. }
  141. case CompressionLZ4:
  142. if m.Value == nil {
  143. break
  144. }
  145. reader := lz4.NewReader(bytes.NewReader(m.Value))
  146. if m.Value, err = ioutil.ReadAll(reader); err != nil {
  147. return err
  148. }
  149. if err := m.decodeSet(); err != nil {
  150. return err
  151. }
  152. default:
  153. return PacketDecodingError{fmt.Sprintf("invalid compression specified (%d)", m.Codec)}
  154. }
  155. return pd.pop()
  156. }
  157. // decodes a message set from a previousy encoded bulk-message
  158. func (m *Message) decodeSet() (err error) {
  159. pd := realDecoder{raw: m.Value}
  160. m.Set = &MessageSet{}
  161. return m.Set.decode(&pd)
  162. }