123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153 |
- package sarama
- import (
- "bytes"
- "compress/gzip"
- "fmt"
- "io/ioutil"
- )
- // CompressionCodec represents the various compression codecs recognized by Kafka in messages.
- type CompressionCodec int8
- // only the last two bits are really used
- const compressionCodecMask int8 = 0x03
- const (
- CompressionNone CompressionCodec = 0
- CompressionGZIP CompressionCodec = 1
- CompressionSnappy CompressionCodec = 2
- )
- // The spec just says: "This is a version id used to allow backwards compatible evolution of the message
- // binary format." but it doesn't say what the current value is, so presumably 0...
- const messageFormat int8 = 0
- type Message struct {
- Codec CompressionCodec // codec used to compress the message contents
- Key []byte // the message key, may be nil
- Value []byte // the message contents
- Set *MessageSet // the message set a message might wrap
- compressedCache []byte
- }
- func (m *Message) encode(pe packetEncoder) error {
- pe.push(&crc32Field{})
- pe.putInt8(messageFormat)
- attributes := int8(m.Codec) & compressionCodecMask
- pe.putInt8(attributes)
- err := pe.putBytes(m.Key)
- if err != nil {
- return err
- }
- var payload []byte
- if m.compressedCache != nil {
- payload = m.compressedCache
- m.compressedCache = nil
- } else {
- switch m.Codec {
- case CompressionNone:
- payload = m.Value
- case CompressionGZIP:
- var buf bytes.Buffer
- writer := gzip.NewWriter(&buf)
- if _, err = writer.Write(m.Value); err != nil {
- return err
- }
- if err = writer.Close(); err != nil {
- return err
- }
- m.compressedCache = buf.Bytes()
- payload = m.compressedCache
- case CompressionSnappy:
- tmp := snappyEncode(m.Value)
- m.compressedCache = tmp
- payload = m.compressedCache
- default:
- return PacketEncodingError{fmt.Sprintf("unsupported compression codec (%d)", m.Codec)}
- }
- }
- if err = pe.putBytes(payload); err != nil {
- return err
- }
- return pe.pop()
- }
- func (m *Message) decode(pd packetDecoder) (err error) {
- err = pd.push(&crc32Field{})
- if err != nil {
- return err
- }
- format, err := pd.getInt8()
- if err != nil {
- return err
- }
- if format != messageFormat {
- return PacketDecodingError{"unexpected messageFormat"}
- }
- attribute, err := pd.getInt8()
- if err != nil {
- return err
- }
- m.Codec = CompressionCodec(attribute & compressionCodecMask)
- m.Key, err = pd.getBytes()
- if err != nil {
- return err
- }
- m.Value, err = pd.getBytes()
- if err != nil {
- return err
- }
- switch m.Codec {
- case CompressionNone:
- // nothing to do
- case CompressionGZIP:
- if m.Value == nil {
- return PacketDecodingError{"GZIP compression specified, but no data to uncompress"}
- }
- reader, err := gzip.NewReader(bytes.NewReader(m.Value))
- if err != nil {
- return err
- }
- if m.Value, err = ioutil.ReadAll(reader); err != nil {
- return err
- }
- if err := m.decodeSet(); err != nil {
- return err
- }
- case CompressionSnappy:
- if m.Value == nil {
- return PacketDecodingError{"Snappy compression specified, but no data to uncompress"}
- }
- if m.Value, err = snappyDecode(m.Value); err != nil {
- return err
- }
- if err := m.decodeSet(); err != nil {
- return err
- }
- default:
- return PacketDecodingError{fmt.Sprintf("invalid compression specified (%d)", m.Codec)}
- }
- return pd.pop()
- }
- // decodes a message set from a previousy encoded bulk-message
- func (m *Message) decodeSet() (err error) {
- pd := realDecoder{raw: m.Value}
- m.Set = &MessageSet{}
- return m.Set.decode(&pd)
- }
|