writer.go 6.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273
  1. package lz4
  2. import (
  3. "encoding/binary"
  4. "fmt"
  5. "io"
  6. "github.com/pierrec/lz4/internal/xxh32"
  7. )
  8. // Writer implements the LZ4 frame encoder.
  9. type Writer struct {
  10. Header
  11. // Handler called when a block has been successfully written out.
  12. // It provides the number of bytes written.
  13. OnBlockDone func(size int)
  14. buf [19]byte // magic number(4) + header(flags(2)+[Size(8)+DictID(4)]+checksum(1)) does not exceed 19 bytes
  15. dst io.Writer // Destination.
  16. checksum xxh32.XXHZero // Frame checksum.
  17. zdata []byte // Compressed data.
  18. data []byte // Data to be compressed.
  19. idx int // Index into data.
  20. hashtable [winSize]int // Hash table used in CompressBlock().
  21. }
  22. // NewWriter returns a new LZ4 frame encoder.
  23. // No access to the underlying io.Writer is performed.
  24. // The supplied Header is checked at the first Write.
  25. // It is ok to change it before the first Write but then not until a Reset() is performed.
  26. func NewWriter(dst io.Writer) *Writer {
  27. return &Writer{dst: dst}
  28. }
  29. // writeHeader builds and writes the header (magic+header) to the underlying io.Writer.
  30. func (z *Writer) writeHeader() error {
  31. // Default to 4Mb if BlockMaxSize is not set.
  32. if z.Header.BlockMaxSize == 0 {
  33. z.Header.BlockMaxSize = bsMapID[7]
  34. }
  35. // The only option that needs to be validated.
  36. bSize := z.Header.BlockMaxSize
  37. bSizeID, ok := bsMapValue[bSize]
  38. if !ok {
  39. return fmt.Errorf("lz4: invalid block max size: %d", bSize)
  40. }
  41. // Allocate the compressed/uncompressed buffers.
  42. // The compressed buffer cannot exceed the uncompressed one.
  43. if n := 2 * bSize; cap(z.zdata) < n {
  44. z.zdata = make([]byte, n, n)
  45. }
  46. z.data = z.zdata[:bSize]
  47. z.zdata = z.zdata[:cap(z.zdata)][bSize:]
  48. z.idx = 0
  49. // Size is optional.
  50. buf := z.buf[:]
  51. // Set the fixed size data: magic number, block max size and flags.
  52. binary.LittleEndian.PutUint32(buf[0:], frameMagic)
  53. flg := byte(Version << 6)
  54. flg |= 1 << 5 // No block dependency.
  55. if z.Header.BlockChecksum {
  56. flg |= 1 << 4
  57. }
  58. if z.Header.Size > 0 {
  59. flg |= 1 << 3
  60. }
  61. if !z.Header.NoChecksum {
  62. flg |= 1 << 2
  63. }
  64. buf[4] = flg
  65. buf[5] = bSizeID << 4
  66. // Current buffer size: magic(4) + flags(1) + block max size (1).
  67. n := 6
  68. // Optional items.
  69. if z.Header.Size > 0 {
  70. binary.LittleEndian.PutUint64(buf[n:], z.Header.Size)
  71. n += 8
  72. }
  73. // The header checksum includes the flags, block max size and optional Size.
  74. buf[n] = byte(xxh32.ChecksumZero(buf[4:n]) >> 8 & 0xFF)
  75. z.checksum.Reset()
  76. // Header ready, write it out.
  77. if _, err := z.dst.Write(buf[0 : n+1]); err != nil {
  78. return err
  79. }
  80. z.Header.done = true
  81. if debugFlag {
  82. debug("wrote header %v", z.Header)
  83. }
  84. return nil
  85. }
  86. // Write compresses data from the supplied buffer into the underlying io.Writer.
  87. // Write does not return until the data has been written.
  88. func (z *Writer) Write(buf []byte) (int, error) {
  89. if !z.Header.done {
  90. if err := z.writeHeader(); err != nil {
  91. return 0, err
  92. }
  93. }
  94. if debugFlag {
  95. debug("input buffer len=%d index=%d", len(buf), z.idx)
  96. }
  97. zn := len(z.data)
  98. var n int
  99. for len(buf) > 0 {
  100. if z.idx == 0 && len(buf) >= zn {
  101. // Avoid a copy as there is enough data for a block.
  102. if err := z.compressBlock(buf[:zn]); err != nil {
  103. return n, err
  104. }
  105. n += zn
  106. buf = buf[zn:]
  107. continue
  108. }
  109. // Accumulate the data to be compressed.
  110. m := copy(z.data[z.idx:], buf)
  111. n += m
  112. z.idx += m
  113. buf = buf[m:]
  114. if debugFlag {
  115. debug("%d bytes copied to buf, current index %d", n, z.idx)
  116. }
  117. if z.idx < len(z.data) {
  118. // Buffer not filled.
  119. if debugFlag {
  120. debug("need more data for compression")
  121. }
  122. return n, nil
  123. }
  124. // Buffer full.
  125. if err := z.compressBlock(z.data); err != nil {
  126. return n, err
  127. }
  128. z.idx = 0
  129. }
  130. return n, nil
  131. }
  132. // compressBlock compresses a block.
  133. func (z *Writer) compressBlock(data []byte) error {
  134. if !z.NoChecksum {
  135. z.checksum.Write(data)
  136. }
  137. // The compressed block size cannot exceed the input's.
  138. var zn int
  139. var err error
  140. if level := z.Header.CompressionLevel; level != 0 {
  141. zn, err = CompressBlockHC(data, z.zdata, level)
  142. } else {
  143. zn, err = CompressBlock(data, z.zdata, z.hashtable[:])
  144. }
  145. var zdata []byte
  146. var bLen uint32
  147. if debugFlag {
  148. debug("block compression %d => %d", len(data), zn)
  149. }
  150. if err == nil && zn > 0 && zn < len(data) {
  151. // Compressible and compressed size smaller than uncompressed: ok!
  152. bLen = uint32(zn)
  153. zdata = z.zdata[:zn]
  154. } else {
  155. // Uncompressed block.
  156. bLen = uint32(len(data)) | compressedBlockFlag
  157. zdata = data
  158. }
  159. if debugFlag {
  160. debug("block compression to be written len=%d data len=%d", bLen, len(zdata))
  161. }
  162. // Write the block.
  163. if err := z.writeUint32(bLen); err != nil {
  164. return err
  165. }
  166. written, err := z.dst.Write(zdata)
  167. if err != nil {
  168. return err
  169. }
  170. if h := z.OnBlockDone; h != nil {
  171. h(written)
  172. }
  173. if !z.BlockChecksum {
  174. if debugFlag {
  175. debug("current frame checksum %x", z.checksum.Sum32())
  176. }
  177. return nil
  178. }
  179. checksum := xxh32.ChecksumZero(zdata)
  180. if debugFlag {
  181. debug("block checksum %x", checksum)
  182. defer func() { debug("current frame checksum %x", z.checksum.Sum32()) }()
  183. }
  184. return z.writeUint32(checksum)
  185. }
  186. // Flush flushes any pending compressed data to the underlying writer.
  187. // Flush does not return until the data has been written.
  188. // If the underlying writer returns an error, Flush returns that error.
  189. func (z *Writer) Flush() error {
  190. if debugFlag {
  191. debug("flush with index %d", z.idx)
  192. }
  193. if z.idx == 0 {
  194. return nil
  195. }
  196. if err := z.compressBlock(z.data[:z.idx]); err != nil {
  197. return err
  198. }
  199. z.idx = 0
  200. return nil
  201. }
  202. // Close closes the Writer, flushing any unwritten data to the underlying io.Writer, but does not close the underlying io.Writer.
  203. func (z *Writer) Close() error {
  204. if !z.Header.done {
  205. if err := z.writeHeader(); err != nil {
  206. return err
  207. }
  208. }
  209. if err := z.Flush(); err != nil {
  210. return err
  211. }
  212. if debugFlag {
  213. debug("writing last empty block")
  214. }
  215. if err := z.writeUint32(0); err != nil {
  216. return err
  217. }
  218. if z.NoChecksum {
  219. return nil
  220. }
  221. checksum := z.checksum.Sum32()
  222. if debugFlag {
  223. debug("stream checksum %x", checksum)
  224. }
  225. return z.writeUint32(checksum)
  226. }
  227. // Reset clears the state of the Writer z such that it is equivalent to its
  228. // initial state from NewWriter, but instead writing to w.
  229. // No access to the underlying io.Writer is performed.
  230. func (z *Writer) Reset(w io.Writer) {
  231. z.Header = Header{}
  232. z.dst = w
  233. z.checksum.Reset()
  234. z.zdata = z.zdata[:0]
  235. z.data = z.data[:0]
  236. z.idx = 0
  237. }
  238. // writeUint32 writes a uint32 to the underlying writer.
  239. func (z *Writer) writeUint32(x uint32) error {
  240. buf := z.buf[:4]
  241. binary.LittleEndian.PutUint32(buf, x)
  242. _, err := z.dst.Write(buf)
  243. return err
  244. }