frame.go 7.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340
  1. package lz4
  2. import (
  3. "encoding/binary"
  4. "fmt"
  5. "io"
  6. "io/ioutil"
  7. "github.com/pierrec/lz4/internal/xxh32"
  8. )
  9. //go:generate go run gen.go
  10. type Frame struct {
  11. Magic uint32
  12. Descriptor FrameDescriptor
  13. Blocks Blocks
  14. Checksum uint32
  15. checksum xxh32.XXHZero
  16. }
  17. func (f *Frame) initW(w *_Writer) {
  18. f.Magic = frameMagic
  19. f.Descriptor.initW(w)
  20. f.Blocks.initW(w)
  21. f.checksum.Reset()
  22. }
  23. func (f *Frame) closeW(w *_Writer) error {
  24. if err := f.Blocks.closeW(w); err != nil {
  25. return err
  26. }
  27. buf := w.buf[:0]
  28. if f.Descriptor.Flags.ContentChecksum() {
  29. buf = f.checksum.Sum(buf)
  30. }
  31. // End mark (data block size of uint32(0)).
  32. buf = append(buf, 0, 0, 0, 0)
  33. _, err := w.src.Write(buf)
  34. return err
  35. }
  36. func (f *Frame) initR(r *_Reader) error {
  37. if f.Magic > 0 {
  38. // Header already read.
  39. return nil
  40. }
  41. newFrame:
  42. if err := readUint32(r.src, r.buf[:], &f.Magic); err != nil {
  43. return err
  44. }
  45. switch m := f.Magic; {
  46. case m == frameMagic:
  47. // All 16 values of frameSkipMagic are valid.
  48. case m>>8 == frameSkipMagic>>8:
  49. var skip uint32
  50. if err := binary.Read(r.src, binary.LittleEndian, &skip); err != nil {
  51. return err
  52. }
  53. if _, err := io.CopyN(ioutil.Discard, r.src, int64(skip)); err != nil {
  54. return err
  55. }
  56. goto newFrame
  57. default:
  58. return ErrInvalid
  59. }
  60. if err := f.Descriptor.initR(r); err != nil {
  61. return err
  62. }
  63. f.Blocks.initR(r)
  64. f.checksum.Reset()
  65. return nil
  66. }
  67. func (f *Frame) closeR(r *_Reader) error {
  68. f.Magic = 0
  69. if !f.Descriptor.Flags.ContentChecksum() {
  70. return nil
  71. }
  72. if err := readUint32(r.src, r.buf[:], &f.Checksum); err != nil {
  73. return err
  74. }
  75. if c := f.checksum.Sum32(); c != f.Checksum {
  76. return fmt.Errorf("%w: got %x; expected %x", ErrInvalidFrameChecksum, c, f.Checksum)
  77. }
  78. return nil
  79. }
  80. type FrameDescriptor struct {
  81. Flags DescriptorFlags
  82. ContentSize uint64
  83. Checksum uint8
  84. }
  85. func (fd *FrameDescriptor) initW(_ *_Writer) {
  86. fd.Flags.VersionSet(1)
  87. fd.Flags.BlockIndependenceSet(false)
  88. }
  89. func (fd *FrameDescriptor) write(w *_Writer) error {
  90. if fd.Checksum > 0 {
  91. // Header already written.
  92. return nil
  93. }
  94. buf := w.buf[:]
  95. binary.LittleEndian.PutUint16(buf, uint16(fd.Flags))
  96. var checksum uint32
  97. if fd.Flags.Size() {
  98. checksum = xxh32.ChecksumZero10(uint16(fd.Flags), fd.ContentSize)
  99. binary.LittleEndian.PutUint64(buf[2:], fd.ContentSize)
  100. buf = buf[:10]
  101. } else {
  102. checksum = xxh32.Uint32Zero(uint32(fd.Flags))
  103. buf = buf[:2]
  104. }
  105. fd.Checksum = byte(checksum >> 8)
  106. buf = append(buf, fd.Checksum)
  107. _, err := w.src.Write(buf)
  108. return err
  109. }
  110. func (fd *FrameDescriptor) initR(r *_Reader) error {
  111. buf := r.buf[:2]
  112. if _, err := io.ReadFull(r.src, buf); err != nil {
  113. return err
  114. }
  115. descr := binary.LittleEndian.Uint64(buf)
  116. fd.Flags = DescriptorFlags(descr)
  117. var checksum uint32
  118. if fd.Flags.Size() {
  119. buf = buf[:9]
  120. if _, err := io.ReadFull(r.src, buf); err != nil {
  121. return err
  122. }
  123. fd.ContentSize = binary.LittleEndian.Uint64(buf)
  124. checksum = xxh32.ChecksumZero10(uint16(fd.Flags), fd.ContentSize)
  125. } else {
  126. buf = buf[:1]
  127. var err error
  128. if br, ok := r.src.(io.ByteReader); ok {
  129. buf[0], err = br.ReadByte()
  130. } else {
  131. _, err = io.ReadFull(r.src, buf)
  132. }
  133. if err != nil {
  134. return err
  135. }
  136. checksum = xxh32.Uint32Zero(uint32(fd.Flags))
  137. }
  138. fd.Checksum = buf[len(buf)-1]
  139. if c := byte(checksum >> 8); fd.Checksum != c {
  140. return fmt.Errorf("lz4: %w: got %x; expected %x", ErrInvalidHeaderChecksum, c, fd.Checksum)
  141. }
  142. return nil
  143. }
  144. type Blocks struct {
  145. Block *FrameDataBlock
  146. Blocks chan chan *FrameDataBlock
  147. err error
  148. }
  149. func (b *Blocks) initW(w *_Writer) {
  150. size := w.frame.Descriptor.Flags.BlockSizeIndex()
  151. if w.isNotConcurrent() {
  152. b.Blocks = nil
  153. b.Block = newFrameDataBlock(size)
  154. return
  155. }
  156. if cap(b.Blocks) != w.num {
  157. b.Blocks = make(chan chan *FrameDataBlock, w.num)
  158. }
  159. // goroutine managing concurrent block compression goroutines.
  160. go func() {
  161. // Process next block compression item.
  162. for c := range b.Blocks {
  163. // Read the next compressed block result.
  164. // Waiting here ensures that the blocks are output in the order they were sent.
  165. // The incoming channel is always closed as it indicates to the caller that
  166. // the block has been processed.
  167. block := <-c
  168. if block == nil {
  169. // Notify the block compression routine that we are done with its result.
  170. // This is used when a sentinel block is sent to terminate the compression.
  171. close(c)
  172. return
  173. }
  174. // Do not attempt to write the block upon any previous failure.
  175. if b.err == nil {
  176. // Write the block.
  177. if err := block.write(w); err != nil && b.err == nil {
  178. // Keep the first error.
  179. b.err = err
  180. // All pending compression goroutines need to shut down, so we need to keep going.
  181. }
  182. }
  183. close(c)
  184. }
  185. }()
  186. }
  187. func (b *Blocks) closeW(w *_Writer) error {
  188. if w.isNotConcurrent() {
  189. b.Block.closeW(w)
  190. b.Block = nil
  191. return nil
  192. }
  193. c := make(chan *FrameDataBlock)
  194. b.Blocks <- c
  195. c <- nil
  196. <-c
  197. err := b.err
  198. b.err = nil
  199. return err
  200. }
  201. func (b *Blocks) initR(r *_Reader) {
  202. size := r.frame.Descriptor.Flags.BlockSizeIndex()
  203. b.Block = newFrameDataBlock(size)
  204. }
  205. func newFrameDataBlock(size BlockSizeIndex) *FrameDataBlock {
  206. return &FrameDataBlock{Data: size.get()}
  207. }
  208. type FrameDataBlock struct {
  209. Size DataBlockSize
  210. Data []byte
  211. Checksum uint32
  212. }
  213. func (b *FrameDataBlock) closeW(w *_Writer) {
  214. size := w.frame.Descriptor.Flags.BlockSizeIndex()
  215. size.put(b.Data)
  216. }
  217. // Block compression errors are ignored since the buffer is sized appropriately.
  218. func (b *FrameDataBlock) compress(w *_Writer, src []byte, ht []int) *FrameDataBlock {
  219. dst := b.Data
  220. var n int
  221. switch w.level {
  222. case Fast:
  223. n, _ = CompressBlock(src, dst, ht)
  224. default:
  225. n, _ = CompressBlockHC(src, dst, w.level, ht)
  226. }
  227. if n == 0 {
  228. b.Size.compressedSet(false)
  229. dst = src
  230. } else {
  231. b.Size.compressedSet(true)
  232. dst = dst[:n]
  233. }
  234. b.Data = dst
  235. b.Size.sizeSet(len(dst))
  236. if w.frame.Descriptor.Flags.BlockChecksum() {
  237. b.Checksum = xxh32.ChecksumZero(src)
  238. }
  239. if w.frame.Descriptor.Flags.ContentChecksum() {
  240. _, _ = w.frame.checksum.Write(src)
  241. }
  242. return b
  243. }
  244. func (b *FrameDataBlock) write(w *_Writer) error {
  245. buf := w.buf[:]
  246. out := w.src
  247. binary.LittleEndian.PutUint32(buf, uint32(b.Size))
  248. if _, err := out.Write(buf[:4]); err != nil {
  249. return err
  250. }
  251. if _, err := out.Write(b.Data); err != nil {
  252. return err
  253. }
  254. if b.Checksum == 0 {
  255. return nil
  256. }
  257. binary.LittleEndian.PutUint32(buf, b.Checksum)
  258. _, err := out.Write(buf[:4])
  259. return err
  260. }
  261. func (b *FrameDataBlock) uncompress(r *_Reader, dst []byte) (int, error) {
  262. var x uint32
  263. if err := readUint32(r.src, r.buf[:], &x); err != nil {
  264. return 0, err
  265. }
  266. b.Size = DataBlockSize(x)
  267. if b.Size == 0 {
  268. return 0, io.EOF
  269. }
  270. isCompressed := b.Size.compressed()
  271. var data []byte
  272. if isCompressed {
  273. data = b.Data
  274. } else {
  275. data = dst
  276. }
  277. if _, err := io.ReadFull(r.src, data[:b.Size.size()]); err != nil {
  278. return 0, err
  279. }
  280. if isCompressed {
  281. n, err := UncompressBlock(data, dst)
  282. if err != nil {
  283. return 0, err
  284. }
  285. data = dst[:n]
  286. }
  287. if r.frame.Descriptor.Flags.BlockChecksum() {
  288. if err := readUint32(r.src, r.buf[:], &b.Checksum); err != nil {
  289. return 0, err
  290. }
  291. if c := xxh32.ChecksumZero(data); c != b.Checksum {
  292. return 0, fmt.Errorf("lz4: %w: got %x; expected %x", ErrInvalidBlockChecksum, c, b.Checksum)
  293. }
  294. }
  295. if r.frame.Descriptor.Flags.ContentChecksum() {
  296. _, _ = r.frame.checksum.Write(data)
  297. }
  298. return len(data), nil
  299. }
  300. func readUint32(r io.Reader, buf []byte, x *uint32) error {
  301. if _, err := io.ReadFull(r, buf[:4]); err != nil {
  302. return err
  303. }
  304. *x = binary.LittleEndian.Uint32(buf)
  305. return nil
  306. }