123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387 |
- // Copyright 2010 The Go Authors. All rights reserved.
- // Use of this source code is governed by a BSD-style
- // license that can be found in the LICENSE file.
- /*
- Package zip provides support for reading and writing ZIP archives.
- See: https://www.pkware.com/appnote
- This package does not support disk spanning.
- A note about ZIP64:
- To be backwards compatible the FileHeader has both 32 and 64 bit Size
- fields. The 64 bit fields will always contain the correct value and
- for normal archives both fields will be the same. For files requiring
- the ZIP64 format the 32 bit fields will be 0xffffffff and the 64 bit
- fields must be used instead.
- */
- package zip
- import (
- "os"
- "path"
- "time"
- )
- // Compression methods.
- const (
- Store uint16 = 0 // no compression
- Deflate uint16 = 8 // DEFLATE compressed
- )
- const (
- fileHeaderSignature = 0x04034b50
- directoryHeaderSignature = 0x02014b50
- directoryEndSignature = 0x06054b50
- directory64LocSignature = 0x07064b50
- directory64EndSignature = 0x06064b50
- dataDescriptorSignature = 0x08074b50 // de-facto standard; required by OS X Finder
- fileHeaderLen = 30 // + filename + extra
- directoryHeaderLen = 46 // + filename + extra + comment
- directoryEndLen = 22 // + comment
- dataDescriptorLen = 16 // four uint32: descriptor signature, crc32, compressed size, size
- dataDescriptor64Len = 24 // descriptor with 8 byte sizes
- directory64LocLen = 20 //
- directory64EndLen = 56 // + extra
- // Constants for the first byte in CreatorVersion.
- creatorFAT = 0
- creatorUnix = 3
- creatorNTFS = 11
- creatorVFAT = 14
- creatorMacOSX = 19
- // Version numbers.
- zipVersion20 = 20 // 2.0
- zipVersion45 = 45 // 4.5 (reads and writes zip64 archives)
- // Limits for non zip64 files.
- uint16max = (1 << 16) - 1
- uint32max = (1 << 32) - 1
- // Extra header IDs.
- //
- // IDs 0..31 are reserved for official use by PKWARE.
- // IDs above that range are defined by third-party vendors.
- // Since ZIP lacked high precision timestamps (nor a official specification
- // of the timezone used for the date fields), many competing extra fields
- // have been invented. Pervasive use effectively makes them "official".
- //
- // See http://mdfs.net/Docs/Comp/Archiving/Zip/ExtraField
- zip64ExtraID = 0x0001 // Zip64 extended information
- ntfsExtraID = 0x000a // NTFS
- unixExtraID = 0x000d // UNIX
- extTimeExtraID = 0x5455 // Extended timestamp
- infoZipUnixExtraID = 0x5855 // Info-ZIP Unix extension
- )
- // FileHeader describes a file within a zip file.
- // See the zip spec for details.
- type FileHeader struct {
- // Name is the name of the file.
- //
- // It must be a relative path, not start with a drive letter (such as "C:"),
- // and must use forward slashes instead of back slashes. A trailing slash
- // indicates that this file is a directory and should have no data.
- //
- // When reading zip files, the Name field is populated from
- // the zip file directly and is not validated for correctness.
- // It is the caller's responsibility to sanitize it as
- // appropriate, including canonicalizing slash directions,
- // validating that paths are relative, and preventing path
- // traversal through filenames ("../../../").
- Name string
- // Comment is any arbitrary user-defined string shorter than 64KiB.
- Comment string
- // NonUTF8 indicates that Name and Comment are not encoded in UTF-8.
- //
- // By specification, the only other encoding permitted should be CP-437,
- // but historically many ZIP readers interpret Name and Comment as whatever
- // the system's local character encoding happens to be.
- //
- // This flag should only be set if the user intends to encode a non-portable
- // ZIP file for a specific localized region. Otherwise, the Writer
- // automatically sets the ZIP format's UTF-8 flag for valid UTF-8 strings.
- NonUTF8 bool
- CreatorVersion uint16
- ReaderVersion uint16
- Flags uint16
- // Method is the compression method. If zero, Store is used.
- Method uint16
- // Modified is the modified time of the file.
- //
- // When reading, an extended timestamp is preferred over the legacy MS-DOS
- // date field, and the offset between the times is used as the timezone.
- // If only the MS-DOS date is present, the timezone is assumed to be UTC.
- //
- // When writing, an extended timestamp (which is timezone-agnostic) is
- // always emitted. The legacy MS-DOS date field is encoded according to the
- // location of the Modified time.
- Modified time.Time
- ModifiedTime uint16 // Deprecated: Legacy MS-DOS date; use Modified instead.
- ModifiedDate uint16 // Deprecated: Legacy MS-DOS time; use Modified instead.
- CRC32 uint32
- CompressedSize uint32 // Deprecated: Use CompressedSize64 instead.
- UncompressedSize uint32 // Deprecated: Use UncompressedSize64 instead.
- CompressedSize64 uint64
- UncompressedSize64 uint64
- Extra []byte
- ExternalAttrs uint32 // Meaning depends on CreatorVersion
- }
- // FileInfo returns an os.FileInfo for the FileHeader.
- func (h *FileHeader) FileInfo() os.FileInfo {
- return headerFileInfo{h}
- }
- // headerFileInfo implements os.FileInfo.
- type headerFileInfo struct {
- fh *FileHeader
- }
- func (fi headerFileInfo) Name() string { return path.Base(fi.fh.Name) }
- func (fi headerFileInfo) Size() int64 {
- if fi.fh.UncompressedSize64 > 0 {
- return int64(fi.fh.UncompressedSize64)
- }
- return int64(fi.fh.UncompressedSize)
- }
- func (fi headerFileInfo) IsDir() bool { return fi.Mode().IsDir() }
- func (fi headerFileInfo) ModTime() time.Time {
- if fi.fh.Modified.IsZero() {
- return fi.fh.ModTime()
- }
- return fi.fh.Modified.UTC()
- }
- func (fi headerFileInfo) Mode() os.FileMode { return fi.fh.Mode() }
- func (fi headerFileInfo) Sys() interface{} { return fi.fh }
- // FileInfoHeader creates a partially-populated FileHeader from an
- // os.FileInfo.
- // Because os.FileInfo's Name method returns only the base name of
- // the file it describes, it may be necessary to modify the Name field
- // of the returned header to provide the full path name of the file.
- // If compression is desired, callers should set the FileHeader.Method
- // field; it is unset by default.
- func FileInfoHeader(fi os.FileInfo) (*FileHeader, error) {
- size := fi.Size()
- fh := &FileHeader{
- Name: fi.Name(),
- UncompressedSize64: uint64(size),
- }
- fh.SetModTime(fi.ModTime())
- fh.SetMode(fi.Mode())
- if fh.UncompressedSize64 > uint32max {
- fh.UncompressedSize = uint32max
- } else {
- fh.UncompressedSize = uint32(fh.UncompressedSize64)
- }
- return fh, nil
- }
- type directoryEnd struct {
- diskNbr uint32 // unused
- dirDiskNbr uint32 // unused
- dirRecordsThisDisk uint64 // unused
- directoryRecords uint64
- directorySize uint64
- directoryOffset uint64 // relative to file
- commentLen uint16
- comment string
- }
- // timeZone returns a *time.Location based on the provided offset.
- // If the offset is non-sensible, then this uses an offset of zero.
- func timeZone(offset time.Duration) *time.Location {
- const (
- minOffset = -12 * time.Hour // E.g., Baker island at -12:00
- maxOffset = +14 * time.Hour // E.g., Line island at +14:00
- offsetAlias = 15 * time.Minute // E.g., Nepal at +5:45
- )
- offset = offset.Round(offsetAlias)
- if offset < minOffset || maxOffset < offset {
- offset = 0
- }
- return time.FixedZone("", int(offset/time.Second))
- }
- // msDosTimeToTime converts an MS-DOS date and time into a time.Time.
- // The resolution is 2s.
- // See: https://msdn.microsoft.com/en-us/library/ms724247(v=VS.85).aspx
- func msDosTimeToTime(dosDate, dosTime uint16) time.Time {
- return time.Date(
- // date bits 0-4: day of month; 5-8: month; 9-15: years since 1980
- int(dosDate>>9+1980),
- time.Month(dosDate>>5&0xf),
- int(dosDate&0x1f),
- // time bits 0-4: second/2; 5-10: minute; 11-15: hour
- int(dosTime>>11),
- int(dosTime>>5&0x3f),
- int(dosTime&0x1f*2),
- 0, // nanoseconds
- time.UTC,
- )
- }
- // timeToMsDosTime converts a time.Time to an MS-DOS date and time.
- // The resolution is 2s.
- // See: https://msdn.microsoft.com/en-us/library/ms724274(v=VS.85).aspx
- func timeToMsDosTime(t time.Time) (fDate uint16, fTime uint16) {
- fDate = uint16(t.Day() + int(t.Month())<<5 + (t.Year()-1980)<<9)
- fTime = uint16(t.Second()/2 + t.Minute()<<5 + t.Hour()<<11)
- return
- }
- // ModTime returns the modification time in UTC using the legacy
- // ModifiedDate and ModifiedTime fields.
- //
- // Deprecated: Use Modified instead.
- func (h *FileHeader) ModTime() time.Time {
- return msDosTimeToTime(h.ModifiedDate, h.ModifiedTime)
- }
- // SetModTime sets the Modified, ModifiedTime, and ModifiedDate fields
- // to the given time in UTC.
- //
- // Deprecated: Use Modified instead.
- func (h *FileHeader) SetModTime(t time.Time) {
- t = t.UTC() // Convert to UTC for compatibility
- h.Modified = t
- h.ModifiedDate, h.ModifiedTime = timeToMsDosTime(t)
- }
- const (
- // Unix constants. The specification doesn't mention them,
- // but these seem to be the values agreed on by tools.
- s_IFMT = 0xf000
- s_IFSOCK = 0xc000
- s_IFLNK = 0xa000
- s_IFREG = 0x8000
- s_IFBLK = 0x6000
- s_IFDIR = 0x4000
- s_IFCHR = 0x2000
- s_IFIFO = 0x1000
- s_ISUID = 0x800
- s_ISGID = 0x400
- s_ISVTX = 0x200
- msdosDir = 0x10
- msdosReadOnly = 0x01
- )
- // Mode returns the permission and mode bits for the FileHeader.
- func (h *FileHeader) Mode() (mode os.FileMode) {
- switch h.CreatorVersion >> 8 {
- case creatorUnix, creatorMacOSX:
- mode = unixModeToFileMode(h.ExternalAttrs >> 16)
- case creatorNTFS, creatorVFAT, creatorFAT:
- mode = msdosModeToFileMode(h.ExternalAttrs)
- }
- if len(h.Name) > 0 && h.Name[len(h.Name)-1] == '/' {
- mode |= os.ModeDir
- }
- return mode
- }
- // SetMode changes the permission and mode bits for the FileHeader.
- func (h *FileHeader) SetMode(mode os.FileMode) {
- h.CreatorVersion = h.CreatorVersion&0xff | creatorUnix<<8
- h.ExternalAttrs = fileModeToUnixMode(mode) << 16
- // set MSDOS attributes too, as the original zip does.
- if mode&os.ModeDir != 0 {
- h.ExternalAttrs |= msdosDir
- }
- if mode&0200 == 0 {
- h.ExternalAttrs |= msdosReadOnly
- }
- }
- // isZip64 reports whether the file size exceeds the 32 bit limit
- func (h *FileHeader) isZip64() bool {
- return h.CompressedSize64 >= uint32max || h.UncompressedSize64 >= uint32max
- }
- func msdosModeToFileMode(m uint32) (mode os.FileMode) {
- if m&msdosDir != 0 {
- mode = os.ModeDir | 0777
- } else {
- mode = 0666
- }
- if m&msdosReadOnly != 0 {
- mode &^= 0222
- }
- return mode
- }
- func fileModeToUnixMode(mode os.FileMode) uint32 {
- var m uint32
- switch mode & os.ModeType {
- default:
- m = s_IFREG
- case os.ModeDir:
- m = s_IFDIR
- case os.ModeSymlink:
- m = s_IFLNK
- case os.ModeNamedPipe:
- m = s_IFIFO
- case os.ModeSocket:
- m = s_IFSOCK
- case os.ModeDevice:
- if mode&os.ModeCharDevice != 0 {
- m = s_IFCHR
- } else {
- m = s_IFBLK
- }
- }
- if mode&os.ModeSetuid != 0 {
- m |= s_ISUID
- }
- if mode&os.ModeSetgid != 0 {
- m |= s_ISGID
- }
- if mode&os.ModeSticky != 0 {
- m |= s_ISVTX
- }
- return m | uint32(mode&0777)
- }
- func unixModeToFileMode(m uint32) os.FileMode {
- mode := os.FileMode(m & 0777)
- switch m & s_IFMT {
- case s_IFBLK:
- mode |= os.ModeDevice
- case s_IFCHR:
- mode |= os.ModeDevice | os.ModeCharDevice
- case s_IFDIR:
- mode |= os.ModeDir
- case s_IFIFO:
- mode |= os.ModeNamedPipe
- case s_IFLNK:
- mode |= os.ModeSymlink
- case s_IFREG:
- // nothing to do
- case s_IFSOCK:
- mode |= os.ModeSocket
- }
- if m&s_ISGID != 0 {
- mode |= os.ModeSetgid
- }
- if m&s_ISUID != 0 {
- mode |= os.ModeSetuid
- }
- if m&s_ISVTX != 0 {
- mode |= os.ModeSticky
- }
- return mode
- }
|