| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801 |
- package xlsx
- import (
- "archive/zip"
- "encoding/xml"
- "errors"
- "fmt"
- "io"
- "math"
- "strconv"
- "strings"
- )
- // XLSXReaderError is the standard error type for otherwise undefined
- // errors in the XSLX reading process.
- type XLSXReaderError struct {
- Err string
- }
- // String() returns a string value from an XLSXReaderError struct in
- // order that it might comply with the os.Error interface.
- func (e *XLSXReaderError) Error() string {
- return e.Err
- }
- // Cell is a high level structure intended to provide user access to
- // the contents of Cell within an xlsx.Row.
- type Cell struct {
- Value string
- styleIndex int
- styles *xlsxStyles
- numFmtRefTable map[int]xlsxNumFmt
- date1904 bool
- }
- // CellInterface defines the public API of the Cell.
- type CellInterface interface {
- String() string
- }
- // String returns the value of a Cell as a string.
- func (c *Cell) String() string {
- return c.Value
- }
- // GetStyle returns the Style associated with a Cell
- func (c *Cell) GetStyle() *Style {
- style := &Style{}
- if c.styleIndex > 0 && c.styleIndex <= len(c.styles.CellXfs) {
- xf := c.styles.CellXfs[c.styleIndex-1]
- if xf.ApplyBorder {
- var border Border
- border.Left = c.styles.Borders[xf.BorderId].Left.Style
- border.Right = c.styles.Borders[xf.BorderId].Right.Style
- border.Top = c.styles.Borders[xf.BorderId].Top.Style
- border.Bottom = c.styles.Borders[xf.BorderId].Bottom.Style
- style.Border = border
- }
- if xf.ApplyFill {
- var fill Fill
- fill.PatternType = c.styles.Fills[xf.FillId].PatternFill.PatternType
- fill.BgColor = c.styles.Fills[xf.FillId].PatternFill.BgColor.RGB
- fill.FgColor = c.styles.Fills[xf.FillId].PatternFill.FgColor.RGB
- style.Fill = fill
- }
- if xf.ApplyFont {
- font := c.styles.Fonts[xf.FontId]
- style.Font = Font{}
- style.Font.Size, _ = strconv.Atoi(font.Sz.Val)
- style.Font.Name = font.Name.Val
- style.Font.Family, _ = strconv.Atoi(font.Family.Val)
- style.Font.Charset, _ = strconv.Atoi(font.Charset.Val)
- }
- }
- return style
- }
- // The number format string is returnable from a cell.
- func (c *Cell) GetNumberFormat() string {
- var numberFormat string = ""
- if c.styleIndex > 0 && c.styleIndex <= len(c.styles.CellXfs) {
- xf := c.styles.CellXfs[c.styleIndex-1]
- numFmt := c.numFmtRefTable[xf.NumFmtId]
- numberFormat = numFmt.FormatCode
- }
- return strings.ToLower(numberFormat)
- }
- func (c *Cell) formatToTime(format string) string {
- f, err := strconv.ParseFloat(c.Value, 64)
- if err != nil {
- return err.Error()
- }
- return TimeFromExcelTime(f, c.date1904).Format(format)
- }
- func (c *Cell) formatToFloat(format string) string {
- f, err := strconv.ParseFloat(c.Value, 64)
- if err != nil {
- return err.Error()
- }
- return fmt.Sprintf(format, f)
- }
- func (c *Cell) formatToInt(format string) string {
- f, err := strconv.ParseFloat(c.Value, 64)
- if err != nil {
- return err.Error()
- }
- return fmt.Sprintf(format, int(f))
- }
- // Return the formatted version of the value.
- func (c *Cell) FormattedValue() string {
- var numberFormat string = c.GetNumberFormat()
- switch numberFormat {
- case "general":
- return c.Value
- case "0", "#,##0":
- return c.formatToInt("%d")
- case "0.00", "#,##0.00", "@":
- return c.formatToFloat("%.2f")
- case "#,##0 ;(#,##0)", "#,##0 ;[red](#,##0)":
- f, err := strconv.ParseFloat(c.Value, 64)
- if err != nil {
- return err.Error()
- }
- if f < 0 {
- i := int(math.Abs(f))
- return fmt.Sprintf("(%d)", i)
- }
- i := int(f)
- return fmt.Sprintf("%d", i)
- case "#,##0.00;(#,##0.00)", "#,##0.00;[red](#,##0.00)":
- f, err := strconv.ParseFloat(c.Value, 64)
- if err != nil {
- return err.Error()
- }
- if f < 0 {
- return fmt.Sprintf("(%.2f)", f)
- }
- return fmt.Sprintf("%.2f", f)
- case "0%":
- f, err := strconv.ParseFloat(c.Value, 64)
- if err != nil {
- return err.Error()
- }
- f = f * 100
- return fmt.Sprintf("%d%%", int(f))
- case "0.00%":
- f, err := strconv.ParseFloat(c.Value, 64)
- if err != nil {
- return err.Error()
- }
- f = f * 100
- return fmt.Sprintf("%.2f%%", f)
- case "0.00e+00", "##0.0e+0":
- return c.formatToFloat("%e")
- case "mm-dd-yy":
- return c.formatToTime("01-02-06")
- case "d-mmm-yy":
- return c.formatToTime("2-Jan-06")
- case "d-mmm":
- return c.formatToTime("2-Jan")
- case "mmm-yy":
- return c.formatToTime("Jan-06")
- case "h:mm am/pm":
- return c.formatToTime("3:04 pm")
- case "h:mm:ss am/pm":
- return c.formatToTime("3:04:05 pm")
- case "h:mm":
- return c.formatToTime("15:04")
- case "h:mm:ss":
- return c.formatToTime("15:04:05")
- case "m/d/yy h:mm":
- return c.formatToTime("1/2/06 15:04")
- case "mm:ss":
- return c.formatToTime("04:05")
- case "[h]:mm:ss":
- f, err := strconv.ParseFloat(c.Value, 64)
- if err != nil {
- return err.Error()
- }
- t := TimeFromExcelTime(f, c.date1904)
- if t.Hour() > 0 {
- return t.Format("15:04:05")
- }
- return t.Format("04:05")
- case "mmss.0":
- f, err := strconv.ParseFloat(c.Value, 64)
- if err != nil {
- return err.Error()
- }
- t := TimeFromExcelTime(f, c.date1904)
- return fmt.Sprintf("%0d%0d.%d", t.Minute(), t.Second(), t.Nanosecond()/1000)
- case "yyyy\\-mm\\-dd":
- return c.formatToTime("2006\\-01\\-02")
- case "dd/mm/yy":
- return c.formatToTime("02/01/06")
- case "hh:mm:ss":
- return c.formatToTime("15:04:05")
- case "dd/mm/yy\\ hh:mm":
- return c.formatToTime("02/01/06\\ 15:04")
- case "dd/mm/yyyy hh:mm:ss":
- return c.formatToTime("02/01/2006 15:04:05")
- case "yy-mm-dd":
- return c.formatToTime("06-01-02")
- case "d-mmm-yyyy":
- return c.formatToTime("2-Jan-2006")
- case "m/d/yy":
- return c.formatToTime("1/2/06")
- case "m/d/yyyy":
- return c.formatToTime("1/2/2006")
- case "dd-mmm-yyyy":
- return c.formatToTime("02-Jan-2006")
- case "dd/mm/yyyy":
- return c.formatToTime("02/01/2006")
- case "mm/dd/yy hh:mm am/pm":
- return c.formatToTime("01/02/06 03:04 pm")
- case "mm/dd/yyyy hh:mm:ss":
- return c.formatToTime("01/02/2006 15:04:05")
- case "yyyy-mm-dd hh:mm:ss":
- return c.formatToTime("2006-01-02 15:04:05")
- }
- return c.Value
- }
- // Row is a high level structure indended to provide user access to a
- // row within a xlsx.Sheet. An xlsx.Row contains a slice of xlsx.Cell.
- type Row struct {
- Cells []*Cell
- }
- // Sheet is a high level structure intended to provide user access to
- // the contents of a particular sheet within an XLSX file.
- type Sheet struct {
- Name string
- Rows []*Row
- MaxRow int
- MaxCol int
- }
- // Style is a high level structure intended to provide user access to
- // the contents of Style within an XLSX file.
- type Style struct {
- Border Border
- Fill Fill
- Font Font
- }
- // Border is a high level structure intended to provide user access to
- // the contents of Border Style within an Sheet.
- type Border struct {
- Left string
- Right string
- Top string
- Bottom string
- }
- // Fill is a high level structure intended to provide user access to
- // the contents of background and foreground color index within an Sheet.
- type Fill struct {
- PatternType string
- BgColor string
- FgColor string
- }
- type Font struct {
- Size int
- Name string
- Family int
- Charset int
- }
- // File is a high level structure providing a slice of Sheet structs
- // to the user.
- type File struct {
- worksheets map[string]*zip.File
- numFmtRefTable map[int]xlsxNumFmt
- referenceTable []string
- styles *xlsxStyles
- Sheets []*Sheet // sheet access by index
- Sheet map[string]*Sheet // sheet access by name
- Date1904 bool
- }
- // getRangeFromString is an internal helper function that converts
- // XLSX internal range syntax to a pair of integers. For example,
- // the range string "1:3" yield the upper and lower intergers 1 and 3.
- func getRangeFromString(rangeString string) (lower int, upper int, error error) {
- var parts []string
- parts = strings.SplitN(rangeString, ":", 2)
- if parts[0] == "" {
- error = errors.New(fmt.Sprintf("Invalid range '%s'\n", rangeString))
- }
- if parts[1] == "" {
- error = errors.New(fmt.Sprintf("Invalid range '%s'\n", rangeString))
- }
- lower, error = strconv.Atoi(parts[0])
- if error != nil {
- error = errors.New(fmt.Sprintf("Invalid range (not integer in lower bound) %s\n", rangeString))
- }
- upper, error = strconv.Atoi(parts[1])
- if error != nil {
- error = errors.New(fmt.Sprintf("Invalid range (not integer in upper bound) %s\n", rangeString))
- }
- return lower, upper, error
- }
- // lettersToNumeric is used to convert a character based column
- // reference to a zero based numeric column identifier.
- func lettersToNumeric(letters string) int {
- sum, mul, n := 0, 1, 0
- for i := len(letters) - 1; i >= 0; i, mul, n = i-1, mul*26, 1 {
- c := letters[i]
- switch {
- case 'A' <= c && c <= 'Z':
- n += int(c - 'A')
- case 'a' <= c && c <= 'z':
- n += int(c - 'a')
- }
- sum += n * mul
- }
- return sum
- }
- // letterOnlyMapF is used in conjunction with strings.Map to return
- // only the characters A-Z and a-z in a string
- func letterOnlyMapF(rune rune) rune {
- switch {
- case 'A' <= rune && rune <= 'Z':
- return rune
- case 'a' <= rune && rune <= 'z':
- return rune - 32
- }
- return -1
- }
- // intOnlyMapF is used in conjunction with strings.Map to return only
- // the numeric portions of a string.
- func intOnlyMapF(rune rune) rune {
- if rune >= 48 && rune < 58 {
- return rune
- }
- return -1
- }
- // getCoordsFromCellIDString returns the zero based cartesian
- // coordinates from a cell name in Excel format, e.g. the cellIDString
- // "A1" returns 0, 0 and the "B3" return 1, 2.
- func getCoordsFromCellIDString(cellIDString string) (x, y int, error error) {
- var letterPart string = strings.Map(letterOnlyMapF, cellIDString)
- y, error = strconv.Atoi(strings.Map(intOnlyMapF, cellIDString))
- if error != nil {
- return x, y, error
- }
- y -= 1 // Zero based
- x = lettersToNumeric(letterPart)
- return x, y, error
- }
- // getMaxMinFromDimensionRef return the zero based cartesian maximum
- // and minimum coordinates from the dimension reference embedded in a
- // XLSX worksheet. For example, the dimension reference "A1:B2"
- // returns "0,0", "1,1".
- func getMaxMinFromDimensionRef(ref string) (minx, miny, maxx, maxy int, err error) {
- var parts []string
- parts = strings.Split(ref, ":")
- minx, miny, err = getCoordsFromCellIDString(parts[0])
- if err != nil {
- return -1, -1, -1, -1, err
- }
- if len(parts) == 1 {
- maxx, maxy = minx, miny
- return
- }
- maxx, maxy, err = getCoordsFromCellIDString(parts[1])
- if err != nil {
- return -1, -1, -1, -1, err
- }
- return
- }
- // calculateMaxMinFromWorkSheet works out the dimensions of a spreadsheet
- // that doesn't have a DimensionRef set. The only case currently
- // known where this is true is with XLSX exported from Google Docs.
- func calculateMaxMinFromWorksheet(worksheet *xlsxWorksheet) (minx, miny, maxx, maxy int, err error) {
- // Note, this method could be very slow for large spreadsheets.
- var x, y int
- minx = 0
- miny = 0
- maxy = 0
- maxx = 0
- for _, row := range worksheet.SheetData.Row {
- for _, cell := range row.C {
- x, y, err = getCoordsFromCellIDString(cell.R)
- if err != nil {
- return -1, -1, -1, -1, err
- }
- if x < minx {
- minx = x
- }
- if x > maxx {
- maxx = x
- }
- if y < miny {
- miny = y
- }
- if y > maxy {
- maxy = y
- }
- }
- }
- return
- }
- // makeRowFromSpan will, when given a span expressed as a string,
- // return an empty Row large enough to encompass that span and
- // populate it with empty cells. All rows start from cell 1 -
- // regardless of the lower bound of the span.
- func makeRowFromSpan(spans string) *Row {
- var error error
- var upper int
- var row *Row
- var cell *Cell
- row = new(Row)
- _, upper, error = getRangeFromString(spans)
- if error != nil {
- panic(error)
- }
- error = nil
- row.Cells = make([]*Cell, upper)
- for i := 0; i < upper; i++ {
- cell = new(Cell)
- cell.Value = ""
- row.Cells[i] = cell
- }
- return row
- }
- // makeRowFromRaw returns the Row representation of the xlsxRow.
- func makeRowFromRaw(rawrow xlsxRow) *Row {
- var upper int
- var row *Row
- var cell *Cell
- row = new(Row)
- upper = -1
- for _, rawcell := range rawrow.C {
- x, _, error := getCoordsFromCellIDString(rawcell.R)
- if error != nil {
- panic(fmt.Sprintf("Invalid Cell Coord, %s\n", rawcell.R))
- }
- if x > upper {
- upper = x
- }
- }
- upper++
- row.Cells = make([]*Cell, upper)
- for i := 0; i < upper; i++ {
- cell = new(Cell)
- cell.Value = ""
- row.Cells[i] = cell
- }
- return row
- }
- // getValueFromCellData attempts to extract a valid value, usable in CSV form from the raw cell value.
- // Note - this is not actually general enough - we should support retaining tabs and newlines.
- func getValueFromCellData(rawcell xlsxC, reftable []string) string {
- var value string = ""
- var data string = rawcell.V
- if len(data) > 0 {
- vval := strings.Trim(data, " \t\n\r")
- switch rawcell.T {
- case "s": // Shared String
- ref, error := strconv.Atoi(vval)
- if error != nil {
- panic(error)
- }
- value = reftable[ref]
- default:
- value = vval
- }
- }
- return value
- }
- // readRowsFromSheet is an internal helper function that extracts the
- // rows from a XSLXWorksheet, poulates them with Cells and resolves
- // the value references from the reference table and stores them in
- func readRowsFromSheet(Worksheet *xlsxWorksheet, file *File) ([]*Row, int, int) {
- var rows []*Row
- var row *Row
- var minCol, maxCol, minRow, maxRow, colCount, rowCount int
- var reftable []string
- var err error
- var insertRowIndex, insertColIndex int
- if len(Worksheet.SheetData.Row) == 0 {
- return nil, 0, 0
- }
- reftable = file.referenceTable
- if len(Worksheet.Dimension.Ref) > 0 {
- minCol, minRow, maxCol, maxRow, err = getMaxMinFromDimensionRef(Worksheet.Dimension.Ref)
- } else {
- minCol, minRow, maxCol, maxRow, err = calculateMaxMinFromWorksheet(Worksheet)
- }
- if err != nil {
- panic(err.Error())
- }
- rowCount = (maxRow - minRow) + 1
- colCount = (maxCol - minCol) + 1
- rows = make([]*Row, rowCount)
- insertRowIndex = minRow
- for rowIndex := 0; rowIndex < len(Worksheet.SheetData.Row); rowIndex++ {
- rawrow := Worksheet.SheetData.Row[rowIndex]
- // Some spreadsheets will omit blank rows from the
- // stored data
- for rawrow.R > (insertRowIndex + 1) {
- // Put an empty Row into the array
- rows[insertRowIndex-minRow] = new(Row)
- insertRowIndex++
- }
- // range is not empty and only one range exist
- if len(rawrow.Spans) != 0 && strings.Count(rawrow.Spans, ":") == 1 {
- row = makeRowFromSpan(rawrow.Spans)
- } else {
- row = makeRowFromRaw(rawrow)
- }
- insertColIndex = minCol
- for _, rawcell := range rawrow.C {
- x, _, _ := getCoordsFromCellIDString(rawcell.R)
- // Some spreadsheets will omit blank cells
- // from the data.
- for x > insertColIndex {
- // Put an empty Cell into the array
- row.Cells[insertColIndex-minCol] = new(Cell)
- insertColIndex++
- }
- cellX := insertColIndex - minCol
- row.Cells[cellX].Value = getValueFromCellData(rawcell, reftable)
- row.Cells[cellX].styleIndex = rawcell.S
- row.Cells[cellX].styles = file.styles
- row.Cells[cellX].numFmtRefTable = file.numFmtRefTable
- row.Cells[cellX].date1904 = file.Date1904
- insertColIndex++
- }
- rows[insertRowIndex-minRow] = row
- insertRowIndex++
- }
- return rows, colCount, rowCount
- }
- type indexedSheet struct {
- Index int
- Sheet *Sheet
- Error error
- }
- // readSheetFromFile is the logic of converting a xlsxSheet struct
- // into a Sheet struct. This work can be done in parallel and so
- // readSheetsFromZipFile will spawn an instance of this function per
- // sheet and get the results back on the provided channel.
- func readSheetFromFile(sc chan *indexedSheet, index int, rsheet xlsxSheet, fi *File, sheetXMLMap map[string]string) {
- result := &indexedSheet{Index: index, Sheet: nil, Error: nil}
- worksheet, error := getWorksheetFromSheet(rsheet, fi.worksheets, sheetXMLMap)
- if error != nil {
- result.Error = error
- sc <- result
- return
- }
- sheet := new(Sheet)
- sheet.Rows, sheet.MaxCol, sheet.MaxRow = readRowsFromSheet(worksheet, fi)
- result.Sheet = sheet
- sc <- result
- }
- // readSheetsFromZipFile is an internal helper function that loops
- // over the Worksheets defined in the XSLXWorkbook and loads them into
- // Sheet objects stored in the Sheets slice of a xlsx.File struct.
- func readSheetsFromZipFile(f *zip.File, file *File, sheetXMLMap map[string]string) ([]*Sheet, error) {
- var workbook *xlsxWorkbook
- var error error
- var rc io.ReadCloser
- var decoder *xml.Decoder
- var sheetCount int
- workbook = new(xlsxWorkbook)
- rc, error = f.Open()
- if error != nil {
- return nil, error
- }
- decoder = xml.NewDecoder(rc)
- error = decoder.Decode(workbook)
- if error != nil {
- return nil, error
- }
- file.Date1904 = workbook.WorkbookPr.Date1904
- sheetCount = len(workbook.Sheets.Sheet)
- sheets := make([]*Sheet, sheetCount)
- sheetChan := make(chan *indexedSheet, sheetCount)
- for i, rawsheet := range workbook.Sheets.Sheet {
- go readSheetFromFile(sheetChan, i, rawsheet, file, sheetXMLMap)
- }
- for j := 0; j < sheetCount; j++ {
- sheet := <-sheetChan
- if sheet.Error != nil {
- return nil, sheet.Error
- }
- sheet.Sheet.Name = workbook.Sheets.Sheet[sheet.Index].Name
- sheets[sheet.Index] = sheet.Sheet
- }
- return sheets, nil
- }
- // readSharedStringsFromZipFile() is an internal helper function to
- // extract a reference table from the sharedStrings.xml file within
- // the XLSX zip file.
- func readSharedStringsFromZipFile(f *zip.File) ([]string, error) {
- var sst *xlsxSST
- var error error
- var rc io.ReadCloser
- var decoder *xml.Decoder
- var reftable []string
- rc, error = f.Open()
- if error != nil {
- return nil, error
- }
- sst = new(xlsxSST)
- decoder = xml.NewDecoder(rc)
- error = decoder.Decode(sst)
- if error != nil {
- return nil, error
- }
- reftable = MakeSharedStringRefTable(sst)
- return reftable, nil
- }
- // readStylesFromZipFile() is an internal helper function to
- // extract a style table from the style.xml file within
- // the XLSX zip file.
- func readStylesFromZipFile(f *zip.File) (*xlsxStyles, error) {
- var style *xlsxStyles
- var error error
- var rc io.ReadCloser
- var decoder *xml.Decoder
- rc, error = f.Open()
- if error != nil {
- return nil, error
- }
- style = new(xlsxStyles)
- decoder = xml.NewDecoder(rc)
- error = decoder.Decode(style)
- if error != nil {
- return nil, error
- }
- return style, nil
- }
- func buildNumFmtRefTable(style *xlsxStyles) map[int]xlsxNumFmt {
- refTable := make(map[int]xlsxNumFmt)
- for _, numFmt := range style.NumFmts {
- refTable[numFmt.NumFmtId] = numFmt
- }
- return refTable
- }
- // readWorkbookRelationsFromZipFile is an internal helper function to
- // extract a map of relationship ID strings to the name of the
- // worksheet.xml file they refer to. The resulting map can be used to
- // reliably derefence the worksheets in the XLSX file.
- func readWorkbookRelationsFromZipFile(workbookRels *zip.File) (map[string]string, error) {
- var sheetXMLMap map[string]string
- var wbRelationships *xlsxWorkbookRels
- var rc io.ReadCloser
- var decoder *xml.Decoder
- var err error
- rc, err = workbookRels.Open()
- if err != nil {
- return nil, err
- }
- decoder = xml.NewDecoder(rc)
- wbRelationships = new(xlsxWorkbookRels)
- err = decoder.Decode(wbRelationships)
- if err != nil {
- return nil, err
- }
- sheetXMLMap = make(map[string]string)
- for _, rel := range wbRelationships.Relationships {
- if strings.HasSuffix(rel.Target, ".xml") && strings.HasPrefix(rel.Target, "worksheets/") {
- sheetXMLMap[rel.Id] = strings.Replace(rel.Target[len("worksheets/"):], ".xml", "", 1)
- }
- }
- return sheetXMLMap, nil
- }
- // OpenFile() take the name of an XLSX file and returns a populated
- // xlsx.File struct for it.
- func OpenFile(filename string) (*File, error) {
- var f *zip.ReadCloser
- f, err := zip.OpenReader(filename)
- if err != nil {
- return nil, err
- }
- return ReadZip(f)
- }
- // ReadZip() takes a pointer to a zip.ReadCloser and returns a
- // xlsx.File struct populated with its contents. In most cases
- // ReadZip is not used directly, but is called internally by OpenFile.
- func ReadZip(f *zip.ReadCloser) (*File, error) {
- defer f.Close()
- return ReadZipReader(&f.Reader)
- }
- // ReadZipReader() can be used to read xlsx in memory without touch filesystem.
- func ReadZipReader(r *zip.Reader) (*File, error) {
- var err error
- var file *File
- var reftable []string
- var sharedStrings *zip.File
- var sheetMap map[string]*Sheet
- var sheetXMLMap map[string]string
- var sheets []*Sheet
- var style *xlsxStyles
- var styles *zip.File
- var v *zip.File
- var workbook *zip.File
- var workbookRels *zip.File
- var worksheets map[string]*zip.File
- file = new(File)
- worksheets = make(map[string]*zip.File, len(r.File))
- for _, v = range r.File {
- switch v.Name {
- case "xl/sharedStrings.xml":
- sharedStrings = v
- case "xl/workbook.xml":
- workbook = v
- case "xl/_rels/workbook.xml.rels":
- workbookRels = v
- case "xl/styles.xml":
- styles = v
- default:
- if len(v.Name) > 14 {
- if v.Name[0:13] == "xl/worksheets" {
- worksheets[v.Name[14:len(v.Name)-4]] = v
- }
- }
- }
- }
- sheetXMLMap, err = readWorkbookRelationsFromZipFile(workbookRels)
- if err != nil {
- return nil, err
- }
- file.worksheets = worksheets
- reftable, err = readSharedStringsFromZipFile(sharedStrings)
- if err != nil {
- return nil, err
- }
- if reftable == nil {
- readerErr := new(XLSXReaderError)
- readerErr.Err = "No valid sharedStrings.xml found in XLSX file"
- return nil, readerErr
- }
- file.referenceTable = reftable
- style, err = readStylesFromZipFile(styles)
- if err != nil {
- return nil, err
- }
- file.styles = style
- file.numFmtRefTable = buildNumFmtRefTable(style)
- sheets, err = readSheetsFromZipFile(workbook, file, sheetXMLMap)
- if err != nil {
- return nil, err
- }
- if sheets == nil {
- readerErr := new(XLSXReaderError)
- readerErr.Err = "No sheets found in XLSX File"
- return nil, readerErr
- }
- file.Sheets = sheets
- sheetMap = make(map[string]*Sheet, len(sheets))
- for i := 0; i < len(sheets); i++ {
- sheetMap[sheets[i].Name] = sheets[i]
- }
- file.Sheet = sheetMap
- return file, nil
- }
- func NewFile() *File {
- return &File{}
- }
|