123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414 |
- package xlsx
- import (
- "archive/zip"
- "bytes"
- "encoding/xml"
- "errors"
- "fmt"
- "io"
- "os"
- "strconv"
- "strings"
- "unicode/utf8"
- )
- // File is a high level structure providing a slice of Sheet structs
- // to the user.
- type File struct {
- worksheets map[string]*zip.File
- referenceTable *RefTable
- Date1904 bool
- styles *xlsxStyleSheet
- Sheets []*Sheet
- Sheet map[string]*Sheet
- theme *theme
- DefinedNames []*xlsxDefinedName
- }
- const NoRowLimit int = -1
- // Create a new File
- func NewFile() *File {
- return &File{
- Sheet: make(map[string]*Sheet),
- Sheets: make([]*Sheet, 0),
- DefinedNames: make([]*xlsxDefinedName, 0),
- }
- }
- // OpenFile() take the name of an XLSX file and returns a populated
- // xlsx.File struct for it.
- func OpenFile(fileName string) (file *File, err error) {
- return OpenFileWithRowLimit(fileName, NoRowLimit)
- }
- // OpenFileWithRowLimit() will open the file, but will only read the specified number of rows.
- // If you save this file, it will be truncated to the number of rows specified.
- func OpenFileWithRowLimit(fileName string, rowLimit int) (file *File, err error) {
- var z *zip.ReadCloser
- z, err = zip.OpenReader(fileName)
- if err != nil {
- return nil, err
- }
- return ReadZipWithRowLimit(z, rowLimit)
- }
- // OpenBinary() take bytes of an XLSX file and returns a populated
- // xlsx.File struct for it.
- func OpenBinary(bs []byte) (*File, error) {
- return OpenBinaryWithRowLimit(bs, NoRowLimit)
- }
- // OpenBinaryWithRowLimit() take bytes of an XLSX file and returns a populated
- // xlsx.File struct for it.
- func OpenBinaryWithRowLimit(bs []byte, rowLimit int) (*File, error) {
- r := bytes.NewReader(bs)
- return OpenReaderAtWithRowLimit(r, int64(r.Len()), rowLimit)
- }
- // OpenReaderAt() take io.ReaderAt of an XLSX file and returns a populated
- // xlsx.File struct for it.
- func OpenReaderAt(r io.ReaderAt, size int64) (*File, error) {
- return OpenReaderAtWithRowLimit(r, size, NoRowLimit)
- }
- // OpenReaderAtWithRowLimit() take io.ReaderAt of an XLSX file and returns a populated
- // xlsx.File struct for it.
- func OpenReaderAtWithRowLimit(r io.ReaderAt, size int64, rowLimit int) (*File, error) {
- file, err := zip.NewReader(r, size)
- if err != nil {
- return nil, err
- }
- return ReadZipReaderWithRowLimit(file, rowLimit)
- }
- // A convenient wrapper around File.ToSlice, FileToSlice will
- // return the raw data contained in an Excel XLSX file as three
- // dimensional slice. The first index represents the sheet number,
- // the second the row number, and the third the cell number.
- //
- // For example:
- //
- // var mySlice [][][]string
- // var value string
- // mySlice = xlsx.FileToSlice("myXLSX.xlsx")
- // value = mySlice[0][0][0]
- //
- // Here, value would be set to the raw value of the cell A1 in the
- // first sheet in the XLSX file.
- func FileToSlice(path string) ([][][]string, error) {
- f, err := OpenFile(path)
- if err != nil {
- return nil, err
- }
- return f.ToSlice()
- }
- // FileToSliceUnmerged is a wrapper around File.ToSliceUnmerged.
- // It returns the raw data contained in an Excel XLSX file as three
- // dimensional slice. Merged cells will be unmerged. Covered cells become the
- // values of theirs origins.
- func FileToSliceUnmerged(path string) ([][][]string, error) {
- f, err := OpenFile(path)
- if err != nil {
- return nil, err
- }
- return f.ToSliceUnmerged()
- }
- // Save the File to an xlsx file at the provided path.
- func (f *File) Save(path string) (err error) {
- target, err := os.Create(path)
- if err != nil {
- return err
- }
- err = f.Write(target)
- if err != nil {
- return err
- }
- return target.Close()
- }
- // Write the File to io.Writer as xlsx
- func (f *File) Write(writer io.Writer) (err error) {
- parts, err := f.MarshallParts()
- if err != nil {
- return
- }
- zipWriter := zip.NewWriter(writer)
- for partName, part := range parts {
- w, err := zipWriter.Create(partName)
- if err != nil {
- return err
- }
- _, err = w.Write([]byte(part))
- if err != nil {
- return err
- }
- }
- return zipWriter.Close()
- }
- // AddSheet Add a new Sheet, with the provided name, to a File.
- // The minimum sheet name length is 1 character. If the sheet name length is less an error is thrown.
- // The maximum sheet name length is 31 characters. If the sheet name length is exceeded an error is thrown.
- // These special characters are also not allowed: : \ / ? * [ ]
- func (f *File) AddSheet(sheetName string) (*Sheet, error) {
- if _, exists := f.Sheet[sheetName]; exists {
- return nil, fmt.Errorf("duplicate sheet name '%s'.", sheetName)
- }
- runeLength := utf8.RuneCountInString(sheetName)
- if runeLength > 31 || runeLength == 0 {
- return nil, fmt.Errorf("sheet name must be 31 or fewer characters long. It is currently '%d' characters long", runeLength)
- }
- // Iterate over the runes
- for _, r := range sheetName {
- // Excel forbids : \ / ? * [ ]
- if r == ':' || r == '\\' || r == '/' || r == '?' || r == '*' || r == '[' || r == ']' {
- return nil, fmt.Errorf("sheet name must not contain any restricted characters : \\ / ? * [ ] but contains '%s'", string(r))
- }
- }
- sheet := &Sheet{
- Name: sheetName,
- File: f,
- Selected: len(f.Sheets) == 0,
- }
- f.Sheet[sheetName] = sheet
- f.Sheets = append(f.Sheets, sheet)
- return sheet, nil
- }
- // Appends an existing Sheet, with the provided name, to a File
- func (f *File) AppendSheet(sheet Sheet, sheetName string) (*Sheet, error) {
- if _, exists := f.Sheet[sheetName]; exists {
- return nil, fmt.Errorf("duplicate sheet name '%s'.", sheetName)
- }
- sheet.Name = sheetName
- sheet.File = f
- sheet.Selected = len(f.Sheets) == 0
- f.Sheet[sheetName] = &sheet
- f.Sheets = append(f.Sheets, &sheet)
- return &sheet, nil
- }
- func (f *File) makeWorkbook() xlsxWorkbook {
- return xlsxWorkbook{
- FileVersion: xlsxFileVersion{AppName: "Go XLSX"},
- WorkbookPr: xlsxWorkbookPr{ShowObjects: "all"},
- BookViews: xlsxBookViews{
- WorkBookView: []xlsxWorkBookView{
- {
- ShowHorizontalScroll: true,
- ShowSheetTabs: true,
- ShowVerticalScroll: true,
- TabRatio: 204,
- WindowHeight: 8192,
- WindowWidth: 16384,
- XWindow: "0",
- YWindow: "0",
- },
- },
- },
- Sheets: xlsxSheets{Sheet: make([]xlsxSheet, len(f.Sheets))},
- CalcPr: xlsxCalcPr{
- IterateCount: 100,
- RefMode: "A1",
- Iterate: false,
- IterateDelta: 0.001,
- },
- }
- }
- // Some tools that read XLSX files have very strict requirements about
- // the structure of the input XML. In particular both Numbers on the Mac
- // and SAS dislike inline XML namespace declarations, or namespace
- // prefixes that don't match the ones that Excel itself uses. This is a
- // problem because the Go XML library doesn't multiple namespace
- // declarations in a single element of a document. This function is a
- // horrible hack to fix that after the XML marshalling is completed.
- func replaceRelationshipsNameSpace(workbookMarshal string) string {
- newWorkbook := strings.Replace(workbookMarshal, `xmlns:relationships="http://schemas.openxmlformats.org/officeDocument/2006/relationships" relationships:id`, `r:id`, -1)
- // Dirty hack to fix issues #63 and #91; encoding/xml currently
- // "doesn't allow for additional namespaces to be defined in the
- // root element of the document," as described by @tealeg in the
- // comments for #63.
- oldXmlns := `<workbook xmlns="http://schemas.openxmlformats.org/spreadsheetml/2006/main">`
- newXmlns := `<workbook xmlns="http://schemas.openxmlformats.org/spreadsheetml/2006/main" xmlns:r="http://schemas.openxmlformats.org/officeDocument/2006/relationships">`
- return strings.Replace(newWorkbook, oldXmlns, newXmlns, 1)
- }
- // Construct a map of file name to XML content representing the file
- // in terms of the structure of an XLSX file.
- func (f *File) MarshallParts() (map[string]string, error) {
- var parts map[string]string
- var refTable *RefTable = NewSharedStringRefTable()
- refTable.isWrite = true
- var workbookRels WorkBookRels = make(WorkBookRels)
- var err error
- var workbook xlsxWorkbook
- var types xlsxTypes = MakeDefaultContentTypes()
- marshal := func(thing interface{}) (string, error) {
- body, err := xml.Marshal(thing)
- if err != nil {
- return "", err
- }
- return xml.Header + string(body), nil
- }
- parts = make(map[string]string)
- workbook = f.makeWorkbook()
- sheetIndex := 1
- if f.styles == nil {
- f.styles = newXlsxStyleSheet(f.theme)
- }
- f.styles.reset()
- if len(f.Sheets) == 0 {
- err := errors.New("Workbook must contains atleast one worksheet")
- return nil, err
- }
- for _, sheet := range f.Sheets {
- xSheet := sheet.makeXLSXSheet(refTable, f.styles)
- rId := fmt.Sprintf("rId%d", sheetIndex)
- sheetId := strconv.Itoa(sheetIndex)
- sheetPath := fmt.Sprintf("worksheets/sheet%d.xml", sheetIndex)
- partName := "xl/" + sheetPath
- types.Overrides = append(
- types.Overrides,
- xlsxOverride{
- PartName: "/" + partName,
- ContentType: "application/vnd.openxmlformats-officedocument.spreadsheetml.worksheet+xml"})
- workbookRels[rId] = sheetPath
- workbook.Sheets.Sheet[sheetIndex-1] = xlsxSheet{
- Name: sheet.Name,
- SheetId: sheetId,
- Id: rId,
- State: "visible"}
- parts[partName], err = marshal(xSheet)
- if err != nil {
- return parts, err
- }
- sheetIndex++
- }
- workbookMarshal, err := marshal(workbook)
- if err != nil {
- return parts, err
- }
- workbookMarshal = replaceRelationshipsNameSpace(workbookMarshal)
- parts["xl/workbook.xml"] = workbookMarshal
- if err != nil {
- return parts, err
- }
- parts["_rels/.rels"] = TEMPLATE__RELS_DOT_RELS
- parts["docProps/app.xml"] = TEMPLATE_DOCPROPS_APP
- // TODO - do this properly, modification and revision information
- parts["docProps/core.xml"] = TEMPLATE_DOCPROPS_CORE
- parts["xl/theme/theme1.xml"] = TEMPLATE_XL_THEME_THEME
- xSST := refTable.makeXLSXSST()
- parts["xl/sharedStrings.xml"], err = marshal(xSST)
- if err != nil {
- return parts, err
- }
- xWRel := workbookRels.MakeXLSXWorkbookRels()
- parts["xl/_rels/workbook.xml.rels"], err = marshal(xWRel)
- if err != nil {
- return parts, err
- }
- parts["[Content_Types].xml"], err = marshal(types)
- if err != nil {
- return parts, err
- }
- parts["xl/styles.xml"], err = f.styles.Marshal()
- if err != nil {
- return parts, err
- }
- return parts, nil
- }
- // Return the raw data contained in the File as three
- // dimensional slice. The first index represents the sheet number,
- // the second the row number, and the third the cell number.
- //
- // For example:
- //
- // var mySlice [][][]string
- // var value string
- // mySlice = xlsx.FileToSlice("myXLSX.xlsx")
- // value = mySlice[0][0][0]
- //
- // Here, value would be set to the raw value of the cell A1 in the
- // first sheet in the XLSX file.
- func (f *File) ToSlice() (output [][][]string, err error) {
- output = [][][]string{}
- for _, sheet := range f.Sheets {
- s := [][]string{}
- for _, row := range sheet.Rows {
- if row == nil {
- continue
- }
- r := []string{}
- for _, cell := range row.Cells {
- str, err := cell.FormattedValue()
- if err != nil {
- // Recover from strconv.NumError if the value is an empty string,
- // and insert an empty string in the output.
- if numErr, ok := err.(*strconv.NumError); ok && numErr.Num == "" {
- str = ""
- } else {
- return output, err
- }
- }
- r = append(r, str)
- }
- s = append(s, r)
- }
- output = append(output, s)
- }
- return output, nil
- }
- // ToSliceUnmerged returns the raw data contained in the File as three
- // dimensional slice (s. method ToSlice).
- // A covered cell become the value of its origin cell.
- // Example: table where A1:A2 merged.
- // | 01.01.2011 | Bread | 20 |
- // | | Fish | 70 |
- // This sheet will be converted to the slice:
- // [ [01.01.2011 Bread 20]
- // [01.01.2011 Fish 70] ]
- func (f *File) ToSliceUnmerged() (output [][][]string, err error) {
- output, err = f.ToSlice()
- if err != nil {
- return nil, err
- }
- for s, sheet := range f.Sheets {
- for r, row := range sheet.Rows {
- for c, cell := range row.Cells {
- if cell.HMerge > 0 {
- for i := c + 1; i <= c+cell.HMerge; i++ {
- output[s][r][i] = output[s][r][c]
- }
- }
- if cell.VMerge > 0 {
- for i := r + 1; i <= r+cell.VMerge; i++ {
- output[s][i][c] = output[s][r][c]
- }
- }
- }
- }
- }
- return output, nil
- }
|