123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577 |
- // Copyright 2016 - 2021 The excelize Authors. All rights reserved. Use of
- // this source code is governed by a BSD-style license that can be found in
- // the LICENSE file.
- //
- // Package excelize providing a set of functions that allow you to write to
- // and read from XLSX / XLSM / XLTM files. Supports reading and writing
- // spreadsheet documents generated by Microsoft Excel™ 2007 and later. Supports
- // complex components by high compatibility, and provided streaming API for
- // generating or reading data from a worksheet with huge amounts of data. This
- // library needs Go version 1.15 or later.
- package excelize
- import (
- "bytes"
- "encoding/xml"
- "fmt"
- "io"
- "io/ioutil"
- "os"
- "reflect"
- "strconv"
- "strings"
- "time"
- )
- // StreamWriter defined the type of stream writer.
- type StreamWriter struct {
- File *File
- Sheet string
- SheetID int
- sheetWritten bool
- cols string
- worksheet *xlsxWorksheet
- rawData bufferedWriter
- mergeCellsCount int
- mergeCells string
- tableParts string
- }
- // NewStreamWriter return stream writer struct by given worksheet name for
- // generate new worksheet with large amounts of data. Note that after set
- // rows, you must call the 'Flush' method to end the streaming writing
- // process and ensure that the order of line numbers is ascending, the common
- // API and stream API can't be work mixed to writing data on the worksheets,
- // you can't get cell value when in-memory chunks data over 16MB. For
- // example, set data for worksheet of size 102400 rows x 50 columns with
- // numbers and style:
- //
- // file := excelize.NewFile()
- // streamWriter, err := file.NewStreamWriter("Sheet1")
- // if err != nil {
- // fmt.Println(err)
- // }
- // styleID, err := file.NewStyle(`{"font":{"color":"#777777"}}`)
- // if err != nil {
- // fmt.Println(err)
- // }
- // if err := streamWriter.SetRow("A1", []interface{}{excelize.Cell{StyleID: styleID, Value: "Data"}}); err != nil {
- // fmt.Println(err)
- // }
- // for rowID := 2; rowID <= 102400; rowID++ {
- // row := make([]interface{}, 50)
- // for colID := 0; colID < 50; colID++ {
- // row[colID] = rand.Intn(640000)
- // }
- // cell, _ := excelize.CoordinatesToCellName(1, rowID)
- // if err := streamWriter.SetRow(cell, row); err != nil {
- // fmt.Println(err)
- // }
- // }
- // if err := streamWriter.Flush(); err != nil {
- // fmt.Println(err)
- // }
- // if err := file.SaveAs("Book1.xlsx"); err != nil {
- // fmt.Println(err)
- // }
- //
- // Set cell value and cell formula for a worksheet with stream writer:
- //
- // err := streamWriter.SetRow("A1", []interface{}{
- // excelize.Cell{Value: 1},
- // excelize.Cell{Value: 2},
- // excelize.Cell{Formula: "SUM(A1,B1)"}});
- //
- func (f *File) NewStreamWriter(sheet string) (*StreamWriter, error) {
- sheetID := f.getSheetID(sheet)
- if sheetID == -1 {
- return nil, fmt.Errorf("sheet %s is not exist", sheet)
- }
- sw := &StreamWriter{
- File: f,
- Sheet: sheet,
- SheetID: sheetID,
- }
- var err error
- sw.worksheet, err = f.workSheetReader(sheet)
- if err != nil {
- return nil, err
- }
- sheetPath := f.sheetMap[trimSheetName(sheet)]
- if f.streams == nil {
- f.streams = make(map[string]*StreamWriter)
- }
- f.streams[sheetPath] = sw
- _, _ = sw.rawData.WriteString(XMLHeader + `<worksheet` + templateNamespaceIDMap)
- bulkAppendFields(&sw.rawData, sw.worksheet, 2, 5)
- return sw, err
- }
- // AddTable creates an Excel table for the StreamWriter using the given
- // coordinate area and format set. For example, create a table of A1:D5:
- //
- // err := sw.AddTable("A1", "D5", "")
- //
- // Create a table of F2:H6 with format set:
- //
- // err := sw.AddTable("F2", "H6", `{
- // "table_name": "table",
- // "table_style": "TableStyleMedium2",
- // "show_first_column": true,
- // "show_last_column": true,
- // "show_row_stripes": false,
- // "show_column_stripes": true
- // }`)
- //
- // Note that the table must be at least two lines including the header. The
- // header cells must contain strings and must be unique.
- //
- // Currently only one table is allowed for a StreamWriter. AddTable must be
- // called after the rows are written but before Flush.
- //
- // See File.AddTable for details on the table format.
- func (sw *StreamWriter) AddTable(hcell, vcell, format string) error {
- formatSet, err := parseFormatTableSet(format)
- if err != nil {
- return err
- }
- coordinates, err := areaRangeToCoordinates(hcell, vcell)
- if err != nil {
- return err
- }
- _ = sortCoordinates(coordinates)
- // Correct the minimum number of rows, the table at least two lines.
- if coordinates[1] == coordinates[3] {
- coordinates[3]++
- }
- // Correct table reference coordinate area, such correct C1:B3 to B1:C3.
- ref, err := sw.File.coordinatesToAreaRef(coordinates)
- if err != nil {
- return err
- }
- // create table columns using the first row
- tableHeaders, err := sw.getRowValues(coordinates[1], coordinates[0], coordinates[2])
- if err != nil {
- return err
- }
- tableColumn := make([]*xlsxTableColumn, len(tableHeaders))
- for i, name := range tableHeaders {
- tableColumn[i] = &xlsxTableColumn{
- ID: i + 1,
- Name: name,
- }
- }
- tableID := sw.File.countTables() + 1
- name := formatSet.TableName
- if name == "" {
- name = "Table" + strconv.Itoa(tableID)
- }
- table := xlsxTable{
- XMLNS: NameSpaceSpreadSheet.Value,
- ID: tableID,
- Name: name,
- DisplayName: name,
- Ref: ref,
- AutoFilter: &xlsxAutoFilter{
- Ref: ref,
- },
- TableColumns: &xlsxTableColumns{
- Count: len(tableColumn),
- TableColumn: tableColumn,
- },
- TableStyleInfo: &xlsxTableStyleInfo{
- Name: formatSet.TableStyle,
- ShowFirstColumn: formatSet.ShowFirstColumn,
- ShowLastColumn: formatSet.ShowLastColumn,
- ShowRowStripes: formatSet.ShowRowStripes,
- ShowColumnStripes: formatSet.ShowColumnStripes,
- },
- }
- sheetRelationshipsTableXML := "../tables/table" + strconv.Itoa(tableID) + ".xml"
- tableXML := strings.Replace(sheetRelationshipsTableXML, "..", "xl", -1)
- // Add first table for given sheet.
- sheetPath := sw.File.sheetMap[trimSheetName(sw.Sheet)]
- sheetRels := "xl/worksheets/_rels/" + strings.TrimPrefix(sheetPath, "xl/worksheets/") + ".rels"
- rID := sw.File.addRels(sheetRels, SourceRelationshipTable, sheetRelationshipsTableXML, "")
- sw.tableParts = fmt.Sprintf(`<tableParts count="1"><tablePart r:id="rId%d"></tablePart></tableParts>`, rID)
- sw.File.addContentTypePart(tableID, "table")
- b, _ := xml.Marshal(table)
- sw.File.saveFileList(tableXML, b)
- return nil
- }
- // Extract values from a row in the StreamWriter.
- func (sw *StreamWriter) getRowValues(hrow, hcol, vcol int) (res []string, err error) {
- res = make([]string, vcol-hcol+1)
- r, err := sw.rawData.Reader()
- if err != nil {
- return nil, err
- }
- dec := sw.File.xmlNewDecoder(r)
- for {
- token, err := dec.Token()
- if err == io.EOF {
- return res, nil
- }
- if err != nil {
- return nil, err
- }
- startElement, ok := getRowElement(token, hrow)
- if !ok {
- continue
- }
- // decode cells
- var row xlsxRow
- if err := dec.DecodeElement(&row, &startElement); err != nil {
- return nil, err
- }
- for _, c := range row.C {
- col, _, err := CellNameToCoordinates(c.R)
- if err != nil {
- return nil, err
- }
- if col < hcol || col > vcol {
- continue
- }
- res[col-hcol] = c.V
- }
- return res, nil
- }
- }
// getRowElement reports whether token is the start tag of a "row" element
// whose "r" attribute equals hrow.
//
// The returned startElement is the token converted to an xml.StartElement
// (the zero value when token is not a start element). ok is true only when
// the element is named "row" and carries an "r" attribute that parses as an
// integer equal to hrow. An "r" attribute that is not a valid integer never
// matches, not even for hrow == 0.
func getRowElement(token xml.Token, hrow int) (startElement xml.StartElement, ok bool) {
	startElement, isStart := token.(xml.StartElement)
	if !isStart || startElement.Name.Local != "row" {
		return startElement, false
	}
	for _, attr := range startElement.Attr {
		if attr.Name.Local != "r" {
			continue
		}
		// Ignore unparsable values instead of treating them as row 0.
		if row, err := strconv.Atoi(attr.Value); err == nil && row == hrow {
			return startElement, true
		}
	}
	return startElement, false
}
// Cell can be passed as an element of the values given to
// StreamWriter.SetRow, either by value or as a non-nil pointer, to set a
// style and a formula together with the cell value.
type Cell struct {
	// StyleID is the style index applied to the cell.
	StyleID int
	// Formula is the cell formula; an empty string means no formula.
	Formula string
	// Value is the cell value, handled like any plain value passed to SetRow.
	Value interface{}
}
- // SetRow writes an array to stream rows by giving a worksheet name, starting
- // coordinate and a pointer to an array of values. Note that you must call the
- // 'Flush' method to end the streaming writing process.
- //
- // As a special case, if Cell is used as a value, then the Cell.StyleID will be
- // applied to that cell.
- func (sw *StreamWriter) SetRow(axis string, values []interface{}) error {
- col, row, err := CellNameToCoordinates(axis)
- if err != nil {
- return err
- }
- if !sw.sheetWritten {
- if len(sw.cols) > 0 {
- sw.rawData.WriteString("<cols>" + sw.cols + "</cols>")
- }
- _, _ = sw.rawData.WriteString(`<sheetData>`)
- sw.sheetWritten = true
- }
- fmt.Fprintf(&sw.rawData, `<row r="%d">`, row)
- for i, val := range values {
- axis, err := CoordinatesToCellName(col+i, row)
- if err != nil {
- return err
- }
- c := xlsxC{R: axis}
- if v, ok := val.(Cell); ok {
- c.S = v.StyleID
- val = v.Value
- setCellFormula(&c, v.Formula)
- } else if v, ok := val.(*Cell); ok && v != nil {
- c.S = v.StyleID
- val = v.Value
- setCellFormula(&c, v.Formula)
- }
- if err = setCellValFunc(&c, val); err != nil {
- _, _ = sw.rawData.WriteString(`</row>`)
- return err
- }
- writeCell(&sw.rawData, c)
- }
- _, _ = sw.rawData.WriteString(`</row>`)
- return sw.rawData.Sync()
- }
- // SetColWidth provides a function to set the width of a single column or
- // multiple columns for the the StreamWriter. Note that you must call
- // the 'SetColWidth' function before the 'SetRow' function. For example set
- // the width column B:C as 20:
- //
- // err := streamWriter.SetColWidth(2, 3, 20)
- //
- func (sw *StreamWriter) SetColWidth(min, max int, width float64) error {
- if sw.sheetWritten {
- return ErrStreamSetColWidth
- }
- if min > TotalColumns || max > TotalColumns {
- return ErrColumnNumber
- }
- if min < 1 || max < 1 {
- return ErrColumnNumber
- }
- if width > MaxColumnWidth {
- return ErrColumnWidth
- }
- if min > max {
- min, max = max, min
- }
- sw.cols += fmt.Sprintf(`<col min="%d" max="%d" width="%f" customWidth="1"/>`, min, max, width)
- return nil
- }
- // MergeCell provides a function to merge cells by a given coordinate area for
- // the StreamWriter. Don't create a merged cell that overlaps with another
- // existing merged cell.
- func (sw *StreamWriter) MergeCell(hcell, vcell string) error {
- _, err := areaRangeToCoordinates(hcell, vcell)
- if err != nil {
- return err
- }
- sw.mergeCellsCount++
- sw.mergeCells += fmt.Sprintf(`<mergeCell ref="%s:%s"/>`, hcell, vcell)
- return nil
- }
- // setCellFormula provides a function to set formula of a cell.
- func setCellFormula(c *xlsxC, formula string) {
- if formula != "" {
- c.F = &xlsxF{Content: formula}
- }
- }
- // setCellValFunc provides a function to set value of a cell.
- func setCellValFunc(c *xlsxC, val interface{}) (err error) {
- switch val := val.(type) {
- case int, int8, int16, int32, int64, uint, uint8, uint16, uint32, uint64:
- err = setCellIntFunc(c, val)
- case float32:
- c.T, c.V = setCellFloat(float64(val), -1, 32)
- case float64:
- c.T, c.V = setCellFloat(val, -1, 64)
- case string:
- c.T, c.V, c.XMLSpace = setCellStr(val)
- case []byte:
- c.T, c.V, c.XMLSpace = setCellStr(string(val))
- case time.Duration:
- c.T, c.V = setCellDuration(val)
- case time.Time:
- c.T, c.V, _, err = setCellTime(val)
- case bool:
- c.T, c.V = setCellBool(val)
- case nil:
- c.T, c.V, c.XMLSpace = setCellStr("")
- default:
- c.T, c.V, c.XMLSpace = setCellStr(fmt.Sprint(val))
- }
- return err
- }
- // setCellIntFunc is a wrapper of SetCellInt.
- func setCellIntFunc(c *xlsxC, val interface{}) (err error) {
- switch val := val.(type) {
- case int:
- c.T, c.V = setCellInt(val)
- case int8:
- c.T, c.V = setCellInt(int(val))
- case int16:
- c.T, c.V = setCellInt(int(val))
- case int32:
- c.T, c.V = setCellInt(int(val))
- case int64:
- c.T, c.V = setCellInt(int(val))
- case uint:
- c.T, c.V = setCellInt(int(val))
- case uint8:
- c.T, c.V = setCellInt(int(val))
- case uint16:
- c.T, c.V = setCellInt(int(val))
- case uint32:
- c.T, c.V = setCellInt(int(val))
- case uint64:
- c.T, c.V = setCellInt(int(val))
- default:
- }
- return
- }
- func writeCell(buf *bufferedWriter, c xlsxC) {
- _, _ = buf.WriteString(`<c`)
- if c.XMLSpace.Value != "" {
- fmt.Fprintf(buf, ` xml:%s="%s"`, c.XMLSpace.Name.Local, c.XMLSpace.Value)
- }
- fmt.Fprintf(buf, ` r="%s"`, c.R)
- if c.S != 0 {
- fmt.Fprintf(buf, ` s="%d"`, c.S)
- }
- if c.T != "" {
- fmt.Fprintf(buf, ` t="%s"`, c.T)
- }
- _, _ = buf.WriteString(`>`)
- if c.F != nil {
- _, _ = buf.WriteString(`<f>`)
- _ = xml.EscapeText(buf, []byte(c.F.Content))
- _, _ = buf.WriteString(`</f>`)
- }
- if c.V != "" {
- _, _ = buf.WriteString(`<v>`)
- _ = xml.EscapeText(buf, []byte(c.V))
- _, _ = buf.WriteString(`</v>`)
- }
- _, _ = buf.WriteString(`</c>`)
- }
- // Flush ending the streaming writing process.
- func (sw *StreamWriter) Flush() error {
- if !sw.sheetWritten {
- _, _ = sw.rawData.WriteString(`<sheetData>`)
- sw.sheetWritten = true
- }
- _, _ = sw.rawData.WriteString(`</sheetData>`)
- bulkAppendFields(&sw.rawData, sw.worksheet, 8, 15)
- if sw.mergeCellsCount > 0 {
- sw.mergeCells = fmt.Sprintf(`<mergeCells count="%d">%s</mergeCells>`, sw.mergeCellsCount, sw.mergeCells)
- }
- _, _ = sw.rawData.WriteString(sw.mergeCells)
- bulkAppendFields(&sw.rawData, sw.worksheet, 17, 38)
- _, _ = sw.rawData.WriteString(sw.tableParts)
- bulkAppendFields(&sw.rawData, sw.worksheet, 40, 40)
- _, _ = sw.rawData.WriteString(`</worksheet>`)
- if err := sw.rawData.Flush(); err != nil {
- return err
- }
- sheetPath := sw.File.sheetMap[trimSheetName(sw.Sheet)]
- delete(sw.File.Sheet, sheetPath)
- delete(sw.File.checked, sheetPath)
- delete(sw.File.XLSX, sheetPath)
- return nil
- }
- // bulkAppendFields bulk-appends fields in a worksheet by specified field
- // names order range.
- func bulkAppendFields(w io.Writer, ws *xlsxWorksheet, from, to int) {
- s := reflect.ValueOf(ws).Elem()
- enc := xml.NewEncoder(w)
- for i := 0; i < s.NumField(); i++ {
- if from <= i && i <= to {
- _ = enc.Encode(s.Field(i).Interface())
- }
- }
- }
- // bufferedWriter uses a temp file to store an extended buffer. Writes are
- // always made to an in-memory buffer, which will always succeed. The buffer
- // is written to the temp file with Sync, which may return an error.
- // Therefore, Sync should be periodically called and the error checked.
- type bufferedWriter struct {
- tmp *os.File
- buf bytes.Buffer
- }
- // Write to the in-memory buffer. The err is always nil.
- func (bw *bufferedWriter) Write(p []byte) (n int, err error) {
- return bw.buf.Write(p)
- }
- // WriteString wites to the in-memory buffer. The err is always nil.
- func (bw *bufferedWriter) WriteString(p string) (n int, err error) {
- return bw.buf.WriteString(p)
- }
- // Reader provides read-access to the underlying buffer/file.
- func (bw *bufferedWriter) Reader() (io.Reader, error) {
- if bw.tmp == nil {
- return bytes.NewReader(bw.buf.Bytes()), nil
- }
- if err := bw.Flush(); err != nil {
- return nil, err
- }
- fi, err := bw.tmp.Stat()
- if err != nil {
- return nil, err
- }
- // os.File.ReadAt does not affect the cursor position and is safe to use here
- return io.NewSectionReader(bw.tmp, 0, fi.Size()), nil
- }
- // Sync will write the in-memory buffer to a temp file, if the in-memory
- // buffer has grown large enough. Any error will be returned.
- func (bw *bufferedWriter) Sync() (err error) {
- // Try to use local storage
- if bw.buf.Len() < StreamChunkSize {
- return nil
- }
- if bw.tmp == nil {
- bw.tmp, err = ioutil.TempFile(os.TempDir(), "excelize-")
- if err != nil {
- // can not use local storage
- return nil
- }
- }
- return bw.Flush()
- }
- // Flush the entire in-memory buffer to the temp file, if a temp file is being
- // used.
- func (bw *bufferedWriter) Flush() error {
- if bw.tmp == nil {
- return nil
- }
- _, err := bw.buf.WriteTo(bw.tmp)
- if err != nil {
- return err
- }
- bw.buf.Reset()
- return nil
- }
- // Close the underlying temp file and reset the in-memory buffer.
- func (bw *bufferedWriter) Close() error {
- bw.buf.Reset()
- if bw.tmp == nil {
- return nil
- }
- defer os.Remove(bw.tmp.Name())
- return bw.tmp.Close()
- }
|