// Copyright 2016 - 2021 The excelize Authors. All rights reserved. Use of // this source code is governed by a BSD-style license that can be found in // the LICENSE file. // // Package excelize providing a set of functions that allow you to write to // and read from XLSX / XLSM / XLTM files. Supports reading and writing // spreadsheet documents generated by Microsoft Excelâ„¢ 2007 and later. Supports // complex components by high compatibility, and provided streaming API for // generating or reading data from a worksheet with huge amounts of data. This // library needs Go version 1.15 or later. package excelize import ( "bytes" "encoding/xml" "fmt" "io" "io/ioutil" "os" "reflect" "strconv" "strings" "time" ) // StreamWriter defined the type of stream writer. type StreamWriter struct { File *File Sheet string SheetID int sheetWritten bool cols string worksheet *xlsxWorksheet rawData bufferedWriter mergeCellsCount int mergeCells string tableParts string } // NewStreamWriter return stream writer struct by given worksheet name for // generate new worksheet with large amounts of data. Note that after set // rows, you must call the 'Flush' method to end the streaming writing // process and ensure that the order of line numbers is ascending, the common // API and stream API can't be work mixed to writing data on the worksheets, // you can't get cell value when in-memory chunks data over 16MB. For // example, set data for worksheet of size 102400 rows x 50 columns with // numbers and style: // // file := excelize.NewFile() // streamWriter, err := file.NewStreamWriter("Sheet1") // if err != nil { // fmt.Println(err) // } // styleID, err := file.NewStyle(`{"font":{"color":"#777777"}}`) // if err != nil { // fmt.Println(err) // } // if err := streamWriter.SetRow("A1", []interface{}{excelize.Cell{StyleID: styleID, Value: "Data"}}, // excelize.RowOpts{Height: 45, Hidden: false}); err != nil { // fmt.Println(err) // } // for rowID := 2; rowID <= 102400; rowID++ { // row := make([]interface{}, 50) // for colID := 0; colID < 50; colID++ { // row[colID] = rand.Intn(640000) // } // cell, _ := excelize.CoordinatesToCellName(1, rowID) // if err := streamWriter.SetRow(cell, row); err != nil { // fmt.Println(err) // } // } // if err := streamWriter.Flush(); err != nil { // fmt.Println(err) // } // if err := file.SaveAs("Book1.xlsx"); err != nil { // fmt.Println(err) // } // // Set cell value and cell formula for a worksheet with stream writer: // // err := streamWriter.SetRow("A1", []interface{}{ // excelize.Cell{Value: 1}, // excelize.Cell{Value: 2}, // excelize.Cell{Formula: "SUM(A1,B1)"}}); // // Set cell value and rows style for a worksheet with stream writer: // // err := streamWriter.SetRow("A1", []interface{}{ // excelize.Cell{Value: 1}}, // excelize.RowOpts{StyleID: styleID, Height: 20, Hidden: false}); // func (f *File) NewStreamWriter(sheet string) (*StreamWriter, error) { sheetID := f.getSheetID(sheet) if sheetID == -1 { return nil, fmt.Errorf("sheet %s is not exist", sheet) } sw := &StreamWriter{ File: f, Sheet: sheet, SheetID: sheetID, } var err error sw.worksheet, err = f.workSheetReader(sheet) if err != nil { return nil, err } sheetPath := f.sheetMap[trimSheetName(sheet)] if f.streams == nil { f.streams = make(map[string]*StreamWriter) } f.streams[sheetPath] = sw _, _ = sw.rawData.WriteString(XMLHeader + ``, rID) sw.File.addContentTypePart(tableID, "table") b, _ := xml.Marshal(table) sw.File.saveFileList(tableXML, b) return nil } // Extract values from a row in the StreamWriter. func (sw *StreamWriter) getRowValues(hrow, hcol, vcol int) (res []string, err error) { res = make([]string, vcol-hcol+1) r, err := sw.rawData.Reader() if err != nil { return nil, err } dec := sw.File.xmlNewDecoder(r) for { token, err := dec.Token() if err == io.EOF { return res, nil } if err != nil { return nil, err } startElement, ok := getRowElement(token, hrow) if !ok { continue } // decode cells var row xlsxRow if err := dec.DecodeElement(&row, &startElement); err != nil { return nil, err } for _, c := range row.C { col, _, err := CellNameToCoordinates(c.R) if err != nil { return nil, err } if col < hcol || col > vcol { continue } res[col-hcol] = c.V } return res, nil } } // Check if the token is an XLSX row with the matching row number. func getRowElement(token xml.Token, hrow int) (startElement xml.StartElement, ok bool) { startElement, ok = token.(xml.StartElement) if !ok { return } ok = startElement.Name.Local == "row" if !ok { return } ok = false for _, attr := range startElement.Attr { if attr.Name.Local != "r" { continue } row, _ := strconv.Atoi(attr.Value) if row == hrow { ok = true return } } return } // Cell can be used directly in StreamWriter.SetRow to specify a style and // a value. type Cell struct { StyleID int Formula string Value interface{} } // RowOpts define the options for the set row, it can be used directly in // StreamWriter.SetRow to specify the style and properties of the row. type RowOpts struct { Height float64 Hidden bool StyleID int } // SetRow writes an array to stream rows by giving a worksheet name, starting // coordinate and a pointer to an array of values. Note that you must call the // 'Flush' method to end the streaming writing process. // // As a special case, if Cell is used as a value, then the Cell.StyleID will be // applied to that cell. func (sw *StreamWriter) SetRow(axis string, values []interface{}, opts ...RowOpts) error { col, row, err := CellNameToCoordinates(axis) if err != nil { return err } if !sw.sheetWritten { if len(sw.cols) > 0 { _, _ = sw.rawData.WriteString("" + sw.cols + "") } _, _ = sw.rawData.WriteString(``) sw.sheetWritten = true } attrs, err := marshalRowAttrs(opts...) if err != nil { return err } fmt.Fprintf(&sw.rawData, ``, row, attrs) for i, val := range values { axis, err := CoordinatesToCellName(col+i, row) if err != nil { return err } c := xlsxC{R: axis} if v, ok := val.(Cell); ok { c.S = v.StyleID val = v.Value setCellFormula(&c, v.Formula) } else if v, ok := val.(*Cell); ok && v != nil { c.S = v.StyleID val = v.Value setCellFormula(&c, v.Formula) } if err = setCellValFunc(&c, val); err != nil { _, _ = sw.rawData.WriteString(``) return err } writeCell(&sw.rawData, c) } _, _ = sw.rawData.WriteString(``) return sw.rawData.Sync() } // marshalRowAttrs prepare attributes of the row by given options. func marshalRowAttrs(opts ...RowOpts) (attrs string, err error) { var opt *RowOpts for i := range opts { opt = &opts[i] } if opt == nil { return } if opt.Height > MaxRowHeight { err = ErrMaxRowHeight return } if opt.StyleID > 0 { attrs += fmt.Sprintf(` s="%d" customFormat="true"`, opt.StyleID) } if opt.Height > 0 { attrs += fmt.Sprintf(` ht="%v" customHeight="true"`, opt.Height) } if opt.Hidden { attrs += ` hidden="true"` } return } // SetColWidth provides a function to set the width of a single column or // multiple columns for the StreamWriter. Note that you must call // the 'SetColWidth' function before the 'SetRow' function. For example set // the width column B:C as 20: // // err := streamWriter.SetColWidth(2, 3, 20) // func (sw *StreamWriter) SetColWidth(min, max int, width float64) error { if sw.sheetWritten { return ErrStreamSetColWidth } if min > TotalColumns || max > TotalColumns { return ErrColumnNumber } if min < 1 || max < 1 { return ErrColumnNumber } if width > MaxColumnWidth { return ErrColumnWidth } if min > max { min, max = max, min } sw.cols += fmt.Sprintf(``, min, max, width) return nil } // MergeCell provides a function to merge cells by a given coordinate area for // the StreamWriter. Don't create a merged cell that overlaps with another // existing merged cell. func (sw *StreamWriter) MergeCell(hcell, vcell string) error { _, err := areaRangeToCoordinates(hcell, vcell) if err != nil { return err } sw.mergeCellsCount++ sw.mergeCells += fmt.Sprintf(``, hcell, vcell) return nil } // setCellFormula provides a function to set formula of a cell. func setCellFormula(c *xlsxC, formula string) { if formula != "" { c.F = &xlsxF{Content: formula} } } // setCellValFunc provides a function to set value of a cell. func setCellValFunc(c *xlsxC, val interface{}) (err error) { switch val := val.(type) { case int, int8, int16, int32, int64, uint, uint8, uint16, uint32, uint64: err = setCellIntFunc(c, val) case float32: c.T, c.V = setCellFloat(float64(val), -1, 32) case float64: c.T, c.V = setCellFloat(val, -1, 64) case string: c.T, c.V, c.XMLSpace = setCellStr(val) case []byte: c.T, c.V, c.XMLSpace = setCellStr(string(val)) case time.Duration: c.T, c.V = setCellDuration(val) case time.Time: c.T, c.V, _, err = setCellTime(val) case bool: c.T, c.V = setCellBool(val) case nil: c.T, c.V, c.XMLSpace = setCellStr("") default: c.T, c.V, c.XMLSpace = setCellStr(fmt.Sprint(val)) } return err } // setCellIntFunc is a wrapper of SetCellInt. func setCellIntFunc(c *xlsxC, val interface{}) (err error) { switch val := val.(type) { case int: c.T, c.V = setCellInt(val) case int8: c.T, c.V = setCellInt(int(val)) case int16: c.T, c.V = setCellInt(int(val)) case int32: c.T, c.V = setCellInt(int(val)) case int64: c.T, c.V = setCellInt(int(val)) case uint: c.T, c.V = setCellInt(int(val)) case uint8: c.T, c.V = setCellInt(int(val)) case uint16: c.T, c.V = setCellInt(int(val)) case uint32: c.T, c.V = setCellInt(int(val)) case uint64: c.T, c.V = setCellInt(int(val)) default: } return } func writeCell(buf *bufferedWriter, c xlsxC) { _, _ = buf.WriteString(``) if c.F != nil { _, _ = buf.WriteString(``) _ = xml.EscapeText(buf, []byte(c.F.Content)) _, _ = buf.WriteString(``) } if c.V != "" { _, _ = buf.WriteString(``) _ = xml.EscapeText(buf, []byte(c.V)) _, _ = buf.WriteString(``) } _, _ = buf.WriteString(``) } // Flush ending the streaming writing process. func (sw *StreamWriter) Flush() error { if !sw.sheetWritten { _, _ = sw.rawData.WriteString(``) sw.sheetWritten = true } _, _ = sw.rawData.WriteString(``) bulkAppendFields(&sw.rawData, sw.worksheet, 8, 15) if sw.mergeCellsCount > 0 { sw.mergeCells = fmt.Sprintf(`%s`, sw.mergeCellsCount, sw.mergeCells) } _, _ = sw.rawData.WriteString(sw.mergeCells) bulkAppendFields(&sw.rawData, sw.worksheet, 17, 38) _, _ = sw.rawData.WriteString(sw.tableParts) bulkAppendFields(&sw.rawData, sw.worksheet, 40, 40) _, _ = sw.rawData.WriteString(``) if err := sw.rawData.Flush(); err != nil { return err } sheetPath := sw.File.sheetMap[trimSheetName(sw.Sheet)] sw.File.Sheet.Delete(sheetPath) delete(sw.File.checked, sheetPath) sw.File.Pkg.Delete(sheetPath) return nil } // bulkAppendFields bulk-appends fields in a worksheet by specified field // names order range. func bulkAppendFields(w io.Writer, ws *xlsxWorksheet, from, to int) { s := reflect.ValueOf(ws).Elem() enc := xml.NewEncoder(w) for i := 0; i < s.NumField(); i++ { if from <= i && i <= to { _ = enc.Encode(s.Field(i).Interface()) } } } // bufferedWriter uses a temp file to store an extended buffer. Writes are // always made to an in-memory buffer, which will always succeed. The buffer // is written to the temp file with Sync, which may return an error. // Therefore, Sync should be periodically called and the error checked. type bufferedWriter struct { tmp *os.File buf bytes.Buffer } // Write to the in-memory buffer. The err is always nil. func (bw *bufferedWriter) Write(p []byte) (n int, err error) { return bw.buf.Write(p) } // WriteString wites to the in-memory buffer. The err is always nil. func (bw *bufferedWriter) WriteString(p string) (n int, err error) { return bw.buf.WriteString(p) } // Reader provides read-access to the underlying buffer/file. func (bw *bufferedWriter) Reader() (io.Reader, error) { if bw.tmp == nil { return bytes.NewReader(bw.buf.Bytes()), nil } if err := bw.Flush(); err != nil { return nil, err } fi, err := bw.tmp.Stat() if err != nil { return nil, err } // os.File.ReadAt does not affect the cursor position and is safe to use here return io.NewSectionReader(bw.tmp, 0, fi.Size()), nil } // Sync will write the in-memory buffer to a temp file, if the in-memory // buffer has grown large enough. Any error will be returned. func (bw *bufferedWriter) Sync() (err error) { // Try to use local storage if bw.buf.Len() < StreamChunkSize { return nil } if bw.tmp == nil { bw.tmp, err = ioutil.TempFile(os.TempDir(), "excelize-") if err != nil { // can not use local storage return nil } } return bw.Flush() } // Flush the entire in-memory buffer to the temp file, if a temp file is being // used. func (bw *bufferedWriter) Flush() error { if bw.tmp == nil { return nil } _, err := bw.buf.WriteTo(bw.tmp) if err != nil { return err } bw.buf.Reset() return nil } // Close the underlying temp file and reset the in-memory buffer. func (bw *bufferedWriter) Close() error { bw.buf.Reset() if bw.tmp == nil { return nil } defer os.Remove(bw.tmp.Name()) return bw.tmp.Close() }