stream_test.go 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487
  1. package xlsx
  2. import (
  3. "bytes"
  4. "fmt"
  5. "io"
  6. "reflect"
  7. "strings"
  8. . "gopkg.in/check.v1"
  9. )
  10. const (
  11. TestsShouldMakeRealFiles = false
  12. )
  13. type StreamSuite struct{}
  14. var _ = Suite(&SheetSuite{})
  15. func (s *StreamSuite) TestTestsShouldMakeRealFilesShouldBeFalse(t *C) {
  16. if TestsShouldMakeRealFiles {
  17. t.Fatal("TestsShouldMakeRealFiles should only be true for local debugging. Don't forget to switch back before commiting.")
  18. }
  19. }
  20. func (s *StreamSuite) TestXlsxStreamWrite(t *C) {
  21. // When shouldMakeRealFiles is set to true this test will make actual XLSX files in the file system.
  22. // This is useful to ensure files open in Excel, Numbers, Google Docs, etc.
  23. // In case of issues you can use "Open XML SDK 2.5" to diagnose issues in generated XLSX files:
  24. // https://www.microsoft.com/en-us/download/details.aspx?id=30425
  25. testCases := []struct {
  26. testName string
  27. sheetNames []string
  28. workbookData [][][]string
  29. headerTypes [][]*CellType
  30. expectedError error
  31. }{
  32. {
  33. testName: "One Sheet",
  34. sheetNames: []string{
  35. "Sheet1",
  36. },
  37. workbookData: [][][]string{
  38. {
  39. {"Token", "Name", "Price", "SKU"},
  40. {"123", "Taco", "300", "0000000123"},
  41. },
  42. },
  43. headerTypes: [][]*CellType{
  44. {nil, CellTypeString.Ptr(), nil, CellTypeString.Ptr()},
  45. },
  46. },
  47. {
  48. testName: "One Column",
  49. sheetNames: []string{
  50. "Sheet1",
  51. },
  52. workbookData: [][][]string{
  53. {
  54. {"Token"},
  55. {"123"},
  56. },
  57. },
  58. },
  59. {
  60. testName: "Several Sheets, with different numbers of columns and rows",
  61. sheetNames: []string{
  62. "Sheet 1", "Sheet 2", "Sheet3",
  63. },
  64. workbookData: [][][]string{
  65. {
  66. {"Token", "Name", "Price", "SKU"},
  67. {"123", "Taco", "300", "0000000123"},
  68. },
  69. {
  70. {"Token", "Name", "Price", "SKU", "Stock"},
  71. {"456", "Salsa", "200", "0346", "1"},
  72. {"789", "Burritos", "400", "754", "3"},
  73. },
  74. {
  75. {"Token", "Name", "Price"},
  76. {"9853", "Guacamole", "500"},
  77. {"2357", "Margarita", "700"},
  78. },
  79. },
  80. },
  81. {
  82. testName: "Two Sheets with same the name",
  83. sheetNames: []string{
  84. "Sheet 1", "Sheet 1",
  85. },
  86. workbookData: [][][]string{
  87. {
  88. {"Token", "Name", "Price", "SKU"},
  89. {"123", "Taco", "300", "0000000123"},
  90. },
  91. {
  92. {"Token", "Name", "Price", "SKU", "Stock"},
  93. {"456", "Salsa", "200", "0346", "1"},
  94. {"789", "Burritos", "400", "754", "3"},
  95. },
  96. },
  97. expectedError: fmt.Errorf("duplicate sheet name '%s'.", "Sheet 1"),
  98. },
  99. {
  100. testName: "One Sheet Registered, tries to write to two",
  101. sheetNames: []string{
  102. "Sheet 1",
  103. },
  104. workbookData: [][][]string{
  105. {
  106. {"Token", "Name", "Price", "SKU"},
  107. {"123", "Taco", "300", "0000000123"},
  108. },
  109. {
  110. {"Token", "Name", "Price", "SKU"},
  111. {"456", "Salsa", "200", "0346"},
  112. },
  113. },
  114. expectedError: AlreadyOnLastSheetError,
  115. },
  116. {
  117. testName: "One Sheet, too many columns in row 1",
  118. sheetNames: []string{
  119. "Sheet 1",
  120. },
  121. workbookData: [][][]string{
  122. {
  123. {"Token", "Name", "Price", "SKU"},
  124. {"123", "Taco", "300", "0000000123", "asdf"},
  125. },
  126. },
  127. expectedError: WrongNumberOfRowsError,
  128. },
  129. {
  130. testName: "One Sheet, too few columns in row 1",
  131. sheetNames: []string{
  132. "Sheet 1",
  133. },
  134. workbookData: [][][]string{
  135. {
  136. {"Token", "Name", "Price", "SKU"},
  137. {"123", "Taco", "300"},
  138. },
  139. },
  140. expectedError: WrongNumberOfRowsError,
  141. },
  142. {
  143. testName: "Lots of Sheets, only writes rows to one, only writes headers to one, should not error and should still create a valid file",
  144. sheetNames: []string{
  145. "Sheet 1", "Sheet 2", "Sheet 3", "Sheet 4", "Sheet 5", "Sheet 6",
  146. },
  147. workbookData: [][][]string{
  148. {
  149. {"Token", "Name", "Price", "SKU"},
  150. {"123", "Taco", "300", "0000000123"},
  151. },
  152. {{}},
  153. {{"Id", "Unit Cost"}},
  154. {{}},
  155. {{}},
  156. {{}},
  157. },
  158. },
  159. {
  160. testName: "Two Sheets, only writes to one, should not error and should still create a valid file",
  161. sheetNames: []string{
  162. "Sheet 1", "Sheet 2",
  163. },
  164. workbookData: [][][]string{
  165. {
  166. {"Token", "Name", "Price", "SKU"},
  167. {"123", "Taco", "300", "0000000123"},
  168. },
  169. {{}},
  170. },
  171. },
  172. {
  173. testName: "Larger Sheet",
  174. sheetNames: []string{
  175. "Sheet 1",
  176. },
  177. workbookData: [][][]string{
  178. {
  179. {"Token", "Name", "Price", "SKU", "Token", "Name", "Price", "SKU", "Token", "Name", "Price", "SKU", "Token", "Name", "Price", "SKU", "Token", "Name", "Price", "SKU", "Token", "Name", "Price", "SKU"},
  180. {"123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123"},
  181. {"456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346"},
  182. {"789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754"},
  183. {"123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123"},
  184. {"456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346"},
  185. {"789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754"},
  186. {"123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123"},
  187. {"456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346"},
  188. {"789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754"},
  189. {"123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123"},
  190. {"456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346"},
  191. {"789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754"},
  192. {"123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123"},
  193. {"456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346"},
  194. {"789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754"},
  195. {"123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123"},
  196. {"456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346"},
  197. {"789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754"},
  198. {"123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123"},
  199. {"456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346"},
  200. {"789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754"},
  201. {"123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123", "123", "Taco", "300", "0000000123"},
  202. {"456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346", "456", "Salsa", "200", "0346"},
  203. {"789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754", "789", "Burritos", "400", "754"},
  204. },
  205. },
  206. },
  207. {
  208. testName: "UTF-8 Characters. This XLSX File loads correctly with Excel, Numbers, and Google Docs. It also passes Microsoft's Office File Format Validator.",
  209. sheetNames: []string{
  210. "Sheet1",
  211. },
  212. workbookData: [][][]string{
  213. {
  214. // String courtesy of https://github.com/minimaxir/big-list-of-naughty-strings/
  215. // Header row contains the tags that I am filtering on
  216. {"Token", endSheetDataTag, "Price", fmt.Sprintf(dimensionTag, "A1:D1")},
  217. // Japanese and emojis
  218. {"123", "パーティーへ行かないか", "300", "🍕🐵 🙈 🙉 🙊"},
  219. // XML encoder/parser test strings
  220. {"123", `<?xml version="1.0" encoding="ISO-8859-1"?>`, "300", `<?xml version="1.0" encoding="ISO-8859-1"?><!DOCTYPE foo [ <!ELEMENT foo ANY ><!ENTITY xxe SYSTEM "file:///etc/passwd" >]><foo>&xxe;</foo>`},
  221. // Upside down text and Right to Left Arabic text
  222. {"123", `˙ɐnbᴉlɐ ɐuƃɐɯ ǝɹolop ʇǝ ǝɹoqɐl ʇn ʇunpᴉpᴉɔuᴉ ɹodɯǝʇ poɯsnᴉǝ op pǝs 'ʇᴉlǝ ƃuᴉɔsᴉdᴉpɐ ɹnʇǝʇɔǝsuoɔ 'ʇǝɯɐ ʇᴉs ɹolop ɯnsdᴉ ɯǝɹo˥
  223. 00˙Ɩ$-`, "300", `ﷺ`},
  224. {"123", "Taco", "300", "0000000123"},
  225. },
  226. },
  227. },
  228. }
  229. for i, testCase := range testCases {
  230. var filePath string
  231. var buffer bytes.Buffer
  232. if TestsShouldMakeRealFiles {
  233. filePath = fmt.Sprintf("Workbook%d.xlsx", i)
  234. }
  235. err := writeStreamFile(filePath, &buffer, testCase.sheetNames, testCase.workbookData, testCase.headerTypes, TestsShouldMakeRealFiles)
  236. if err != testCase.expectedError && err.Error() != testCase.expectedError.Error() {
  237. t.Fatalf("Error differs from expected error. Error: %v, Expected Error: %v ", err, testCase.expectedError)
  238. }
  239. if testCase.expectedError != nil {
  240. return
  241. }
  242. // read the file back with the xlsx package
  243. var bufReader *bytes.Reader
  244. var size int64
  245. if !TestsShouldMakeRealFiles {
  246. bufReader = bytes.NewReader(buffer.Bytes())
  247. size = bufReader.Size()
  248. }
  249. actualSheetNames, actualWorkbookData := readXLSXFile(t, filePath, bufReader, size, TestsShouldMakeRealFiles)
  250. // check if data was able to be read correctly
  251. if !reflect.DeepEqual(actualSheetNames, testCase.sheetNames) {
  252. t.Fatal("Expected sheet names to be equal")
  253. }
  254. if !reflect.DeepEqual(actualWorkbookData, testCase.workbookData) {
  255. t.Fatal("Expected workbook data to be equal")
  256. }
  257. }
  258. }
  259. // The purpose of TestXlsxStyleBehavior is to ensure that initMaxStyleId has the correct starting value
  260. // and that the logic in AddSheet() that predicts Style IDs is correct.
  261. func (s *StreamSuite) TestXlsxStyleBehavior(t *C) {
  262. file := NewFile()
  263. sheet, err := file.AddSheet("Sheet 1")
  264. if err != nil {
  265. t.Fatal(err)
  266. }
  267. row := sheet.AddRow()
  268. rowData := []string{"testing", "1", "2", "3"}
  269. if count := row.WriteSlice(&rowData, -1); count != len(rowData) {
  270. t.Fatal("not enough cells written")
  271. }
  272. parts, err := file.MarshallParts()
  273. styleSheet, ok := parts["xl/styles.xml"]
  274. if !ok {
  275. t.Fatal("no style sheet")
  276. }
  277. // Created an XLSX file with only the default style.
  278. // We expect that the number of styles is one more than our max index constant.
  279. // This means the library adds two styles by default.
  280. if !strings.Contains(styleSheet, fmt.Sprintf(`<cellXfs count="%d">`, initMaxStyleId+1)) {
  281. t.Fatal("Expected sheet to have two styles")
  282. }
  283. file = NewFile()
  284. sheet, err = file.AddSheet("Sheet 1")
  285. if err != nil {
  286. t.Fatal(err)
  287. }
  288. row = sheet.AddRow()
  289. rowData = []string{"testing", "1", "2", "3", "4"}
  290. if count := row.WriteSlice(&rowData, -1); count != len(rowData) {
  291. t.Fatal("not enough cells written")
  292. }
  293. sheet.Cols[0].SetType(CellTypeString)
  294. sheet.Cols[1].SetType(CellTypeString)
  295. sheet.Cols[3].SetType(CellTypeNumeric)
  296. sheet.Cols[4].SetType(CellTypeString)
  297. parts, err = file.MarshallParts()
  298. styleSheet, ok = parts["xl/styles.xml"]
  299. if !ok {
  300. t.Fatal("no style sheet")
  301. }
  302. // Created an XLSX file with two distinct cell types, which should create two new styles.
  303. // The same cell type was added three times, this should be coalesced into the same style rather than
  304. // recreating the style. This XLSX stream library depends on this behavior when predicting the next style id.
  305. if !strings.Contains(styleSheet, fmt.Sprintf(`<cellXfs count="%d">`, initMaxStyleId+1+2)) {
  306. t.Fatal("Expected sheet to have four styles")
  307. }
  308. }
  309. // writeStreamFile will write the file using this stream package
  310. func writeStreamFile(filePath string, fileBuffer io.Writer, sheetNames []string, workbookData [][][]string, headerTypes [][]*CellType, shouldMakeRealFiles bool) error {
  311. var file *StreamFileBuilder
  312. var err error
  313. if shouldMakeRealFiles {
  314. file, err = NewStreamFileBuilderForPath(filePath)
  315. if err != nil {
  316. return err
  317. }
  318. } else {
  319. file = NewStreamFileBuilder(fileBuffer)
  320. }
  321. for i, sheetName := range sheetNames {
  322. header := workbookData[i][0]
  323. var sheetHeaderTypes []*CellType
  324. if i < len(headerTypes) {
  325. sheetHeaderTypes = headerTypes[i]
  326. }
  327. err := file.AddSheet(sheetName, header, sheetHeaderTypes)
  328. if err != nil {
  329. return err
  330. }
  331. }
  332. streamFile, err := file.Build()
  333. if err != nil {
  334. return err
  335. }
  336. for i, sheetData := range workbookData {
  337. if i != 0 {
  338. err = streamFile.NextSheet()
  339. if err != nil {
  340. return err
  341. }
  342. }
  343. for i, row := range sheetData {
  344. if i == 0 {
  345. continue
  346. }
  347. err = streamFile.Write(row)
  348. if err != nil {
  349. return err
  350. }
  351. }
  352. }
  353. err = streamFile.Close()
  354. if err != nil {
  355. return err
  356. }
  357. return nil
  358. }
  359. // readXLSXFile will read the file using the xlsx package.
  360. func readXLSXFile(t *C, filePath string, fileBuffer io.ReaderAt, size int64, shouldMakeRealFiles bool) ([]string, [][][]string) {
  361. var readFile *File
  362. var err error
  363. if shouldMakeRealFiles {
  364. readFile, err = OpenFile(filePath)
  365. if err != nil {
  366. t.Fatal(err)
  367. }
  368. } else {
  369. readFile, err = OpenReaderAt(fileBuffer, size)
  370. if err != nil {
  371. t.Fatal(err)
  372. }
  373. }
  374. var actualWorkbookData [][][]string
  375. var sheetNames []string
  376. for _, sheet := range readFile.Sheets {
  377. sheetData := [][]string{}
  378. for _, row := range sheet.Rows {
  379. data := []string{}
  380. for _, cell := range row.Cells {
  381. str, err := cell.FormattedValue()
  382. if err != nil {
  383. t.Fatal(err)
  384. }
  385. data = append(data, str)
  386. }
  387. sheetData = append(sheetData, data)
  388. }
  389. sheetNames = append(sheetNames, sheet.Name)
  390. actualWorkbookData = append(actualWorkbookData, sheetData)
  391. }
  392. return sheetNames, actualWorkbookData
  393. }
  394. func (s *StreamSuite) TestAddSheetErrorsAfterBuild(t *C) {
  395. file := NewStreamFileBuilder(bytes.NewBuffer(nil))
  396. err := file.AddSheet("Sheet1", []string{"Header"}, nil)
  397. if err != nil {
  398. t.Fatal(err)
  399. }
  400. err = file.AddSheet("Sheet2", []string{"Header2"}, nil)
  401. if err != nil {
  402. t.Fatal(err)
  403. }
  404. _, err = file.Build()
  405. if err != nil {
  406. t.Fatal(err)
  407. }
  408. err = file.AddSheet("Sheet3", []string{"Header3"}, nil)
  409. if err != BuiltStreamFileBuilderError {
  410. t.Fatal(err)
  411. }
  412. }
  413. func (s *StreamSuite) TestBuildErrorsAfterBuild(t *C) {
  414. file := NewStreamFileBuilder(bytes.NewBuffer(nil))
  415. err := file.AddSheet("Sheet1", []string{"Header"}, nil)
  416. if err != nil {
  417. t.Fatal(err)
  418. }
  419. err = file.AddSheet("Sheet2", []string{"Header2"}, nil)
  420. if err != nil {
  421. t.Fatal(err)
  422. }
  423. _, err = file.Build()
  424. if err != nil {
  425. t.Fatal(err)
  426. }
  427. _, err = file.Build()
  428. if err != BuiltStreamFileBuilderError {
  429. t.Fatal(err)
  430. }
  431. }
  432. func (s *StreamSuite) TestCloseWithNothingWrittenToSheets(t *C) {
  433. buffer := bytes.NewBuffer(nil)
  434. file := NewStreamFileBuilder(buffer)
  435. sheetNames := []string{"Sheet1", "Sheet2"}
  436. workbookData := [][][]string{
  437. {{"Header1", "Header2"}},
  438. {{"Header3", "Header4"}},
  439. }
  440. err := file.AddSheet(sheetNames[0], workbookData[0][0], nil)
  441. if err != nil {
  442. t.Fatal(err)
  443. }
  444. err = file.AddSheet(sheetNames[1], workbookData[1][0], nil)
  445. if err != nil {
  446. t.Fatal(err)
  447. }
  448. stream, err := file.Build()
  449. if err != nil {
  450. t.Fatal(err)
  451. }
  452. err = stream.Close()
  453. if err != nil {
  454. t.Fatal(err)
  455. }
  456. bufReader := bytes.NewReader(buffer.Bytes())
  457. size := bufReader.Size()
  458. actualSheetNames, actualWorkbookData := readXLSXFile(t, "", bufReader, size, false)
  459. // check if data was able to be read correctly
  460. if !reflect.DeepEqual(actualSheetNames, sheetNames) {
  461. t.Fatal("Expected sheet names to be equal")
  462. }
  463. if !reflect.DeepEqual(actualWorkbookData, workbookData) {
  464. t.Fatal("Expected workbook data to be equal")
  465. }
  466. }