2014-12-25 04:16:44 -05:00
|
|
|
/* ====================================================================
   Licensed to the Apache Software Foundation (ASF) under one or more
   contributor license agreements. See the NOTICE file distributed with
   this work for additional information regarding copyright ownership.
   The ASF licenses this file to You under the Apache License, Version 2.0
   (the "License"); you may not use this file except in compliance with
   the License. You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
==================================================================== */
|
|
|
|
package org.apache.poi.stress;
|
|
|
|
|
2016-04-01 02:25:49 -04:00
|
|
|
import static org.junit.Assert.assertFalse;
|
2015-09-13 15:05:40 -04:00
|
|
|
import static org.junit.Assert.assertNotNull;
|
|
|
|
|
2016-04-01 02:25:49 -04:00
|
|
|
import java.io.*;
|
|
|
|
import java.util.HashSet;
|
2015-09-13 15:05:40 -04:00
|
|
|
import java.util.Iterator;
|
2016-04-01 02:25:49 -04:00
|
|
|
import java.util.Set;
|
2014-12-25 04:16:44 -05:00
|
|
|
|
|
|
|
import javax.xml.parsers.ParserConfigurationException;
|
|
|
|
import javax.xml.transform.TransformerException;
|
|
|
|
|
2016-04-01 02:25:49 -04:00
|
|
|
import org.apache.poi.POIXMLException;
|
|
|
|
import org.apache.poi.openxml4j.exceptions.InvalidFormatException;
|
|
|
|
import org.apache.poi.openxml4j.exceptions.OLE2NotOfficeXmlFileException;
|
2015-09-13 15:05:40 -04:00
|
|
|
import org.apache.poi.openxml4j.exceptions.OpenXML4JException;
|
|
|
|
import org.apache.poi.openxml4j.opc.OPCPackage;
|
|
|
|
import org.apache.poi.util.IOUtils;
|
2016-04-01 02:25:49 -04:00
|
|
|
import org.apache.poi.xssf.eventusermodel.XLSX2CSV;
|
2015-09-13 15:05:40 -04:00
|
|
|
import org.apache.poi.xssf.eventusermodel.XSSFReader;
|
2016-04-01 02:25:49 -04:00
|
|
|
import org.apache.poi.xssf.eventusermodel.examples.FromHowTo;
|
2014-12-25 04:16:44 -05:00
|
|
|
import org.apache.poi.xssf.extractor.XSSFExportToXml;
|
|
|
|
import org.apache.poi.xssf.usermodel.XSSFMap;
|
|
|
|
import org.apache.poi.xssf.usermodel.XSSFWorkbook;
|
|
|
|
import org.junit.Test;
|
|
|
|
import org.xml.sax.SAXException;
|
|
|
|
|
|
|
|
public class XSSFFileHandler extends SpreadsheetHandler {
|
2015-09-13 15:05:40 -04:00
|
|
|
@Override
|
2014-12-25 04:16:44 -05:00
|
|
|
public void handleFile(InputStream stream) throws Exception {
|
2015-09-13 15:05:40 -04:00
|
|
|
// ignore password protected files
|
|
|
|
if (POIXMLDocumentHandler.isEncrypted(stream)) return;
|
|
|
|
|
2015-12-31 03:23:04 -05:00
|
|
|
ByteArrayOutputStream out = new ByteArrayOutputStream();
|
|
|
|
IOUtils.copy(stream, out);
|
2015-09-13 15:05:40 -04:00
|
|
|
|
2015-12-31 03:23:04 -05:00
|
|
|
final byte[] bytes = out.toByteArray();
|
|
|
|
final XSSFWorkbook wb;
|
|
|
|
wb = new XSSFWorkbook(new ByteArrayInputStream(bytes));
|
2015-12-30 15:31:30 -05:00
|
|
|
|
2015-09-13 15:05:40 -04:00
|
|
|
// use the combined handler for HSSF/XSSF
|
2016-03-31 09:56:27 -04:00
|
|
|
handleWorkbook(wb);
|
2015-09-13 15:05:40 -04:00
|
|
|
|
2014-12-25 04:16:44 -05:00
|
|
|
// TODO: some documents fail currently...
|
|
|
|
//XSSFFormulaEvaluator evaluator = new XSSFFormulaEvaluator(wb);
|
|
|
|
//evaluator.evaluateAll();
|
|
|
|
|
2015-09-13 15:05:40 -04:00
|
|
|
// also verify general POIFS-stuff
|
|
|
|
new POIXMLDocumentHandler().handlePOIXMLDocument(wb);
|
|
|
|
|
|
|
|
// and finally ensure that exporting to XML works
|
|
|
|
exportToXML(wb);
|
2015-12-31 03:23:04 -05:00
|
|
|
|
|
|
|
checkXSSFReader(OPCPackage.open(new ByteArrayInputStream(bytes)));
|
2016-01-10 15:44:17 -05:00
|
|
|
|
|
|
|
wb.close();
|
2015-09-13 15:05:40 -04:00
|
|
|
}
|
|
|
|
|
2014-12-25 04:16:44 -05:00
|
|
|
|
2016-03-31 09:56:27 -04:00
|
|
|
private void checkXSSFReader(OPCPackage p) throws IOException, OpenXML4JException {
|
2015-09-13 15:05:40 -04:00
|
|
|
XSSFReader reader = new XSSFReader(p);
|
|
|
|
|
|
|
|
// these can be null...
|
|
|
|
InputStream sharedStringsData = reader.getSharedStringsData();
|
|
|
|
if(sharedStringsData != null) {
|
|
|
|
sharedStringsData.close();
|
|
|
|
}
|
|
|
|
reader.getSharedStringsTable();
|
|
|
|
|
|
|
|
InputStream stylesData = reader.getStylesData();
|
|
|
|
if(stylesData != null) {
|
|
|
|
stylesData.close();
|
|
|
|
}
|
|
|
|
reader.getStylesTable();
|
|
|
|
|
|
|
|
InputStream themesData = reader.getThemesData();
|
|
|
|
if(themesData != null) {
|
|
|
|
themesData.close();
|
|
|
|
}
|
|
|
|
|
|
|
|
assertNotNull(reader.getWorkbookData());
|
|
|
|
|
|
|
|
Iterator<InputStream> sheetsData = reader.getSheetsData();
|
|
|
|
while(sheetsData.hasNext()) {
|
|
|
|
InputStream str = sheetsData.next();
|
|
|
|
str.close();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-12-25 04:16:44 -05:00
|
|
|
private void exportToXML(XSSFWorkbook wb) throws SAXException,
|
|
|
|
ParserConfigurationException, TransformerException {
|
|
|
|
for (XSSFMap map : wb.getCustomXMLMappings()) {
|
|
|
|
XSSFExportToXml exporter = new XSSFExportToXml(map);
|
|
|
|
|
|
|
|
ByteArrayOutputStream os = new ByteArrayOutputStream();
|
|
|
|
exporter.exportToXML(os, true);
|
|
|
|
}
|
|
|
|
}
|
2016-04-01 02:25:49 -04:00
|
|
|
|
|
|
|
private static final Set<String> EXPECTED_ADDITIONAL_FAILURES = new HashSet<String>();
|
|
|
|
static {
|
|
|
|
// expected sheet-id not found
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/52348.xlsx");
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/59021.xlsx");
|
|
|
|
// zip-bomb
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/54764.xlsx");
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/54764-2.xlsx");
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/54764.xlsx");
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/poc-xmlbomb.xlsx");
|
|
|
|
// strict OOXML
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/57914.xlsx");
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/SampleSS.strict.xlsx");
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/SimpleStrict.xlsx");
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/sample.strict.xlsx");
|
|
|
|
// binary format
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/Simple.xlsb");
|
|
|
|
// TODO: good to ignore?
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.add("spreadsheet/sample-beta.xlsx");
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
|
|
|
public void handleAdditional(File file) throws Exception {
|
|
|
|
// redirect stdout as the examples often write lots of text
|
|
|
|
PrintStream oldOut = System.out;
|
|
|
|
try {
|
|
|
|
System.setOut(new PrintStream(new OutputStream() {
|
|
|
|
@Override
|
|
|
|
public void write(int b) throws IOException {
|
|
|
|
}
|
|
|
|
}));
|
|
|
|
FromHowTo.main(new String[]{file.getAbsolutePath()});
|
|
|
|
XLSX2CSV.main(new String[]{file.getAbsolutePath()});
|
|
|
|
|
|
|
|
assertFalse("Expected Extraction to fail for file " + file + " and handler " + this + ", but did not fail!",
|
|
|
|
EXPECTED_ADDITIONAL_FAILURES.contains(file.getParentFile().getName() + "/" + file.getName()));
|
|
|
|
|
|
|
|
} catch (OLE2NotOfficeXmlFileException e) {
|
|
|
|
// we have some files that are not actually OOXML and thus cannot be tested here
|
|
|
|
} catch (IllegalArgumentException e) {
|
|
|
|
if(!EXPECTED_ADDITIONAL_FAILURES.contains(file.getParentFile().getName() + "/" + file.getName())) {
|
|
|
|
throw e;
|
|
|
|
}
|
|
|
|
} catch (InvalidFormatException e) {
|
|
|
|
if(!EXPECTED_ADDITIONAL_FAILURES.contains(file.getParentFile().getName() + "/" + file.getName())) {
|
|
|
|
throw e;
|
|
|
|
}
|
|
|
|
} catch (IOException e) {
|
|
|
|
if(!EXPECTED_ADDITIONAL_FAILURES.contains(file.getParentFile().getName() + "/" + file.getName())) {
|
|
|
|
throw e;
|
|
|
|
}
|
|
|
|
} catch (POIXMLException e) {
|
|
|
|
if(!EXPECTED_ADDITIONAL_FAILURES.contains(file.getParentFile().getName() + "/" + file.getName())) {
|
|
|
|
throw e;
|
|
|
|
}
|
|
|
|
} finally {
|
|
|
|
System.setOut(oldOut);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-09-13 15:05:40 -04:00
|
|
|
// a test-case to test this locally without executing the full TestAllFiles
|
|
|
|
@Test
|
|
|
|
public void test() throws Exception {
|
2015-12-31 03:23:04 -05:00
|
|
|
InputStream stream = new BufferedInputStream(new FileInputStream("test-data/spreadsheet/ref-56737.xlsx"));
|
2015-09-13 15:05:40 -04:00
|
|
|
try {
|
|
|
|
handleFile(stream);
|
|
|
|
} finally {
|
|
|
|
stream.close();
|
|
|
|
}
|
|
|
|
}
|
2015-02-27 09:58:41 -05:00
|
|
|
|
|
|
|
// a test-case to test this locally without executing the full TestAllFiles
|
|
|
|
@Test
|
|
|
|
public void testExtractor() throws Exception {
|
2015-12-31 03:23:04 -05:00
|
|
|
handleExtracting(new File("test-data/spreadsheet/ref-56737.xlsx"));
|
2015-02-27 09:58:41 -05:00
|
|
|
}
|
2016-04-01 02:25:49 -04:00
|
|
|
|
|
|
|
@Test
|
|
|
|
public void testAdditional() throws Exception {
|
|
|
|
handleAdditional(new File("test-data/spreadsheet/poc-xmlbomb.xlsx"));
|
|
|
|
}
|
|
|
|
}
|