java对execl的操作

最新推荐文章于 2024-04-19 10:52:05 发布

hy飞无

最新推荐文章于 2024-04-19 10:52:05 发布

阅读量750

点赞数

分类专栏： java

本文链接：https://blog.csdn.net/hyhanyu/article/details/81068194

版权

java 专栏收录该内容

47 篇文章 0 订阅

订阅专栏

HSSFWorkbook 对应操作的execl的文件格式为xls,需要注

意的是在导出execl文件时，一个sheet最多导出65535 ,并且会消耗内存。

XSSFWorkbook 对应操作的execl的文件格式为xlsx，最多可以导出 104 万行，不过当导出大量数据时，会消耗大量内存，并占用大量cpu。

SXSSFWorkbook是streaming版本的XSSFWorkbook,它只会保存最新的excel rows在内存里供查看，在此之前的excel rows都会被写入到硬盘里（Windows电脑的话，是写入到C盘根目录下的temp文件夹）。被写入到硬盘里的rows是不可见的/不可访问的。只有还保存在内存里的才可以被访问到。

至于多少行保存在内存里，其他写入硬盘，是由DEFAULT_WINDOW_SIZE决定的。代码也可以在创建SXSSFWorkbook实例时，传入一个int参数，来设定。需注意的是，int rowAccessWindowSize如果传入100，并不是指100行保存在内存里，而是说100的屏幕尺寸下可见的行数。所以现在直接使用SXSSFWorkbook 即可。

SXSSFWorkbook 导入列子：

@RequestMapping("/exportExecl")
	@ResponseBody
	public void exportExecl(@RequestParam Integer deviceId, String beginTime, String endTime,
			@RequestParam(defaultValue = "0") Integer pageNum) {
		ServletOutputStream outputStream = null;
		List<DeviceMonitorDatas> list = null;
		Row row = null;
		SXSSFWorkbook workbook = null;
		Sheet sheet = null;

		try {
			if (!semaphoreExecl.tryAcquire()) {
				response.setCharacterEncoding("utf-8");
				PrintWriter writer = response.getWriter();
				writer.print("当前操作人数太多，请稍后再试！");
				writer.flush();
				writer.close();
				
			} else {
				String times = Dateutil.getStrAllTime(new Date());
				long count = iDeviceDataService.deviceListDataCount(deviceId, Dateutil.getDayMin(beginTime),
						Dateutil.getDayMax(endTime));
				response.setContentType("application/vnd.ms-excel");
				response.setHeader("Content-disposition", "attachment;filename=" + times + "_数据.xlsx");
				workbook = new SXSSFWorkbook(10000);
				sheet = workbook.createSheet();

				DeviceMonitorDatas bean = null;
				setExeclTitle(sheet);

				for (int i = 0; i < count; i = i + 10000) {
					list = iDeviceDataService.exportDeviceListData(i, 100000, deviceId, Dateutil.getDayMin(beginTime),
							Dateutil.getDayMax(endTime));
					if (list != null && !list.isEmpty()) {
						for (int j = 0; j < list.size(); j++) {
							bean = list.get(j);
							row = sheet.createRow(i * 10000 + j + 1);
							setExeclTitle(row, bean);
						}
					}

				}
				outputStream = response.getOutputStream();
				workbook.write(outputStream);
				outputStream.flush();
				outputStream.close();

			}
		} catch (Exception e) {
             e.printStackTrace();
		} finally {
			list = null;
			row = null;
			sheet = null;
			workbook = null;
			semaphoreExecl.release();

		}

	}

其他的一些常用方法：

HSSFCellStyle titleStyle = sheet.getWorkbook().createCellStyle(); //创建一个单元格样式
titleStyle.setVerticalAlignment(VerticalAlignment.CENTER);// 垂直
titleStyle.setAlignment(HorizontalAlignment.CENTER);// 水平
HSSFFont titleFont = sheet.getWorkbook().createFont();
titleFont.setFontName("楷体");//字体名称
titleFont.setFontHeightInPoints((short)18); //字体大小
titleFont.setBold(true);//粗体
titleFont.setColor(HSSFColor.HSSFColorPredefined.BLACK.getIndex());//设置字体颜色
titleStyle.setFont(titleFont);//设置字体样式

HSSFCell cell = row.createCell(0);//创建单元格
cell.setCellValue("辩题");
cell.setCellStyle(titleStyle);//设置单元格的样式

CellRangeAddress cellRangeAddress = new CellRangeAddress(0,3 , 0, 2); //合并单元格参数意义第一行，最后一行，第一列，最后一列
sheet.addMergedRegion(cellRangeAddress); //添加到sheet里。

对于读取execl ，如果文件太大，用官方推荐的把xlsx转为xsv代码：

package com.glodio.util;
import java.io.File;
import java.io.IOException;
import java.io.InputStream;
import java.io.PrintStream;

import javax.xml.parsers.ParserConfigurationException;

import org.apache.poi.openxml4j.exceptions.OpenXML4JException;
import org.apache.poi.openxml4j.opc.OPCPackage;
import org.apache.poi.openxml4j.opc.PackageAccess;
import org.apache.poi.ss.usermodel.DataFormatter;
import org.apache.poi.ss.util.CellAddress;
import org.apache.poi.ss.util.CellReference;
import org.apache.poi.util.SAXHelper;//这个类的位置被改过,直接拷贝官方的代码需要修改
import org.apache.poi.xssf.eventusermodel.ReadOnlySharedStringsTable;
import org.apache.poi.xssf.eventusermodel.XSSFReader;
import org.apache.poi.xssf.eventusermodel.XSSFSheetXMLHandler;
import org.apache.poi.xssf.eventusermodel.XSSFSheetXMLHandler.SheetContentsHandler;
import org.apache.poi.xssf.extractor.XSSFEventBasedExcelExtractor;
import org.apache.poi.xssf.model.StylesTable;
import org.apache.poi.xssf.usermodel.XSSFComment;
import org.xml.sax.ContentHandler;
import org.xml.sax.InputSource;
import org.xml.sax.SAXException;
import org.xml.sax.XMLReader;

/**
 * A rudimentary XLSX -> CSV processor modeled on the
 * POI sample program XLS2CSVmra from the package
 * org.apache.poi.hssf.eventusermodel.examples.
 * As with the HSSF version, this tries to spot missing
 *  rows and cells, and output empty entries for them.
 * <p>
 * Data sheets are read using a SAX parser to keep the
 * memory footprint relatively small, so this should be
 * able to read enormous workbooks.  The styles table and
 * the shared-string table must be kept in memory.  The
 * standard POI styles table class is used, but a custom
 * (read-only) class is used for the shared string table
 * because the standard POI SharedStringsTable grows very
 * quickly with the number of unique strings.
 * <p>
 * For a more advanced implementation of SAX event parsing
 * of XLSX files, see {@link XSSFEventBasedExcelExtractor}
 * and {@link XSSFSheetXMLHandler}. Note that for many cases,
 * it may be possible to simply use those with a custom 
 * {@link SheetContentsHandler} and no SAX code needed of
 * your own!
 */
public class XLSX2CSV {
    /**
     * Uses the XSSF Event SAX helpers to do most of the work
     *  of parsing the Sheet XML, and outputs the contents
     *  as a (basic) CSV.
     */
    private class SheetToCSV implements SheetContentsHandler {
        private boolean firstCellOfRow;
        private int currentRow = -1;
        private int currentCol = -1;
        //这个方法 我们是否要过滤掉前几列数据 ，如果minColumns 为2 那么0,1,2的数据不会读取
        private void outputMissingRows(int number) {
            for (int i=0; i<number; i++) {
                for (int j=0; j<minColumns; j++) {
                    output.append(',');
                }
                output.append('\n');
            }
        }

        @Override
        public void startRow(int rowNum) {
            // If there were gaps, output the missing rows
            //outputMissingRows(rowNum-currentRow-1);
            // Prepare for this row
            firstCellOfRow = true;
            currentRow = rowNum;
            currentCol = -1;
        }

        @Override
        public void endRow(int rowNum) {
            // Ensure the minimum number of columns  每一行执行完后 执行该方法 我们可以做数验证 把不符合数据的进行抛弃掉

            for (int i=currentCol; i<minColumns; i++) {
                output.append(',');
            }
            output.append('\n');
        }

        @Override
        public void cell(String cellReference, String formattedValue,
                XSSFComment comment) {
           //处理每个单元格的数据，如果单元格的数据为空 那么这个方法不会执行
            if (firstCellOfRow) {
                firstCellOfRow = false;
            } else {
                output.append(',');
            }

            // gracefully handle missing CellRef here in a similar way as XSSFCell does
            if(cellReference == null) {
                cellReference = new CellAddress(currentRow, currentCol).formatAsString();
            }

            // Did we miss any cells? //如果前面的单元格数据有为空的，那么这个会执行
            int thisCol = (new CellReference(cellReference)).getCol();
            int missedCols = thisCol - currentCol - 1;
            for (int i=0; i<missedCols; i++) {
                output.append(',');
            }
            currentCol = thisCol;
            
            // Number or string?
            try {
                //noinspection ResultOfMethodCallIgnored
                Double.parseDouble(formattedValue);
                output.append(formattedValue);
            } catch (NumberFormatException e) {
                output.append('"');
                output.append(formattedValue);
                output.append('"');
            }
        }

		@Override
		public void headerFooter(String arg0, boolean arg1, String arg2) {
			// TODO Auto-generated method stub
			
		}
    }


    ///

    private  OPCPackage xlsxPackage;

    /**
     * Number of columns to read starting with leftmost
     */
    private final int minColumns;

    /**
     * Destination for data
     */
    private final PrintStream output;

    /**
     * Creates a new XLSX -> CSV examples
     *
     * @param pkg        The XLSX package to process
     * @param output     The PrintStream to output the CSV to
     * @param minColumns The minimum number of columns to output, or -1 for no minimum
     */
    public XLSX2CSV(OPCPackage pkg, PrintStream output, int minColumns) {
        this.xlsxPackage = pkg;
        this.output = output;
        this.minColumns = minColumns;
    }

    /**
     * Parses and shows the content of one sheet
     * using the specified styles and shared-strings tables.
     *
     * @param styles The table of styles that may be referenced by cells in the sheet
     * @param strings The table of strings that may be referenced by cells in the sheet
     * @param sheetInputStream The stream to read the sheet-data from.

     * @exception java.io.IOException An IO exception from the parser,
     *            possibly from a byte stream or character stream
     *            supplied by the application.
     * @throws SAXException if parsing the XML data fails.
     */
    public void processSheet(
            StylesTable styles,
            ReadOnlySharedStringsTable strings,
            SheetContentsHandler sheetHandler, 
            InputStream sheetInputStream) throws IOException, SAXException {
        DataFormatter formatter = new DataFormatter();
        InputSource sheetSource = new InputSource(sheetInputStream);
        try {
            XMLReader sheetParser = SAXHelper.newXMLReader();
            ContentHandler handler = new XSSFSheetXMLHandler(
                  styles, null, strings, sheetHandler, formatter, false);
            sheetParser.setContentHandler(handler);
            sheetParser.parse(sheetSource);
         } catch(ParserConfigurationException e) {
            throw new RuntimeException("SAX parser appears to be broken - " + e.getMessage());
         }
    }

    /**
     * Initiates the processing of the XLS workbook file to CSV.
     *
     * @throws IOException If reading the data from the package fails.
     * @throws SAXException if parsing the XML data fails.
     */
    public void process() throws IOException, OpenXML4JException, SAXException {
        ReadOnlySharedStringsTable strings = new ReadOnlySharedStringsTable(this.xlsxPackage);
        XSSFReader xssfReader = new XSSFReader(this.xlsxPackage);
        StylesTable styles = xssfReader.getStylesTable();
        XSSFReader.SheetIterator iter = (XSSFReader.SheetIterator) xssfReader.getSheetsData();
        int index = 0;
        while (iter.hasNext()) {
            try (InputStream stream = iter.next()) {
                String sheetName = iter.getSheetName();
                this.output.println();
                this.output.println(sheetName + " [index=" + index + "]:");
                processSheet(styles, strings, new SheetToCSV(), stream);
            }
            ++index;
        }
        iter = null;
        styles = null;
        xssfReader = null;
        strings = null;
       
    }

    
    
    public static void readExecl(InputStream inputStream ) throws Exception {
    
        int minColumns = -1;
        

        // The package open is instantaneous, as it should be.
        try (OPCPackage p = OPCPackage.open(inputStream)) {
            XLSX2CSV xlsx2csv = new XLSX2CSV(p, System.out, minColumns);
            xlsx2csv.process();
        }
        
    }
    
    public static void readExecl(String fileName) throws Exception {
        
    	 File xlsxFile = new File(fileName);
         if (!xlsxFile.exists()) {
             System.err.println("Not found or not a file: " + xlsxFile.getPath());
             return;
         }

         int minColumns = -1;
      
         XLSX2CSV xlsx2csv = null;
         // The package open is instantaneous, as it should be.
         try (OPCPackage p = OPCPackage.open(xlsxFile.getPath(), PackageAccess.READ)) {
              xlsx2csv = new XLSX2CSV(p, System.out, minColumns);
             xlsx2csv.process();
           
         }
         xlsx2csv.xlsxPackage = null;
         xlsx2csv = null;
    }
    
    public static void main(String[] args) throws Exception {
    
        File xlsxFile = new File("E://2.xlsx");
        if (!xlsxFile.exists()) {
            System.err.println("Not found or not a file: " + xlsxFile.getPath());
            return;
        }

        int minColumns = -1;
        if (args.length >= 2)
            minColumns = Integer.parseInt(args[1]);

        // The package open is instantaneous, as it should be.
        //try()这样会自动调用对象的close的方法
        try (OPCPackage p = OPCPackage.open(xlsxFile.getPath(), PackageAccess.READ)) {
            XLSX2CSV xlsx2csv = new XLSX2CSV(p, System.out, minColumns);
            xlsx2csv.process();
            
        }
    }
}

我们只需要重新写 SheetToCSV implements SheetContentsHandler 就可以使用了，OPCPackage.open(xlsxFile.getPath(), PackageAccess.READ) 最好读取文件，如果改成流执行的时候，刚开始是会消耗大量内存，后面就正常了。