数据驱动---Java读取Excel数据

package com.jason.framework.utils;

import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

import net.sf.json.JSONObject;

import org.apache.log4j.Logger;
import org.apache.poi.ss.usermodel.Cell;
import org.apache.poi.ss.usermodel.DataFormatter;
import org.apache.poi.ss.usermodel.DateUtil;
import org.apache.poi.ss.usermodel.Row;
import org.apache.poi.ss.usermodel.Sheet;
import org.apache.poi.ss.usermodel.Workbook;
import org.apache.poi.ss.usermodel.WorkbookFactory;
import org.apache.poi.xssf.usermodel.XSSFCell;
import org.apache.poi.xssf.usermodel.XSSFRow;
import org.apache.poi.xssf.usermodel.XSSFSheet;
import org.apache.poi.xssf.usermodel.XSSFWorkbook;

import com.jason.framework.constants.constant;
import com.jason.framework.exception.NestedBusinessException;

/**
 * Reads tabular data from an Excel workbook using Apache POI.
 *
 * <p>Two usage styles are offered:
 * <ul>
 *   <li>Instance style: construct with a file path and sheet name, then query single
 *       cells with {@link #getCellData(int, int)} or {@link #getCellData(int, String)}.
 *       The sheet content is parsed lazily on the first query and cached.</li>
 *   <li>Static style: {@link #getExcelToList(String, String)} and
 *       {@link #getDataByValue(String, String, String)} read an {@code .xlsx} file on
 *       every call and return each data row as a header-to-value map.</li>
 * </ul>
 *
 * <p>In both styles the first row of the sheet (row index 0) is treated as the header row.
 */
public class ExcelReader {
    /** 2^53: up to this magnitude every whole-number double converts to a long without loss. */
    private static final double MAX_EXACT_INTEGER = 9007199254740992.0;

    private static  SimpleLogger log = SimpleLogger.getLogger(ExcelReader.class);

    private String filePath;
    private String sheetName;
    private Workbook workBook;
    private Sheet sheet;
    /** Header titles taken from row 0; filled by {@link #getSheetData()}. */
    private List<String> columnHeaderList;
    /** Every row (header included) as a list of cell strings; filled by {@link #getSheetData()}. */
    private List<List<String>> listData;
    /** Every data row (header excluded) keyed by header title; filled by {@link #getSheetData()}. */
    private List<Map<String,String>> mapData;
    /** True once the sheet has been parsed into the caches above. */
    private boolean flag;

    /**
     * Opens the workbook at {@code filePath} and selects the sheet named {@code sheetName}.
     *
     * <p>Loading is best-effort: a failure is printed to stderr and leaves the reader
     * without a sheet, in which case the {@code getCellData} methods return {@code null}.
     *
     * @param filePath  path of the workbook file
     * @param sheetName name of the sheet to read
     */
    public ExcelReader(String filePath, String sheetName) {
        this.filePath = filePath;
        this.sheetName = sheetName;
        this.flag = false;
        this.load();
    }

    /** Loads the workbook and sheet; errors are reported on stderr and otherwise ignored. */
    private void load() {
        FileInputStream inStream = null;
        try {
            inStream = new FileInputStream(new File(filePath));
            workBook = WorkbookFactory.create(inStream);
            sheet = workBook.getSheet(sheetName);
        } catch (Exception e) {
            e.printStackTrace();
        } finally {
            closeQuietly(inStream);
        }
    }

    /** Closes {@code stream} if it is non-null, printing (not propagating) any close failure. */
    private static void closeQuietly(InputStream stream) {
        if (stream == null) {
            return;
        }
        try {
            stream.close();
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Reads one sheet of an {@code .xlsx} file into a list of rows, each row being a map
     * from header title (row 0) to the cell's string value.
     *
     * <p>Rows that do not exist in the sheet are skipped. Cells missing from a data row
     * are reported as empty strings.
     *
     * @param xlsxPath  path of the workbook; must end with {@code .xlsx}
     * @param sheetName name of the sheet to read
     * @return one map per existing data row, in sheet order; empty if there are no data rows
     * @throws NestedBusinessException if the file name does not end with {@code .xlsx}, the
     *         file cannot be read, the sheet does not exist, or data rows exist without a
     *         header row
     */
    public static List<Map<String, String>> getExcelToList(String xlsxPath, String sheetName) {
        if (!xlsxPath.endsWith(".xlsx")) {
            throw new NestedBusinessException("请检查文件名是否正确!");
        }

        XSSFWorkbook xssfWorkbook;
        InputStream is = null;
        try {
            is = new FileInputStream(xlsxPath);
            xssfWorkbook = new XSSFWorkbook(is);
        } catch (IOException e) {
            throw new NestedBusinessException("系统找不到文件异常!", e);
        } finally {
            // The workbook has been read from the stream by now; release the file handle.
            closeQuietly(is);
        }

        XSSFSheet xssfSheet = xssfWorkbook.getSheet(sheetName);
        if (null == xssfSheet) {
            throw new NestedBusinessException("请检查sheet页是否存在!");
        }

        // Parse the header titles once instead of once per data cell.
        XSSFRow headerRow = xssfSheet.getRow(0);
        List<String> titles = new ArrayList<String>();
        if (headerRow != null) {
            for (int cellNum = 0; cellNum < headerRow.getLastCellNum(); cellNum++) {
                titles.add(getCellValue(headerRow.getCell(cellNum)));
            }
        }

        List<Map<String, String>> list = new ArrayList<Map<String, String>>();
        // Iterate over the data rows (everything after the header).
        for (int rowNum = 1; rowNum <= xssfSheet.getLastRowNum(); rowNum++) {
            XSSFRow xssfRow = xssfSheet.getRow(rowNum);
            if (xssfRow == null) {
                continue;
            }
            if (headerRow == null) {
                // Data without a header cannot be keyed; fail with a clear message
                // instead of a NullPointerException.
                throw new NestedBusinessException("请检查表头行是否存在!");
            }
            Map<String, String> rowData = new HashMap<String, String>();
            // Iterate over the columns defined by the header row.
            for (int cellNum = 0; cellNum < titles.size(); cellNum++) {
                rowData.put(titles.get(cellNum), getCellValue(xssfRow.getCell(cellNum)));
            }
            list.add(rowData);
        }
        return list;
    }

    /**
     * Converts a cell to a trimmed string.
     *
     * <ul>
     *   <li>{@code null}, blank and error cells yield {@code ""}.</li>
     *   <li>Date-formatted numeric cells are rendered with a {@link DataFormatter}.</li>
     *   <li>Other numeric cells holding a whole number are rendered without a fractional
     *       part (e.g. {@code 13800000000}, not {@code 1.38E10}); all other numbers use
     *       {@link String#valueOf(double)}.</li>
     *   <li>Formula cells yield the formula text, not the evaluated result.</li>
     * </ul>
     *
     * @param cell the cell to read, may be {@code null}
     * @return the trimmed textual value, never {@code null}
     */
    private static String getCellValue(Cell cell) {
        if (cell == null) {
            return "";
        }
        String cellValue;
        switch (cell.getCellType()) {
            case Cell.CELL_TYPE_NUMERIC:
                if (DateUtil.isCellDateFormatted(cell)) {
                    cellValue = new DataFormatter().formatCellValue(cell);
                } else {
                    double value = cell.getNumericCellValue();
                    // Use long rather than int so large whole numbers (IDs, phone numbers)
                    // are not pushed into scientific notation by an overflowing cast.
                    boolean wholeNumber = value == Math.rint(value)
                            && Math.abs(value) <= MAX_EXACT_INTEGER;
                    cellValue = wholeNumber ? String.valueOf((long) value) : String.valueOf(value);
                }
                break;
            case Cell.CELL_TYPE_STRING:
                cellValue = cell.getStringCellValue();
                break;
            case Cell.CELL_TYPE_BOOLEAN:
                cellValue = String.valueOf(cell.getBooleanCellValue());
                break;
            case Cell.CELL_TYPE_FORMULA:
                cellValue = String.valueOf(cell.getCellFormula());
                break;
            case Cell.CELL_TYPE_BLANK:
            case Cell.CELL_TYPE_ERROR:
                cellValue = "";
                break;
            default:
                cellValue = cell.toString();
                break;
        }
        return cellValue.trim();
    }

    /**
     * Parses the loaded sheet into {@code columnHeaderList}, {@code listData} and
     * {@code mapData}, then marks the caches as populated.
     *
     * <p>If no sheet was loaded the caches are left empty. A data-row cell that lies
     * beyond the last header column is kept in {@code listData} but has no entry in
     * {@code mapData}, because there is no header title to key it by.
     *
     * @return every row of the sheet (header included) as lists of cell strings
     */
    private List<List<String>> getSheetData() {
        listData = new ArrayList<List<String>>();
        mapData = new ArrayList<Map<String, String>>();
        columnHeaderList = new ArrayList<String>();

        if (sheet != null) {
            int numOfRows = sheet.getLastRowNum() + 1;
            for (int i = 0; i < numOfRows; i++) {
                Row row = sheet.getRow(i);
                Map<String, String> rowMap = new HashMap<String, String>();
                List<String> rowValues = new ArrayList<String>();
                if (row != null) {
                    for (int j = 0; j < row.getLastCellNum(); j++) {
                        String value = getCellValue(row.getCell(j));
                        if (i == 0) {
                            columnHeaderList.add(value);
                        } else if (j < columnHeaderList.size()) {
                            rowMap.put(columnHeaderList.get(j), value);
                        }
                        rowValues.add(value);
                    }
                }
                if (i > 0) {
                    mapData.add(rowMap);
                }
                listData.add(rowValues);
            }
        }
        flag = true;

        return listData;
    }

    /**
     * Returns the value of a cell addressed by 1-based row and column numbers.
     * Row 1 is the header row.
     *
     * @param row 1-based row number
     * @param col 1-based column number
     * @return the cell text, or {@code null} if either index is not positive or lies
     *         outside the parsed data
     */
    public String getCellData(int row, int col){
        if (row <= 0 || col <= 0) {
            return null;
        }
        if (!flag) {
            this.getSheetData();
        }
        if (listData.size() >= row && listData.get(row - 1).size() >= col) {
            return listData.get(row - 1).get(col - 1);
        }
        return null;
    }

    /**
     * Returns the value of a cell addressed by data-row number and header title.
     * Here row 1 is the first row <em>after</em> the header.
     *
     * @param row        1-based data-row number (header excluded)
     * @param headerName header title of the wanted column
     * @return the cell text, or {@code null} if the row is not positive, lies outside the
     *         parsed data, or has no value under {@code headerName}
     */
    public String getCellData(int row, String headerName){
        if (row <= 0) {
            return null;
        }
        if (!flag) {
            this.getSheetData();
        }
        if (mapData.size() >= row && mapData.get(row - 1).containsKey(headerName)) {
            return mapData.get(row - 1).get(headerName);
        }
        return null;
    }

    /**
     * Finds the data row that contains {@code vaule} in any column.
     *
     * <p>If several rows match, the last one in sheet order is returned. The result is
     * computed per call; nothing is remembered between calls.
     *
     * @param excelPath path of the {@code .xlsx} workbook
     * @param sheetName name of the sheet to search
     * @param vaule     cell text to look for
     * @return the matching row as a header-to-value map, or an empty map if no row matches
     * @throws NestedBusinessException under the same conditions as
     *         {@link #getExcelToList(String, String)}
     */
    public static Map<String, String> getDataByValue(String excelPath, String sheetName, String vaule){
        Map<String, String> match = new HashMap<String, String>();
        List<Map<String, String>> rows = ExcelReader.getExcelToList(excelPath, sheetName);
        for (Map<String, String> data : rows) {
            if (data.containsValue(vaule)) {
                match = data;
            }
        }
        return match;
    }
}
  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
Java Spark可以通过以下几种方式读取Excel数据: 1. 使用Apache POI库读取Excel数据,然后将数据转换为Spark DataFrame。 2. 使用Excel DataSource API,这是一个基于Spark SQL的插件,可以直接从Excel中加载数据并生成Spark DataFrame。 3. 使用第三方库,例如DataBricks的excelent或者CData的Excel JDBC驱动程序。 下面是使用Apache POI库读取Excel数据的示例代码: ```java import org.apache.spark.sql.Dataset; import org.apache.spark.sql.Row; import org.apache.spark.sql.SparkSession; import org.apache.spark.sql.types.DataTypes; import org.apache.spark.sql.types.StructField; import org.apache.spark.sql.types.StructType; import org.apache.spark.sql.functions.*; import java.util.ArrayList; import java.util.List; import org.apache.poi.ss.usermodel.*; import org.apache.poi.xssf.usermodel.XSSFWorkbook; public class ExcelReader { public static void main(String[] args) { SparkSession spark = SparkSession.builder() .appName("Excel Reader") .master("local[*]") .getOrCreate(); String filePath = "path/to/excel/file.xlsx"; String sheetName = "Sheet1"; // Read Excel file into a Workbook object Workbook workbook = null; try { workbook = new XSSFWorkbook(filePath); } catch (Exception e) { e.printStackTrace(); } // Get the sheet from the workbook Sheet sheet = workbook.getSheet(sheetName); // Get the header row Row headerRow = sheet.getRow(0); // Create a list of StructField objects to define the schema List<StructField> fields = new ArrayList<>(); for (Cell cell : headerRow) { String columnName = cell.getStringCellValue(); StructField field = DataTypes.createStructField(columnName, DataTypes.StringType, true); fields.add(field); } // Create the schema StructType schema = DataTypes.createStructType(fields); // Read the data rows and convert them to Spark Rows List<Row> rows = new ArrayList<>(); for (int i = 1; i <= sheet.getLastRowNum(); i++) { Row row = sheet.getRow(i); List<String> rowValues = new ArrayList<>(); for (Cell cell : row) { rowValues.add(cell.getStringCellValue()); } Row sparkRow = RowFactory.create(rowValues.toArray()); rows.add(sparkRow); } // Create the DataFrame Dataset<Row> df = 
spark.createDataFrame(rows, schema); // Show the DataFrame df.show(); // Close the workbook try { workbook.close(); } catch (Exception e) { e.printStackTrace(); } } } ``` 注意:这段代码仅适用于读取XLSX格式的Excel文件,如果要读取XLS格式的文件,需要使用HSSF而不是XSSF。

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值