jxl 删除excel重复的行

最新推荐文章于 2023-12-24 13:01:19 发布

陈蒙_

最新推荐文章于 2023-12-24 13:01:19 发布

阅读量3k

点赞数 1

分类专栏：其他 Java 编程

本文为博主原创文章，欢迎转载，请保留原文出处。

本文链接：https://blog.csdn.net/zhaizu/article/details/27657647

版权

Java 编程同时被 2 个专栏收录

26 篇文章 0 订阅

订阅专栏

其他

22 篇文章 0 订阅

订阅专栏

思路：先从前到后检索excel文件，找出重复的行的行号（从0开始），然后删除之；

注意：使用removeRow(int row)删除多行时，需要从后往前遍历，因为从前往后删除时行号就乱了，跟检索时的行号不一致了，导致误删或漏删，具体见代码第79-82行；

	/**
	 * 得到excel中重复的行号，判重标准为第0列数据
	 * @param filename
	 * @return
	 */
	public static final ArrayList<Integer> getDuplicateRows(String filename) {
		
		/**
		 * 从前往后找出重复的行号
		 */
		ArrayList<String> ids = new ArrayList<String>();
		ArrayList<Integer> duplicateRows = new ArrayList<Integer>();

		File file = new File(filename);

		// 读excel文件
		if (file.exists() == true) {

			// 文件存在，读取其中原始数据
			Workbook book = null;
			try {
				System.out.println("excel文件存在: " + file.getAbsolutePath());
				book = Workbook.getWorkbook(file);
			} catch (BiffException e) {
				e.printStackTrace();
			} catch (IOException e) {
				e.printStackTrace();
			}
			Sheet sheet = book.getSheet(0);

			int rows = sheet.getRows();
			
			// 取出excel中的第0列数据
			for (int i = 0; i < rows; i++) {
				
				// 第0列数据
				Cell idCell = sheet.getCell(0, i);
				String id = idCell.getContents().trim();
								
				if (ids.contains(id) == false) {
					ids.add(id);
				} else {
					duplicateRows.add(i);
				}
			}
			
			// 关闭文件
			book.close();
			
			// 释放空间
			ids.clear();
		} else {
			System.err.println("文件不存在。。。");
			return duplicateRows;
		}
		
		return duplicateRows;
	}
	
	/**
	 * 删除filename文件rowsToRemove中的行
	 * @param filename
	 * @param rowsToRemove
	 * @return
	 */
	public static int removeRows(String filename, ArrayList<Integer> rowsToRemove) {
		Workbook wb = null;
		WritableWorkbook book = null;
		WritableSheet wsheet = null;
		File f = new File(filename);

		try {
			wb = Workbook.getWorkbook(f);
			book = Workbook.createWorkbook(f, wb);
			wsheet = book.getSheet(0);
			
			System.out.println("to delete rows: " + rowsToRemove);
			
			for (int i = rowsToRemove.size() - 1; i >= 0; i--) {
				int row = rowsToRemove.get(i);
				wsheet.removeRow(row);
			}
			
			// 关闭文件
			book.write();
			book.close();
			
			// 释放空间
			rowsToRemove.clear();

		} catch (BiffException e) {
			e.printStackTrace();
		} catch (IOException e) {
			e.printStackTrace();
		} catch (WriteException e) {
			e.printStackTrace();
		}
		
		return 0;
	}
	
	/**
	 * 删除某excel中相同的行，从前往后检索，删除后面重复的行
	 * 判重条件是第0列数据
	 * @param filename
	 * @return
	 */
	public static int removeDuplicateRows(String filename) {
		
		// 从前往后找出重复的行号
		ArrayList<Integer> duplicateRows = getDuplicateRows(filename);
		
		// 根据行号删除重复的行
		removeRows(filename, duplicateRows);
		
		return 0;
	}