爬取Excel表格(加强版)
package test;

import io.ExcelOperat;

import java.io.File;
import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

/**
 * @ProjectName: TutorDualSelectionSystem
 * @Package: test
 * @ClassName: MapNestedDemo
 * @Author: 王团结
 * @Description: Manual course-scheduling check. Flattens two Excel sheets into
 *               "courseId|courseName|className&lt;TAB&gt;teacher" records and can
 *               report records whose teacher differs between the two files.
 * @Date: 2019/7/2 15:17
 * @Version: 1.0
 */
public class MapNestedDemo {

    /** Number of leading rows skipped in every sheet (the header row). */
    private static final int HEADER_ROWS = 1;

    /** Column indexes read from each row; names follow the header printed by compare(). */
    private static final int COURSE_ID_COL = 1;
    private static final int COURSE_NAME_COL = 2;
    private static final int CLASS_NAMES_COL = 3;
    private static final int TEACHER_COL = 13;

    /**
     * Reads both hard-coded workbooks and prints their row counts.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        // An earlier run used "2019-2020学年第一学期教材征订计划3.xls" as the first input.
        String path_01 = "C:\\Users\\ASUS\\Desktop\\手工排课.xls";
        String path_02 = "C:\\Users\\ASUS\\Desktop\\startClassPlan_fb.xls";

        // Iterate over the first file.
        System.out.println("第一个文件迭代输出");
        System.out.println("----------------------------------------------------------------------------------------------");
        String[] put_01 = crow(path_01);

        // Iterate over the second file.
        System.out.println("第二个文件迭代输出");
        System.out.println("----------------------------------------------------------------------------------------------");
        String[] put_02 = crow(path_02);

        // The comparison step is disabled in the original; re-enable to print mismatches.
        // compare(put_01, put_02);
    }

    /**
     * Loads one workbook and flattens it into one record per (row, class name).
     *
     * <p>The class-name column holds a comma-separated list; every element yields
     * its own record of the form {@code courseId|courseName|className<TAB>teacher}.
     * If the file cannot be read, an error is printed and an empty array is returned.
     *
     * @param path location of the .xls file
     * @return the flattened records, never {@code null}
     */
    private static String[] crow(String path) {
        File file_01 = new File(path);
        String[][] excel = new String[0][];
        try {
            excel = ExcelOperat.getData(file_01, HEADER_ROWS);
        } catch (IOException e) {
            System.out.println("--------------------------------------------------------------------------");
            System.out.println("读取错误!");
            // Keep the cause visible instead of dropping it silently.
            System.err.println(path + ": " + e);
        }

        int rowLength = excel.length;
        // Print the total number of rows.
        System.out.println("文件" + path + "总行数" + rowLength);
        System.out.println("--------------------------------------------------------------------------");

        // A growable list replaces the former fixed 3000-slot buffer, which
        // overflowed as soon as a workbook produced more records than that.
        List<String> total = new ArrayList<String>();
        for (int i = 0; i < rowLength; i++) {
            String[] row = excel[i];
            String prefix = cellAt(row, COURSE_ID_COL) + "|" + cellAt(row, COURSE_NAME_COL) + "|";
            String teacher = cellAt(row, TEACHER_COL);
            String[] classNames = cellAt(row, CLASS_NAMES_COL).split(",");
            for (int j = 0; j < classNames.length; j++) {
                total.add(prefix + classNames[j] + "\t" + teacher);
                // Debug aid, disabled in the original:
                // System.out.println((total.size() - 1) + total.get(total.size() - 1));
            }
        }
        return total.toArray(new String[total.size()]);
    }

    /**
     * Returns the cell at {@code index}, or an empty string when the row is too short.
     */
    private static String cellAt(String[] row, int index) {
        return index < row.length ? row[index] : "";
    }

    /**
     * Prints every pair of records that share the same key (text before the first
     * tab) but whose last tab-separated field differs.
     *
     * <p>When the field after the key in a {@code put_01} record starts with "外聘",
     * nothing is printed; instead that text is replaced inside {@code put_01[i]} by
     * the matching field from {@code put_02}. This mutates the caller's array.
     *
     * @param put_01 records from the first file (may be modified)
     * @param put_02 records from the second file
     */
    private static void compare(String[] put_01, String[] put_02) {
        int m = 0;
        System.out.println("\t\t\t手工排课 .xls" + "\t\t\t\t\t\t\t\t\t\t" + "startClassPlan_fb.xls");
        System.out.println("序号" + "\t|课程号|课程名|班级名\t教师姓名" + "\t\t\t\t\t" + "序号" + "\t|课程号|课程名|班级名\t教师姓名");

        // put_02 is never modified, so split it once instead of once per outer iteration.
        // Limit -1 keeps a trailing empty teacher field; the default split drops it,
        // which made index 1 go out of bounds for records without a teacher.
        String[][] secondParts = new String[put_02.length][];
        for (int j = 0; j < put_02.length; j++) {
            secondParts[j] = put_02[j].split("\t", -1);
        }

        for (int i = 0; i < put_01.length; i++) {
            String[] split = put_01[i].split("\t", -1);
            for (int j = 0; j < put_02.length; j++) {
                String[] split1 = secondParts[j];
                if (!split[0].equals(split1[0])) {
                    continue;
                }
                if (split[1].startsWith("外聘")) {
                    put_01[i] = put_01[i].replace(split[1], split1[1]);
                } else if (!split[split.length - 1].equals(split1[split1.length - 1])) {
                    System.out.println((m++) + "\t|" + put_01[i] + "\t\t\t\t\t" + put_02[j]);
                }
            }
        }
    }
}
package io;

import java.io.BufferedInputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.IOException;
import java.text.DecimalFormat;
import java.text.SimpleDateFormat;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Date;
import java.util.List;

import org.apache.poi.hssf.usermodel.HSSFCell;
import org.apache.poi.hssf.usermodel.HSSFDateUtil;
import org.apache.poi.hssf.usermodel.HSSFRow;
import org.apache.poi.hssf.usermodel.HSSFSheet;
import org.apache.poi.hssf.usermodel.HSSFWorkbook;
import org.apache.poi.poifs.filesystem.POIFSFileSystem;

/**
 * @ProjectName: TutorDualSelectionSystem
 * @Package: io
 * @ClassName: ExcelOperat
 * @Author: 王团结
 * @Description: Reads the contents of an Excel (.xls) workbook into a String matrix.
 * @Date: 2019/7/2 14:39
 * @Version: 1.0
 */
public class ExcelOperat {

    /**
     * Reads every sheet of an .xls workbook into a rectangular String matrix.
     *
     * <p>The outer index is the row and the inner index is the column. In each
     * sheet the first {@code ignoreRows} rows are skipped. A row whose first cell
     * is blank is dropped entirely. Dates are rendered as {@code yyyy-MM-dd},
     * other numbers without decimals, booleans as "Y"/"N", and trailing spaces
     * are removed from every value. All returned rows have the same length;
     * missing cells are empty strings.
     *
     * @param file       source Excel file
     * @param ignoreRows number of leading rows to skip per sheet, e.g. 1 for a header row
     * @return the cell contents, never {@code null}
     * @throws FileNotFoundException if the file cannot be opened
     * @throws IOException           if the workbook cannot be read
     */
    public static String[][] getData(File file, int ignoreRows)
            throws FileNotFoundException, IOException {
        List<String[]> result = new ArrayList<String[]>();
        int rowSize = 0;

        // The formatters do not depend on the cell, so build them once per call.
        SimpleDateFormat dateFormat = new SimpleDateFormat("yyyy-MM-dd");
        DecimalFormat numberFormat = new DecimalFormat("0");

        BufferedInputStream in = new BufferedInputStream(new FileInputStream(file));
        try {
            // Open the workbook.
            POIFSFileSystem fs = new POIFSFileSystem(in);
            HSSFWorkbook wb = new HSSFWorkbook(fs);

            for (int sheetIndex = 0; sheetIndex < wb.getNumberOfSheets(); sheetIndex++) {
                HSSFSheet st = wb.getSheetAt(sheetIndex);
                // Leading rows are headers and are not read.
                for (int rowIndex = ignoreRows; rowIndex <= st.getLastRowNum(); rowIndex++) {
                    HSSFRow row = st.getRow(rowIndex);
                    if (row == null) {
                        continue;
                    }
                    int tempRowSize = row.getLastCellNum() + 1;
                    if (tempRowSize > rowSize) {
                        rowSize = tempRowSize;
                    }
                    String[] values = new String[rowSize];
                    Arrays.fill(values, "");
                    boolean hasValue = false;
                    for (short columnIndex = 0; columnIndex <= row.getLastCellNum(); columnIndex++) {
                        String value = cellToString(row.getCell(columnIndex), dateFormat, numberFormat);
                        // A blank first column marks the row as not worth keeping.
                        if (columnIndex == 0 && value.trim().equals("")) {
                            break;
                        }
                        values[columnIndex] = rightTrim(value);
                        hasValue = true;
                    }
                    if (hasValue) {
                        result.add(values);
                    }
                }
            }
        } finally {
            // Release the file handle even when POI fails while parsing.
            in.close();
        }

        // Rows collected before a wider row was seen are shorter than rowSize;
        // pad them so callers can index any column of any row safely.
        String[][] returnArray = new String[result.size()][];
        for (int i = 0; i < returnArray.length; i++) {
            String[] row = result.get(i);
            if (row.length < rowSize) {
                String[] padded = new String[rowSize];
                Arrays.fill(padded, "");
                System.arraycopy(row, 0, padded, 0, row.length);
                row = padded;
            }
            returnArray[i] = row;
        }
        return returnArray;
    }

    /**
     * Converts one cell to its textual form; a {@code null} cell yields "".
     */
    private static String cellToString(HSSFCell cell, SimpleDateFormat dateFormat,
                                       DecimalFormat numberFormat) {
        if (cell == null) {
            return "";
        }
        // Note from the original author: this must be set, otherwise text may come out garbled.
        cell.setEncoding(HSSFCell.ENCODING_UTF_16);
        switch (cell.getCellType()) {
            case HSSFCell.CELL_TYPE_STRING:
                return cell.getStringCellValue();
            case HSSFCell.CELL_TYPE_NUMERIC:
                if (HSSFDateUtil.isCellDateFormatted(cell)) {
                    Date date = cell.getDateCellValue();
                    return date != null ? dateFormat.format(date) : "";
                }
                return numberFormat.format(cell.getNumericCellValue());
            case HSSFCell.CELL_TYPE_FORMULA:
                // Prefer the formula's string result; fall back to the numeric one.
                // NOTE(review): relies on getStringCellValue() returning "" for a
                // numeric formula in the POI version in use - confirm when upgrading.
                if (!cell.getStringCellValue().equals("")) {
                    return cell.getStringCellValue();
                }
                return cell.getNumericCellValue() + "";
            case HSSFCell.CELL_TYPE_BOOLEAN:
                return cell.getBooleanCellValue() ? "Y" : "N";
            case HSSFCell.CELL_TYPE_BLANK:
            case HSSFCell.CELL_TYPE_ERROR:
            default:
                return "";
        }
    }

    /**
     * Removes trailing space characters (U+0020 only) from a string.
     *
     * @param str the string to process; {@code null} is treated as empty
     * @return the string without trailing spaces
     */
    public static String rightTrim(String str) {
        if (str == null) {
            return "";
        }
        int length = str.length();
        for (int i = length - 1; i >= 0; i--) {
            if (str.charAt(i) != 0x20) {
                break;
            }
            length--;
        }
        return str.substring(0, length);
    }
}