爬取Excel表格(加强版)

  

package test;

import io.ExcelOperat;

import java.io.File;
import java.io.IOException;
import java.util.HashMap;
import java.util.Map;

/**
 * @ProjectName: TutorDualSelectionSystem
 * @Package: test
 * @ClassName: MapNestedDemo
 * @Author: 王团结
 * @Description: 手工排课类
 * @Date: 2019/7/2 15:17
 * @Version: 1.0
 */
public class MapNestedDemo {

    public static void main(String[] args) {


//
//        String path_01="C:\Users\ASUS\Desktop\2019-2020学年第一学期教材征订计划3.xls";
//        String path_02="C:\Users\ASUS\Desktop\startClassPlan_fb.xls";

//
//        String path_01="C:\Users\ASUS\Desktop\手工排课.xls";
//        String path_02="C:\Users\ASUS\Desktop\startClassPlan_fb.xls";
        String path_01="C:\Users\ASUS\Desktop\手工排课.xls";
        String path_02="C:\Users\ASUS\Desktop\startClassPlan_fb.xls";



        //第一个文件迭代输出
        System.out.println("第一个文件迭代输出");
        System.out.println("----------------------------------------------------------------------------------------------");
        String[] put_01 = crow(path_01);

        //第二个文件迭代输出
        System.out.println("第二个文件迭代输出");
        System.out.println("----------------------------------------------------------------------------------------------");
        String[] put_02= crow(path_02);

//
//
        compare(put_01,put_02);

    }

    private static String[] crow(String path) {
        File file_01 = new File(path);

        String[][] excel = new String[0][];
        try {
            excel = ExcelOperat.getData(file_01, 1);
        } catch (IOException e) {
            System.out.println("--------------------------------------------------------------------------");
            System.out.println("读取错误!");
        }

        int rowLength = excel.length;
        //输出总行数

        System.out.println("文件"+path+"总行数" + rowLength);
        System.out.println("--------------------------------------------------------------------------");
        String[] total=new String[3000];
        int m=0;
        for (int i=0;i<rowLength;i++){
            String[] split = excel[i][3].split(",");
            for(int j=0;j<split.length;j++){
                total[m++]= excel[i][1]+"|"+excel[i][2]+"|"+split[j]+"	"+excel[i][13];
            }
        }
        String[] totals=new String[m];
        for (int i=0;i<m;i++){
                totals[i]=total[i];
//            System.out.println(i+totals[i]);
        }
        return totals;
    }


    //比较
    private static void compare(String[] put_01,String[] put_02 ) {
        int m=0;

        System.out.println("			手工排课 .xls"+"										"+"startClassPlan_fb.xls");
        System.out.println("序号"+"	|课程号|课程名|班级名	教师姓名"+"					"+"序号"+"	|课程号|课程名|班级名	教师姓名");
        for(int i=0;i<put_01.length;i++){
            String[] split = put_01[i].split("	");
          for (int j=0;j<put_02.length;j++){
              String[] split1 = put_02[j].split("	");
              if(split[0].equals(split1[0])){
                  if(split[1].startsWith("外聘")){
                      put_01[i]=put_01[i].replace(split[1],split1[1]);
                  }else if(!split[split.length-1].equals(split1[split1.length-1])){
                      System.out.println((m++)+"	|" +put_01[i]+"					"+put_02[j]);
                  }
              }

          }
        }

    }




}
package io;

import java.io.BufferedInputStream;

import java.io.File;

import java.io.FileInputStream;

import java.io.FileNotFoundException;

import java.io.IOException;

import java.text.DecimalFormat;

import java.text.SimpleDateFormat;

import java.util.ArrayList;

import java.util.Arrays;

import java.util.Date;

import java.util.List;


import org.apache.poi.hssf.usermodel.HSSFCell;

import org.apache.poi.hssf.usermodel.HSSFDateUtil;

import org.apache.poi.hssf.usermodel.HSSFRow;

import org.apache.poi.hssf.usermodel.HSSFSheet;

import org.apache.poi.hssf.usermodel.HSSFWorkbook;

import org.apache.poi.poifs.filesystem.POIFSFileSystem;

/**
 * Reads the contents of Excel {@code .xls} workbooks through the Apache POI
 * HSSF API and exposes them as plain string tables.
 *
 * @ProjectName: TutorDualSelectionSystem
 * @Package: io
 * @ClassName: ExcelOperat
 * @Author: 王团结
 * @Description: reads Excel content
 * @Date: 2019/7/2 14:39
 * @Version: 1.0
 */
public class ExcelOperat {

    /**
     * Reads every sheet of an Excel workbook into a table of strings. The
     * outer array index is the row, the inner array index is the column.
     *
     * <p>Rows whose first cell is blank are dropped. Date-formatted numeric
     * cells are rendered as {@code yyyy-MM-dd}, other numeric cells without
     * fraction digits, booleans as {@code Y}/{@code N}; blank and error cells
     * become empty strings. Trailing spaces are removed from every value.
     * All returned rows are padded with empty strings to the same width.
     *
     * @param file       the source Excel file
     * @param ignoreRows number of leading rows to skip on each sheet, e.g. 1
     *                   to skip a header row; negative values are treated as 0
     * @return the cell contents that were read
     * @throws FileNotFoundException if the file cannot be opened
     * @throws IOException           if the workbook cannot be read
     */
    public static String[][] getData(File file, int ignoreRows)
            throws FileNotFoundException, IOException {

        List<String[]> result = new ArrayList<String[]>();
        int rowSize = 0;
        int firstRow = Math.max(ignoreRows, 0);

        // One formatter pair per call instead of one per cell; kept local
        // because these formatter classes are not safe to share across threads.
        SimpleDateFormat dateFormat = new SimpleDateFormat("yyyy-MM-dd");
        DecimalFormat numberFormat = new DecimalFormat("0");

        BufferedInputStream in = new BufferedInputStream(new FileInputStream(file));
        try {
            // Open the workbook.
            HSSFWorkbook wb = new HSSFWorkbook(new POIFSFileSystem(in));

            for (int sheetIndex = 0; sheetIndex < wb.getNumberOfSheets(); sheetIndex++) {
                HSSFSheet st = wb.getSheetAt(sheetIndex);

                // Leading rows (e.g. the title row) are skipped.
                for (int rowIndex = firstRow; rowIndex <= st.getLastRowNum(); rowIndex++) {
                    HSSFRow row = st.getRow(rowIndex);
                    if (row == null) {
                        continue;
                    }

                    int lastCellNum = row.getLastCellNum();
                    // NOTE(review): POI documents getLastCellNum() as "last index plus
                    // one"; the extra +1 is kept so the width seen by existing callers
                    // does not change - confirm against the POI version in use.
                    int tempRowSize = lastCellNum + 1;
                    if (tempRowSize > rowSize) {
                        rowSize = tempRowSize;
                    }

                    String[] values = new String[rowSize];
                    Arrays.fill(values, "");
                    boolean hasValue = false;

                    for (short columnIndex = 0; columnIndex <= lastCellNum; columnIndex++) {
                        String value = cellToString(row.getCell(columnIndex), dateFormat, numberFormat);

                        // A blank first cell marks the row as empty: skip it entirely.
                        if (columnIndex == 0 && value.trim().equals("")) {
                            break;
                        }
                        values[columnIndex] = rightTrim(value);
                        hasValue = true;
                    }

                    if (hasValue) {
                        result.add(values);
                    }
                }
            }
        } finally {
            // Always release the file handle, even when POI fails mid-read.
            in.close();
        }

        // rowSize grows while reading, so earlier rows may be narrower than later
        // ones; pad them so callers can index any column up to the final width.
        String[][] returnArray = new String[result.size()][];
        for (int i = 0; i < returnArray.length; i++) {
            returnArray[i] = padRow(result.get(i), rowSize);
        }
        return returnArray;
    }

    /** Converts one cell to its string form; a {@code null} cell yields an empty string. */
    private static String cellToString(HSSFCell cell, SimpleDateFormat dateFormat,
                                       DecimalFormat numberFormat) {
        if (cell == null) {
            return "";
        }

        // Original author's note: this must be set, otherwise garbled text may appear.
        cell.setEncoding(HSSFCell.ENCODING_UTF_16);

        switch (cell.getCellType()) {
            case HSSFCell.CELL_TYPE_STRING:
                return cell.getStringCellValue();

            case HSSFCell.CELL_TYPE_NUMERIC:
                if (HSSFDateUtil.isCellDateFormatted(cell)) {
                    Date date = cell.getDateCellValue();
                    return date != null ? dateFormat.format(date) : "";
                }
                return numberFormat.format(cell.getNumericCellValue());

            case HSSFCell.CELL_TYPE_FORMULA:
                return formulaToString(cell);

            case HSSFCell.CELL_TYPE_BOOLEAN:
                return cell.getBooleanCellValue() ? "Y" : "N";

            case HSSFCell.CELL_TYPE_BLANK:
            case HSSFCell.CELL_TYPE_ERROR:
            default:
                return "";
        }
    }

    /**
     * Reads the cached result of a formula cell: the string result when it is
     * non-empty, otherwise the numeric result, otherwise an empty string.
     */
    private static String formulaToString(HSSFCell cell) {
        String text;
        try {
            text = cell.getStringCellValue();
        } catch (RuntimeException notAString) {
            // POI documents that reading a string from a non-string formula
            // result throws; fall through to the numeric result instead.
            text = "";
        }
        if (text != null && !text.equals("")) {
            return text;
        }
        try {
            return cell.getNumericCellValue() + "";
        } catch (RuntimeException notANumber) {
            // Neither a string nor a number could be read (e.g. an error result).
            return "";
        }
    }

    /** Returns {@code row} unchanged if it is at least {@code width} long, else a copy padded with "". */
    private static String[] padRow(String[] row, int width) {
        if (row.length >= width) {
            return row;
        }
        String[] padded = new String[width];
        Arrays.fill(padded, "");
        System.arraycopy(row, 0, padded, 0, row.length);
        return padded;
    }

    /**
     * Removes trailing space characters (U+0020 only) from a string.
     *
     * @param str the string to process; may be {@code null}
     * @return the string without trailing spaces, or an empty string when
     *         {@code str} is {@code null}
     */
    public static String rightTrim(String str) {
        if (str == null) {
            return "";
        }
        int end = str.length();
        while (end > 0 && str.charAt(end - 1) == 0x20) {
            end--;
        }
        return str.substring(0, end);
    }
}
原文地址:https://www.cnblogs.com/King-boy/p/11131927.html