网页Email抓取 java

import java.io.BufferedReader;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.IOException;
import java.util.regex.Matcher;
import java.util.regex.Pattern;


/**
 * Scans a saved web page line by line and prints every e-mail address it
 * finds to standard output, one address per line.
 */
public class EmailSpilder {
    /** Page that is scanned when no path is given on the command line. */
    private static final String DEFAULT_PAGE = "D:\\大家留下email吧。。.htm";

    /**
     * E-mail matcher: one or more word characters, dots or hyphens, an
     * {@code @}, then a domain of the same characters ending in a dot and a
     * run of word characters. Compiled once because it is applied to every
     * line of the input.
     */
    private static final Pattern EMAIL = Pattern.compile("[\\w[.-]]+@[\\w[.-]]+\\.[\\w]+");

    /**
     * Reads the page and prints each e-mail address found in it.
     *
     * @param args optional; {@code args[0]} is the path of the file to scan.
     *             When absent, {@link #DEFAULT_PAGE} is used.
     */
    public static void main(String[] args) {
        String path = (args != null && args.length > 0) ? args[0] : DEFAULT_PAGE;

        // try-with-resources guarantees the reader is closed even when reading fails.
        try (BufferedReader reader = new BufferedReader(new FileReader(path))) {
            String line;
            while ((line = reader.readLine()) != null) {
                parse(line);
            }
        } catch (IOException e) {
            // FileNotFoundException is an IOException, so a missing file lands here too.
            System.err.println("Could not read " + path);
            e.printStackTrace();
        }
    }

    /**
     * Prints every e-mail address contained in a single line of text.
     *
     * @param readLine the line to search; must not be {@code null}
     */
    private static void parse(String readLine) {
        Matcher matcher = EMAIL.matcher(readLine);
        while (matcher.find()) {
            System.out.println(matcher.group());
        }
    }
}
原文地址:https://www.cnblogs.com/lakelise/p/4243014.html