import java.io.BufferedReader;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Scans a text file (for example a saved HTML page) line by line and prints
 * every substring that matches {@link #EMAIL_PATTERN} to standard output,
 * one match per line.
 */
public class EmailSpider {

    /** File that is read when no path is given on the command line. */
    private static final String DEFAULT_INPUT_PATH = "D:\\share\\courseware\\1043633.html";

    /**
     * Pattern used to recognise e-mail addresses: one or more word characters,
     * dots or hyphens, an {@code @}, again one or more word characters, dots or
     * hyphens, then a dot followed by one or more word characters.
     * Compiled once because it is applied to every line of the input.
     */
    private static final Pattern EMAIL_PATTERN =
            Pattern.compile("[\\w[.-]]+@[\\w[.-]]+\\.[\\w]+");

    /**
     * Reads the input file line by line and prints every match found.
     *
     * @param args optional; if {@code args[0]} is present it is used as the path
     *             of the file to scan, otherwise {@link #DEFAULT_INPUT_PATH} is used
     */
    public static void main(String[] args) {
        String path = (args != null && args.length > 0) ? args[0] : DEFAULT_INPUT_PATH;

        // try-with-resources closes the reader on both normal and exceptional exit.
        try (BufferedReader br = new BufferedReader(new FileReader(path))) {
            String line;
            while ((line = br.readLine()) != null) {
                parse(line);
            }
        } catch (FileNotFoundException e) {
            System.err.println("Input file not found: " + path + " (" + e.getMessage() + ")");
        } catch (IOException e) {
            System.err.println("Failed to read " + path + ": " + e);
        }
    }

    /**
     * Prints each match of {@link #EMAIL_PATTERN} in {@code line} to standard
     * output, one per line, in order of appearance.
     *
     * @param line the text to scan
     */
    private static void parse(String line) {
        for (String email : extractEmails(line)) {
            System.out.println(email);
        }
    }

    /**
     * Collects every match of {@link #EMAIL_PATTERN} in the given text.
     *
     * @param line the text to scan; {@code null} is treated as containing no matches
     * @return the matches in order of appearance (duplicates are kept); never {@code null}
     */
    static List<String> extractEmails(String line) {
        List<String> emails = new ArrayList<String>();
        if (line == null) {
            return emails;
        }
        Matcher m = EMAIL_PATTERN.matcher(line);
        while (m.find()) {
            emails.add(m.group());
        }
        return emails;
    }

}
使用正则表达式进行某网页中的email邮箱抽取
原文地址:https://www.cnblogs.com/XiDaPuBen/p/8678762.html