import java.io.BufferedReader;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.IOException;
import java.sql.Timestamp;
import java.text.SimpleDateFormat;
import java.util.Calendar;
import java.util.Date;
import java.util.GregorianCalendar;
import java.util.TimeZone;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
/**
 * Email spider: reads a saved HTML file line by line and prints every
 * e-mail address it finds to standard output, one address per line.
 */
public class EmailSpider {

    /** File scanned when no path is supplied on the command line. */
    private static final String DEFAULT_INPUT = "F:\\index.html";

    /**
     * Matches e-mail addresses: word characters, dots and hyphens on both
     * sides of the {@code @}, ending in a dot followed by word characters.
     * Compiled once here instead of once per input line.
     */
    private static final Pattern EMAIL =
            Pattern.compile("[\\w[.-]]+@[\\w[.-]]+\\.[\\w]+");

    /**
     * Scans a file for e-mail addresses and prints each match.
     *
     * @param args optional; {@code args[0]} is the path of the file to scan.
     *             When absent, {@code F:\index.html} is used.
     */
    public static void main(String[] args) {
        String path = (args != null && args.length > 0) ? args[0] : DEFAULT_INPUT;

        // try-with-resources closes the reader (and the underlying file
        // handle) on every exit path, including when readLine() throws.
        // NOTE(review): FileReader decodes with the platform default charset.
        try (BufferedReader reader = new BufferedReader(new FileReader(path))) {
            String line;
            while ((line = reader.readLine()) != null) { // read whole lines
                parse(line);
            }
        } catch (FileNotFoundException e) {
            e.printStackTrace();
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Prints every e-mail address found in {@code line}, one per output line.
     *
     * @param line a single line of input text
     */
    private static void parse(String line) {
        Matcher matcher = EMAIL.matcher(line);
        while (matcher.find()) {
            System.out.println(matcher.group()); // the full matched address
        }
    }
}
// Extracting e-mail addresses from a web page
// (Source page note: latest recommended article published 2023-04-20 08:31:37)