用正则表达式提取网页中的邮箱地址

最新推荐文章于 2025-11-01 17:29:00 发布

原创 · 最新推荐文章于 2025-11-01 17:29:00 发布 · 6.8k 阅读

2 ·

CC 4.0 BY-SA版权

文章标签：

#正则表达式 #string #regex #import #class #null

Java 专栏收录该内容

52 篇文章

订阅专栏

本文介绍了一个Java程序，该程序利用正则表达式从指定的HTML文件中提取所有的邮箱地址。通过读取文件内容并应用特定的正则表达式模式，程序能够准确地匹配并打印出所有找到的邮箱地址。

import java.io.BufferedReader;
import java.io.FileReader;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import java.util.regex.*;

/**
 * Extracts e-mail addresses from a locally saved web page using a regular expression
 * and prints each address on its own line.
 */
public class MyRegex {

    /** File that is read when no file name is passed on the command line. */
    private static final String DEFAULT_FILE = "e:/1.htm";

    /**
     * E-mail pattern: a local part made of word characters optionally joined by
     * '-', '+', '.' or an apostrophe, then '@', then a domain of word-character labels
     * joined by '-' or '.', containing at least one dot.
     * Compiled once because a Pattern is immutable and reusable.
     */
    private static final Pattern EMAIL_PATTERN =
            Pattern.compile("\\w+([-+.']\\w+)*@\\w+([-.]\\w+)*\\.\\w+([-.]\\w+)*");

    /**
     * Reads a web page from disk and prints every e-mail address found in it.
     *
     * @param args optional; {@code args[0]} is the path of the file to scan.
     *             When absent, {@code e:/1.htm} is used.
     */
    public static void main(String[] args) {
        String fileName = args.length > 0 ? args[0] : DEFAULT_FILE;
        try {
            String content = read(fileName);
            for (String email : extractEmails(content)) {
                System.out.println(email);
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Finds all e-mail addresses in the given text.
     *
     * @param content text to scan
     * @return the matched addresses in order of appearance (duplicates are kept);
     *         empty if there is no match
     */
    static List<String> extractEmails(String content) {
        List<String> emails = new ArrayList<String>();
        Matcher matcher = EMAIL_PATTERN.matcher(content);
        while (matcher.find()) {
            emails.add(matcher.group());
        }
        return emails;
    }

    /**
     * Reads the whole content of a text file.
     *
     * <p>NOTE: the file is decoded by {@link FileReader}, i.e. with the JVM default charset.
     *
     * @param fileName name of the text file, including its path
     * @return the file content, with every line terminated by a carriage return
     *         followed by a line feed
     * @throws IOException if the file cannot be opened or read
     */
    public static String read(String fileName) throws IOException {
        StringBuilder sb = new StringBuilder();
        // try-with-resources closes the reader even when readLine() throws.
        try (BufferedReader br = new BufferedReader(new FileReader(fileName))) {
            String line;
            while ((line = br.readLine()) != null) {
                // readLine() strips the line terminator, so put one back.
                sb.append(line).append("\r\n");
            }
        }
        return sb.toString();
    }
}