正则表达式,模拟网络爬虫小例子
发布时间:2020-12-14 01:11:23 所属栏目:百科 来源:网络整理
导读:package cn.zhengze; import java.io.BufferedReader; import java.io.File; import java.io.FileNotFoundException; import java.io.FileReader; import java.io.IOException; import java.io.InputStreamReader; import java.util.ArrayList; import java.util.List; …
import java.io.BufferedReader;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.util.ArrayList;
import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Toy "web crawler": scans a saved HTML page line by line and prints every
 * e-mail address found by a regular expression.
 *
 * <p>The original listing declared {@code package cn.zhengze;}. It is left out
 * here so the file compiles on its own as {@code netbug.java}; add the
 * declaration back as the first line if the file lives under
 * {@code cn/zhengze/}.
 */
public class netbug {

    /**
     * Reads {@code mail.html} from the working directory and prints each
     * e-mail address it contains, one per line, in order of appearance.
     *
     * @param args unused
     * @throws IOException if {@code mail.html} cannot be opened or read
     */
    public static void main(String[] args) throws IOException {
        File file = new File("mail.html");

        // The published listing had lost its backslashes ("w+@...(.[a-zA-Z]...)"),
        // which matched only local parts made of the letter 'w' and accepted any
        // character as the domain separator. Restored: \w+ for the local part and
        // \. for a literal dot, followed by one to three 2-3 letter domain labels.
        String regex = "\\w+@[a-zA-Z0-9]+(\\.[a-zA-Z]{2,3}){1,3}";

        List<String> mailList = getMails(file, regex);
        for (String mail : mailList) {
            System.out.println(mail);
        }
    }

    /**
     * Collects every substring of {@code file} that matches {@code regex}.
     * The file is processed one line at a time, so a match never spans a
     * line break. Text is decoded by {@link FileReader} with its default
     * charset.
     *
     * @param file  text file to scan
     * @param regex regular expression describing the strings to collect
     * @return all matches in file order (duplicates kept); empty if none
     * @throws IOException if the file cannot be opened or read
     */
    private static List<String> getMails(File file, String regex) throws IOException {
        // Compile first: an invalid pattern then fails before any file is opened.
        Pattern p = Pattern.compile(regex);
        List<String> list = new ArrayList<String>();

        BufferedReader bufr = new BufferedReader(new FileReader(file));
        try {
            String line;
            while ((line = bufr.readLine()) != null) {
                Matcher m = p.matcher(line);
                while (m.find()) {
                    list.add(m.group());
                }
            }
        } finally {
            // The original never closed the reader and leaked the file handle.
            bufr.close();
        }
        return list;
    }
}
// (Editor: Li Datong) [Disclaimer] All content on this site comes from the internet; the views expressed are solely those of the authors and do not represent this site's position. If your rights have been inadvertently infringed, please contact the site administrator promptly to have the content removed.