天天看點

java擷取qq郵箱的網絡爬蟲

代碼如下

package Game;
import java.io.BufferedReader;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.io.PrintStream;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Scans a local HTML file line by line and prints every e-mail address found.
 */
public class Main {
    /**
     * Matches a single e-mail address: a local part, an {@code @}, and a
     * domain made of at least two dot-separated labels.
     *
     * <p>The previously published pattern had its {@code @} section replaced
     * by an "[email protected]" placeholder, which Java parses as a character
     * class, so it could never match a real address. This pattern also uses
     * explicit character classes instead of {@code .} so that a match stops at
     * the address boundaries instead of swallowing the surrounding markup.
     */
    private static final Pattern EMAIL_PATTERN =
            Pattern.compile("[A-Za-z0-9._%+-]+@[A-Za-z0-9-]+(\\.[A-Za-z0-9-]+)+");

    /**
     * Reads {@code D:\index.html} and prints each e-mail address it contains
     * to standard output, one per line.
     *
     * @param args unused
     * @throws IOException if the file cannot be opened or read
     */
    public static void main(String[] args) throws IOException {
        File file = new File("D:\\index.html");
        // The file is decoded with the platform default charset, as before.
        // try-with-resources closes the reader even when readLine() throws.
        try (BufferedReader buf =
                new BufferedReader(new InputStreamReader(new FileInputStream(file)))) {
            String str;
            while ((str = buf.readLine()) != null) {
                printEmails(str, System.out);
            }
        }
    }

    /**
     * Prints every e-mail address found in {@code line}, one per output line,
     * in order of appearance. Repeated addresses are printed each time.
     *
     * @param line the text to scan
     * @param out  the stream that receives the matches
     * @return the number of addresses printed
     */
    static int printEmails(String line, PrintStream out) {
        Matcher matcher = EMAIL_PATTERN.matcher(line);
        int count = 0;
        while (matcher.find()) {
            out.println(matcher.group());
            count++;
        }
        return count;
    }
}
           

  詳細說明:http://java.662p.com/thread-3731-1-1.html

轉載于:https://www.cnblogs.com/liniuzen/p/4107842.html