您的位置:首页 > 其它

博客第一天!努力的开始!

2016-05-12 15:52 344 查看
package bs;

import java.io.BufferedReader;

import java.io.FileReader;

import java.io.IOException;

import java.io.InputStreamReader;

import java.net.URL;

import java.util.regex.Matcher;

import java.util.regex.Pattern;

import org.junit.Test;

public class SpideDemo {

 public static void main(String[] args) {

        try {

   URL url=new URL("http://www.sina.com");

   BufferedReader br=new BufferedReader(new InputStreamReader(url.openStream()));

   

   String regex="\\w+@\\w+(\\.\\w+)+";

   String regex1="<a href=";

   Pattern p=Pattern.compile(regex);

   String line=null;

   while((line=br.readLine())!=null){

    

    Matcher m=p.matcher(line);

    Matcher m1=p.matcher(regex1);

    while(m1.find()){

     

    }

    while(m.find()){

     System.out.println(m.group());

    }

   }

  } catch (Exception e) {

   e.printStackTrace();

  }

       

 }

 @Test

 public void hello(){

  try {

   BufferedReader br=new BufferedReader(new FileReader("./net/mail.html"));

   String regex="^[a-z0-9]+([._\\-]*[a-z0-9])*@([a-z0-9]+[-a-z0-9]*[a-z0-9]+.){1,63}[a-z0-9]+$";

   Pattern p=Pattern.compile(regex);

   String str=null;

   while((str=br.readLine())!=null){

    Matcher m=p.matcher(str);

    while(m.find()){

     System.out.println(m.group());

    }

   }

  } catch (IOException e) {

   e.printStackTrace();

  }

 }

}
内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签: