博客第一天!努力的开始!
2016-05-12 15:52
344 查看
package bs;
import java.io.BufferedReader;
import java.io.FileReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.net.URL;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import org.junit.Test;
/**
 * Small demo that scans text line by line for e-mail addresses using regular
 * expressions and prints every match to standard output.
 *
 * <p>{@link #main(String[])} scans the page served at http://www.sina.com;
 * {@link #hello()} scans the local file ./net/mail.html.
 */
public class SpideDemo {

    /** Loose pattern: finds address-like tokens anywhere inside a line. */
    private static final Pattern LOOSE_EMAIL = Pattern.compile("\\w+@\\w+(\\.\\w+)+");

    /**
     * Strict pattern, anchored with {@code ^...$}: it only matches a line that
     * consists entirely of one lower-case address. The dot separating domain
     * labels is escaped so that it matches a literal '.' and not any character.
     */
    private static final Pattern STRICT_EMAIL_LINE = Pattern.compile(
            "^[a-z0-9]+([._\\-]*[a-z0-9])*@([a-z0-9]+[-a-z0-9]*[a-z0-9]+\\.){1,63}[a-z0-9]+$");

    /**
     * Downloads http://www.sina.com and prints every e-mail-like token found in it.
     * I/O failures are reported via a stack trace on standard error.
     *
     * @param args ignored
     */
    public static void main(String[] args) {
        // try-with-resources closes the reader (and the underlying network stream)
        // even when reading fails part-way through.
        try (BufferedReader br = new BufferedReader(
                new InputStreamReader(new URL("http://www.sina.com").openStream()))) {
            printMatches(br, LOOSE_EMAIL);
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Reads ./net/mail.html and prints every line that is a well-formed
     * lower-case e-mail address according to {@link #STRICT_EMAIL_LINE}.
     * I/O failures are reported via a stack trace on standard error.
     */
    @Test
    public void hello() {
        try (BufferedReader br = new BufferedReader(new FileReader("./net/mail.html"))) {
            printMatches(br, STRICT_EMAIL_LINE);
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Prints, one per output line, every match of {@code pattern} in each line of {@code reader}.
     *
     * @param reader  source of text; the caller is responsible for closing it
     * @param pattern pre-compiled pattern to search for
     * @throws IOException if reading from {@code reader} fails
     */
    private static void printMatches(BufferedReader reader, Pattern pattern) throws IOException {
        String line;
        while ((line = reader.readLine()) != null) {
            Matcher matcher = pattern.matcher(line);
            while (matcher.find()) {
                System.out.println(matcher.group());
            }
        }
    }
}
import java.io.BufferedReader;
import java.io.FileReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.net.URL;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import org.junit.Test;
/**
 * Small demo that scans text line by line for e-mail addresses using regular
 * expressions and prints every match to standard output.
 *
 * <p>{@link #main(String[])} scans the page served at http://www.sina.com;
 * {@link #hello()} scans the local file ./net/mail.html.
 */
public class SpideDemo {

    /** Loose pattern: finds address-like tokens anywhere inside a line. */
    private static final Pattern LOOSE_EMAIL = Pattern.compile("\\w+@\\w+(\\.\\w+)+");

    /**
     * Strict pattern, anchored with {@code ^...$}: it only matches a line that
     * consists entirely of one lower-case address. The dot separating domain
     * labels is escaped so that it matches a literal '.' and not any character.
     */
    private static final Pattern STRICT_EMAIL_LINE = Pattern.compile(
            "^[a-z0-9]+([._\\-]*[a-z0-9])*@([a-z0-9]+[-a-z0-9]*[a-z0-9]+\\.){1,63}[a-z0-9]+$");

    /**
     * Downloads http://www.sina.com and prints every e-mail-like token found in it.
     * I/O failures are reported via a stack trace on standard error.
     *
     * @param args ignored
     */
    public static void main(String[] args) {
        // try-with-resources closes the reader (and the underlying network stream)
        // even when reading fails part-way through.
        try (BufferedReader br = new BufferedReader(
                new InputStreamReader(new URL("http://www.sina.com").openStream()))) {
            printMatches(br, LOOSE_EMAIL);
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Reads ./net/mail.html and prints every line that is a well-formed
     * lower-case e-mail address according to {@link #STRICT_EMAIL_LINE}.
     * I/O failures are reported via a stack trace on standard error.
     */
    @Test
    public void hello() {
        try (BufferedReader br = new BufferedReader(new FileReader("./net/mail.html"))) {
            printMatches(br, STRICT_EMAIL_LINE);
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Prints, one per output line, every match of {@code pattern} in each line of {@code reader}.
     *
     * @param reader  source of text; the caller is responsible for closing it
     * @param pattern pre-compiled pattern to search for
     * @throws IOException if reading from {@code reader} fails
     */
    private static void printMatches(BufferedReader reader, Pattern pattern) throws IOException {
        String line;
        while ((line = reader.readLine()) != null) {
            Matcher matcher = pattern.matcher(line);
            while (matcher.find()) {
                System.out.println(matcher.group());
            }
        }
    }
}
相关文章推荐
- DRL前沿之:Hierarchical Deep Reinforcement Learning
- JavaScript的模块化开发框架Sea.js上手指南
- java和Spring发送邮件
- Spring-boot添加Mybatis
- GIT的认识
- DateFormat只要 年月日
- test
- 俩台服务器搭建redis主从的问题
- AngularJs获取数组的元素例子
- Nginx配置PHP框架时出现Access Denied时的解决办法
- sql server 各种等待类型-转
- jQuery中find和filter的区别
- 用户体验
- 博客园的用户体验
- 单个App的UI测试
- python 第一章 介绍-1.python特点.
- 阅读协议之知识点记录--持续更新中... ...
- spring mvc拦截器和<mvc:annotation-driven />的详解
- Java面试题--只提出了问题
- Opencv函数研究