Java获取网页源码
2013-03-08 09:36
155 查看
01 package gogo.cool;
02
03 import java.io.BufferedReader;
04 import java.io.IOException;
05 import java.io.InputStreamReader;
06 import java.net.HttpURLConnection;
07 import java.net.URL;
08
/**
 * Minimal example that downloads a web page over HTTP and prints its HTML source.
 */
public class test1 {

    /**
     * Fetches {@code http://www.baidu.com}, decodes it as GBK and prints the result
     * to standard output.
     *
     * @param a command-line arguments (unused)
     * @throws IOException kept in the signature for backward compatibility;
     *     {@link #getHTML(String, String)} handles its own I/O failures
     */
    public static void main(String[] a) throws IOException {
        String url = "http://www.baidu.com";

        // Using the gb2312 charset declared in the page itself actually produces garbled text.
        System.out.println(getHTML(url, "gbk"));
    }

    /**
     * Downloads the resource at {@code pageURL} and returns its body as text.
     *
     * <p>This is a best-effort call: any failure (malformed URL, non-HTTP URL,
     * unsupported charset, network error) is reported on standard error and the
     * text read so far (possibly empty) is returned instead of throwing.
     *
     * @param pageURL  absolute HTTP URL of the page to fetch
     * @param encoding name of the charset used to decode the response body
     * @return the page content with every line terminated by {@code "\r\n"};
     *     empty or partial if the fetch failed
     */
    public static String getHTML(String pageURL, String encoding) {
        StringBuilder pageHTML = new StringBuilder();
        HttpURLConnection connection = null;

        try {
            URL url = new URL(pageURL);
            connection = (HttpURLConnection) url.openConnection();
            connection.setRequestProperty("User-Agent", "MSIE 7.0");

            // try-with-resources closes the reader (and the underlying stream)
            // even when reading fails part-way through.
            try (BufferedReader br = new BufferedReader(
                    new InputStreamReader(connection.getInputStream(), encoding))) {
                String line;
                while ((line = br.readLine()) != null) {
                    pageHTML.append(line).append("\r\n");
                }
            }
        } catch (IOException | RuntimeException e) {
            // RuntimeException is caught as well so that, as before, a non-HTTP URL
            // (ClassCastException) or similar misuse does not propagate to the caller.
            System.err.println("Failed to fetch " + pageURL);
            e.printStackTrace();
        } finally {
            // Release the connection on both the success and the failure path.
            if (connection != null) {
                connection.disconnect();
            }
        }

        return pageHTML.toString();
    }
}
02
03 import java.io.BufferedReader;
04 import java.io.IOException;
05 import java.io.InputStreamReader;
06 import java.net.HttpURLConnection;
07 import java.net.URL;
08
/**
 * Minimal example that downloads a web page over HTTP and prints its HTML source.
 */
public class test1 {

    /**
     * Fetches {@code http://www.baidu.com}, decodes it as GBK and prints the result
     * to standard output.
     *
     * @param a command-line arguments (unused)
     * @throws IOException kept in the signature for backward compatibility;
     *     {@link #getHTML(String, String)} handles its own I/O failures
     */
    public static void main(String[] a) throws IOException {
        String url = "http://www.baidu.com";

        // Using the gb2312 charset declared in the page itself actually produces garbled text.
        System.out.println(getHTML(url, "gbk"));
    }

    /**
     * Downloads the resource at {@code pageURL} and returns its body as text.
     *
     * <p>This is a best-effort call: any failure (malformed URL, non-HTTP URL,
     * unsupported charset, network error) is reported on standard error and the
     * text read so far (possibly empty) is returned instead of throwing.
     *
     * @param pageURL  absolute HTTP URL of the page to fetch
     * @param encoding name of the charset used to decode the response body
     * @return the page content with every line terminated by {@code "\r\n"};
     *     empty or partial if the fetch failed
     */
    public static String getHTML(String pageURL, String encoding) {
        StringBuilder pageHTML = new StringBuilder();
        HttpURLConnection connection = null;

        try {
            URL url = new URL(pageURL);
            connection = (HttpURLConnection) url.openConnection();
            connection.setRequestProperty("User-Agent", "MSIE 7.0");

            // try-with-resources closes the reader (and the underlying stream)
            // even when reading fails part-way through.
            try (BufferedReader br = new BufferedReader(
                    new InputStreamReader(connection.getInputStream(), encoding))) {
                String line;
                while ((line = br.readLine()) != null) {
                    pageHTML.append(line).append("\r\n");
                }
            }
        } catch (IOException | RuntimeException e) {
            // RuntimeException is caught as well so that, as before, a non-HTTP URL
            // (ClassCastException) or similar misuse does not propagate to the caller.
            System.err.println("Failed to fetch " + pageURL);
            e.printStackTrace();
        } finally {
            // Release the connection on both the success and the failure path.
            if (connection != null) {
                connection.disconnect();
            }
        }

        return pageHTML.toString();
    }
}
相关文章推荐
- JAVA获取网页源码
- java 获取网页源码
- Java获取网页源码处理
- JAVA获取网页源码并写入html文件
- java 根据URL获取网页源码
- JAVA获取网页源码
- java使用websocket,并且获取HttpSession,源码分析
- java利用正则表达式获取一个网页中的所有邮箱地址
- php file_get_contents向网页提交Cookie并获取源码
- Android网络:HTTP之利用HttpURLConnection访问网页、获取网络图片实例 (附源码)
- Java:java爬虫获取动态网页的数据
- 根据网址获取网页源码(1)
- android练习一之获取网页源码
- Java使用URL获取网页内容
- Linux获取网页源码的几种方法 linux爬虫程序
- java 获取resource的源码分析
- C#获取网页源码
- Delphi XE下获取网页源码记录
- 根据URL获取网页TXT源码【Android】