Java 下载网页中的内容
2013-09-26 18:19
246 查看
import java.io.BufferedReader;
import java.io.ByteArrayOutputStream;
import java.io.File;
import java.io.FileOutputStream;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;

/**
 * Utility for fetching content over HTTP: as raw bytes, as text, or straight
 * into a local file.
 */
public class UrlResource {

    /** Maximum time to wait for the TCP connection to be established. */
    private static final int CONNECT_TIMEOUT_MS = 15000;

    /** Maximum time a single blocking read may wait for data. */
    private static final int READ_TIMEOUT_MS = 30000;

    /** Demo entry point: prints a page's text and saves an image to disk. */
    public static void main(String[] args) {
        try {
            System.out.println(UrlResource.getUrlDetail("http://www.baidu.com", true));
            saveUrlFile("http://www.baidu.com/img/baidu_jgylogo3.gif", "D:\\1.gif");
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

    /**
     * Downloads the resource at {@code fileUrl} and stores it at {@code fileDes}.
     *
     * <p>If {@code fileDes} already exists the method returns without doing
     * anything. The download is performed before the destination is created,
     * so a failed download never leaves an empty file behind that would make
     * later calls skip the download.
     *
     * @param fileUrl URL of the resource to download
     * @param fileDes destination path, including the file extension
     * @throws Exception if the URL is invalid, the download fails, or the file
     *                   cannot be written
     */
    public static void saveUrlFile(String fileUrl, String fileDes) throws Exception {
        File toFile = new File(fileDes);
        if (toFile.exists()) {
            return;
        }

        // Fetch first: only touch the file system once we actually have the data.
        byte[] data = getUrlFileData(fileUrl);

        boolean written = false;
        try (FileOutputStream out = new FileOutputStream(toFile)) {
            out.write(data);
            written = true;
        } finally {
            if (!written) {
                // Do not leave a truncated file that would block a retry.
                toFile.delete();
            }
        }
    }

    /**
     * Reads the complete response body of {@code fileUrl} into memory.
     *
     * @param fileUrl URL of the resource to read
     * @return the response body as a byte array
     * @throws Exception if the URL is invalid or the transfer fails
     */
    public static byte[] getUrlFileData(String fileUrl) throws Exception {
        HttpURLConnection httpConn = openConnection(fileUrl);
        try (InputStream in = httpConn.getInputStream()) {
            ByteArrayOutputStream collected = new ByteArrayOutputStream();
            byte[] buffer = new byte[8192];
            int len;
            while ((len = in.read(buffer)) != -1) {
                collected.write(buffer, 0, len);
            }
            return collected.toByteArray();
        } finally {
            httpConn.disconnect();
        }
    }

    /**
     * Reads the response body of {@code urlStr} as text, decoded as UTF-8.
     *
     * <p>The body is read line by line, so the original line terminators are
     * not preserved: lines are joined either with the platform line separator
     * or with nothing at all.
     *
     * @param urlStr  URL of the page to read
     * @param withSep {@code true} to append the platform line separator after
     *                every line, {@code false} to concatenate lines directly
     * @return the decoded text
     * @throws Exception if the URL is invalid or the transfer fails
     */
    public static String getUrlDetail(String urlStr, boolean withSep) throws Exception {
        HttpURLConnection httpConn = openConnection(urlStr);
        try (BufferedReader reader =
                new BufferedReader(new InputStreamReader(httpConn.getInputStream(), "UTF-8"))) {
            String separator = System.getProperty("line.separator");
            StringBuilder sb = new StringBuilder();
            String line;
            while ((line = reader.readLine()) != null) {
                sb.append(line);
                if (withSep) {
                    sb.append(separator);
                }
            }
            return sb.toString();
        } finally {
            httpConn.disconnect();
        }
    }

    /**
     * Creates (but does not yet connect) an HTTP connection with timeouts set,
     * so a stalled server cannot block the caller forever. The actual network
     * connection is made when the caller requests the input stream.
     */
    private static HttpURLConnection openConnection(String address) throws Exception {
        URL url = new URL(address);
        HttpURLConnection httpConn = (HttpURLConnection) url.openConnection();
        httpConn.setConnectTimeout(CONNECT_TIMEOUT_MS);
        httpConn.setReadTimeout(READ_TIMEOUT_MS);
        return httpConn;
    }
}
相关文章推荐
- java下载网页内容和网络图片
- JAVA:获得网页下载文件内容
- 使用Java下载网页的下载链接的内容
- java下载网页并读取内容
- 实现Java读取网页内容并下载网页中出现的图片
- java下载网页内容和网络图片
- java下载html页面---把网页内容保存成本地html
- java下载html页面---把网页内容保存成本地html
- java下载读取网页内容方式
- Java读取网页内容并下载图片的实例
- java 使用URL来读取网页内容
- JAVA取网页内容信息
- Java获取网页内容、图片、JavaScript和CSS文件工具类
- Java基础:利用HttpClient获取网页内容
- java爬取网页内容 简单例子(1)——使用正则表达式
- 关于chunked gzip,socket下载网页内容. - xiqi8144的专栏 - 博客频道 - CSDN.NET
- Java使用HttpClient的HttpGet获取网页内容
- JAVA 抓取网页内容
- Java基础:Day01笔记内容 (概述、JDK的下载及安装)
- java小demo:下载http://learning.sohu.com/s2004/7231/s221868027.shtml中所有的内容图片