首页 诗词 字典 板报 句子 名言 友答 励志 学校 网站地图
当前位置: 首页 > 教程频道 > 开发语言 > 编程 >

简单HTTP抓取网页内容

2012-11-12 
简单HTTP抓取网页内容：package com.test; import java.io.BufferedReader; import java.io.InputStream; import …

简单HTTP抓取网页内容

package com.test;

import java.io.BufferedReader;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
import java.nio.charset.Charset;
import java.nio.charset.StandardCharsets;

/**
 * Minimal example of fetching a web page over HTTP with {@link HttpURLConnection}
 * and printing its body to standard output.
 */
public class TestHttp {

    /** Prefix of the Content-Type parameter that names the body's character set. */
    private static final String CHARSET_PARAM = "charset=";

    /**
     * Issues a GET request to a fixed URL, reads the whole response body as text
     * and prints it on one line (line terminators of the response are dropped,
     * because the body is read line by line and the lines are concatenated).
     *
     * @param args unused
     * @throws Exception if the URL is malformed or the request / read fails
     */
    public static void main(String[] args) throws Exception {
        String urlString = "http://www.baidu.com";
        URL url = new URL(urlString);
        HttpURLConnection urlConnection = (HttpURLConnection) url.openConnection();
        try {
            urlConnection.setRequestMethod("GET");
            // No request body is sent, so output mode is intentionally left disabled.
            urlConnection.setDoInput(true);
            urlConnection.setUseCaches(false);

            StringBuilder body = new StringBuilder();
            // getInputStream() performs the request; the response headers are
            // available afterwards, so the charset can be taken from Content-Type.
            // The bytes are decoded exactly once, with that charset, instead of
            // going through the platform default charset and being re-encoded.
            try (InputStream in = urlConnection.getInputStream();
                    BufferedReader reader = new BufferedReader(
                            new InputStreamReader(in, charsetOf(urlConnection.getContentType())))) {
                String line;
                while ((line = reader.readLine()) != null) {
                    body.append(line);
                }
            }

            System.out.println(body.toString());
        } finally {
            // Release the underlying connection even when the request or read fails.
            urlConnection.disconnect();
        }
    }

    /**
     * Extracts the character set from a Content-Type header value such as
     * {@code text/html; charset=GBK}.
     *
     * <p>Note that the Content-Encoding header is not consulted here: it names a
     * transfer coding such as {@code gzip}, not a character set.
     *
     * @param contentType the raw Content-Type header value, may be {@code null}
     * @return the declared charset, or UTF-8 when none is declared or the declared
     *         name is illegal or not supported by this JVM
     */
    private static Charset charsetOf(String contentType) {
        if (contentType != null) {
            for (String param : contentType.split(";")) {
                String trimmed = param.trim();
                if (!trimmed.regionMatches(true, 0, CHARSET_PARAM, 0, CHARSET_PARAM.length())) {
                    continue;
                }
                String name = trimmed.substring(CHARSET_PARAM.length()).trim();
                // The parameter value may be a quoted string: charset="utf-8".
                if (name.length() >= 2 && name.startsWith("\"") && name.endsWith("\"")) {
                    name = name.substring(1, name.length() - 1);
                }
                try {
                    return Charset.forName(name);
                } catch (IllegalArgumentException ignored) {
                    // Illegal or unsupported charset name: fall back to the default below.
                }
            }
        }
        return StandardCharsets.UTF_8;
    }
}

热点排行