当前位置: 代码迷 >> HTML/CSS >> 通过 URL 地址抓取网页 HTML 代码
  详细解决方案

通过 URL 地址抓取网页 HTML 代码

热度:100   发布时间:2012-12-22 12:05:07.0
通过url地址抓取网页html代码
import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
import java.nio.charset.Charset;
import java.nio.charset.StandardCharsets;

/**
 * Small helper for downloading the body of an HTTP(S) resource as text.
 */
public class URLUtil {

  /** Charset used when the response does not declare a usable one. */
  private static final Charset DEFAULT_CHARSET = StandardCharsets.UTF_8;

  /**
   * Fetches the resource at {@code urlString} and returns its body as a string.
   *
   * <p>The body is decoded with the charset announced in the response's
   * {@code Content-Type} header, falling back to UTF-8 when the header is
   * missing or names an unknown charset. Every line of the body is terminated
   * with a single {@code "\n"} in the result, regardless of the line
   * separator used by the server.
   *
   * @param urlString absolute HTTP or HTTPS URL to fetch
   * @return the response body, or {@code null} if the URL is malformed, is not
   *     an HTTP(S) URL, or the request fails for any reason (the failure is
   *     printed to standard error)
   */
  public static String getHtml(String urlString) {
    HttpURLConnection conn = null;
    try {
      URL url = new URL(urlString);
      // Non-HTTP URLs (e.g. file:) fail this cast; the catch below maps that to null.
      conn = (HttpURLConnection) url.openConnection();
      Charset charset = charsetFromContentType(conn.getContentType());

      // try-with-resources closes the reader (and the underlying stream) even
      // when readLine() throws part-way through the body.
      try (BufferedReader br =
          new BufferedReader(new InputStreamReader(conn.getInputStream(), charset))) {
        StringBuilder html = new StringBuilder();
        String line;
        while ((line = br.readLine()) != null) {
          html.append(line).append("\n");
        }
        return html.toString();
      }
    } catch (Exception e) {
      // Best-effort API: callers rely on null to signal failure.
      e.printStackTrace();
      return null;
    } finally {
      // Release the connection on the failure paths too (e.g. 4xx/5xx responses).
      if (conn != null) {
        conn.disconnect();
      }
    }
  }

  /**
   * Extracts the charset from a {@code Content-Type} header value such as
   * {@code "text/html; charset=GBK"}.
   *
   * @param contentType raw header value, may be {@code null}
   * @return the declared charset, or UTF-8 if none is declared or the declared
   *     name is not supported by this JVM
   */
  private static Charset charsetFromContentType(String contentType) {
    if (contentType == null) {
      return DEFAULT_CHARSET;
    }
    final String key = "charset=";
    for (String part : contentType.split(";")) {
      String param = part.trim();
      if (!param.regionMatches(true, 0, key, 0, key.length())) {
        continue;
      }
      String name = param.substring(key.length()).trim();
      // The parameter value may be a quoted string.
      if (name.length() >= 2 && name.startsWith("\"") && name.endsWith("\"")) {
        name = name.substring(1, name.length() - 1);
      }
      try {
        return Charset.forName(name);
      } catch (IllegalArgumentException ignored) {
        // Illegal or unsupported charset name: fall back to the default.
        return DEFAULT_CHARSET;
      }
    }
    return DEFAULT_CHARSET;
  }

  /** Demo entry point: prints the HTML of a sample site to standard output. */
  public static void main(String[] args) {
    System.out.println(URLUtil.getHtml("http://www.fastunit.com"));
  }
}
  相关解决方案