日期:2014-05-17  浏览次数:20601 次

通过 URL 地址抓取网页 HTML 代码
import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
import java.net.URLConnection;
import java.nio.charset.Charset;
import java.nio.charset.StandardCharsets;

/**
 * Utility for downloading the body of a web page as text.
 */
public class URLUtil {

  private static final String CHARSET_PREFIX = "charset=";

  /**
   * Fetches the resource at the given HTTP(S) URL and returns its body as a string.
   *
   * <p>The body is decoded with the charset named in the response's {@code Content-Type}
   * header, falling back to UTF-8 when the header is absent or names an unknown charset.
   * The body is read line by line and every line is terminated with {@code "\n"} in the
   * result, so the returned text always ends with a newline when the body is non-empty.
   *
   * <p>This method never throws: any failure (malformed or {@code null} URL, non-HTTP
   * protocol, I/O error, HTTP error status) is reported on standard error and signalled
   * by a {@code null} return value.
   *
   * @param urlString absolute URL of the page to download
   * @return the decoded response body, or {@code null} if the page could not be fetched
   */
  public static String getHtml(String urlString) {
    HttpURLConnection conn = null;
    try {
      URLConnection raw = new URL(urlString).openConnection();
      // Check the type explicitly instead of relying on a caught ClassCastException.
      if (!(raw instanceof HttpURLConnection)) {
        System.err.println("Not an HTTP(S) URL: " + urlString);
        return null;
      }
      conn = (HttpURLConnection) raw;

      StringBuilder html = new StringBuilder();
      // try-with-resources closes the stream and reader even if reading fails midway.
      try (InputStream in = conn.getInputStream();
          BufferedReader reader = new BufferedReader(
              new InputStreamReader(in, charsetOf(conn.getContentType())))) {
        String line;
        while ((line = reader.readLine()) != null) {
          html.append(line).append('\n');
        }
      }
      return html.toString();
    } catch (IOException | RuntimeException e) {
      // Callers rely on a null result rather than an exception, so report and swallow.
      e.printStackTrace();
      return null;
    } finally {
      if (conn != null) {
        conn.disconnect();
      }
    }
  }

  /**
   * Extracts the charset from a {@code Content-Type} header value such as
   * {@code text/html; charset=GBK}.
   *
   * @param contentType the header value, may be {@code null}
   * @return the declared charset, or UTF-8 if none is declared or it is not supported
   */
  private static Charset charsetOf(String contentType) {
    if (contentType != null) {
      for (String part : contentType.split(";")) {
        String token = part.trim();
        if (token.regionMatches(true, 0, CHARSET_PREFIX, 0, CHARSET_PREFIX.length())) {
          String name = token.substring(CHARSET_PREFIX.length()).trim();
          // The parameter value may legally be quoted: charset="utf-8".
          if (name.length() >= 2 && name.startsWith("\"") && name.endsWith("\"")) {
            name = name.substring(1, name.length() - 1);
          }
          try {
            return Charset.forName(name);
          } catch (IllegalArgumentException ignored) {
            // Malformed or unsupported charset name: fall through to the default.
          }
        }
      }
    }
    return StandardCharsets.UTF_8;
  }

  /**
   * Demo entry point: downloads a sample page and prints it to standard output.
   *
   * @param args ignored
   */
  public static void main(String[] args) {
    System.out.println(URLUtil.getHtml("http://www.fastunit.com"));
  }
}