package test;
import java.net.HttpURLConnection;
import java.net.URL;
import java.util.Scanner;
/**
 * Minimal page fetcher: issues an HTTP GET for a fixed search URL and prints
 * the response body to standard output line by line.
 */
public class WebCapturer从网页抓取数据 {

    /** Charset used when the response declares none (or an unsupported one). */
    private static final String DEFAULT_CHARSET = "UTF-8";

    /** Connect/read timeout so an unresponsive server cannot block forever. */
    private static final int TIMEOUT_MILLIS = 10000;

    /**
     * Fetches the page and echoes its HTML to {@code System.out}.
     *
     * @param args unused
     * @throws Exception if the URL is malformed, the connection fails, the
     *                   server returns an error status, or reading the body
     *                   fails part-way through
     */
    public static void main(String[] args) throws Exception {
        URL url = new URL("http://www.baidu.com/s?wd=360");
        HttpURLConnection conn = (HttpURLConnection) url.openConnection();
        try {
            conn.setRequestMethod("GET");
            // The original author flagged this header as important; presumably the
            // server answers the default Java user agent differently (unverified).
            conn.setRequestProperty("User-Agent",
                    "Mozilla/5.0 (X11; U; Linux i686; zh-CN; rv:1.9.1.2) "
                            + " Gecko/20090803 Fedora/3.5.2-2.fc11 Firefox/3.5.2");
            conn.setConnectTimeout(TIMEOUT_MILLIS);
            conn.setReadTimeout(TIMEOUT_MILLIS);

            // Decode with the charset the server declares rather than the platform
            // default, and close the scanner (and its stream) when done.
            try (Scanner scanner =
                    new Scanner(conn.getInputStream(), charsetOf(conn.getContentType()))) {
                while (scanner.hasNextLine()) {
                    System.out.println(scanner.nextLine());
                }
                // Scanner swallows read errors and simply reports "no more lines";
                // surface them so a truncated page is not mistaken for success.
                java.io.IOException failure = scanner.ioException();
                if (failure != null) {
                    throw failure;
                }
            }
        } finally {
            conn.disconnect();
        }
    }

    /**
     * Extracts the charset name from a {@code Content-Type} header value.
     *
     * @param contentType header value such as {@code text/html; charset=gbk};
     *                    may be {@code null}
     * @return the declared charset name if present and supported by this JVM,
     *         otherwise {@link #DEFAULT_CHARSET}
     */
    private static String charsetOf(String contentType) {
        if (contentType == null) {
            return DEFAULT_CHARSET;
        }
        final String key = "charset=";
        for (String part : contentType.split(";")) {
            String param = part.trim();
            if (param.regionMatches(true, 0, key, 0, key.length())) {
                String name = param.substring(key.length()).replace("\"", "").trim();
                try {
                    if (java.nio.charset.Charset.isSupported(name)) {
                        return name;
                    }
                } catch (IllegalArgumentException ignored) {
                    // Syntactically illegal charset name: fall back to the default.
                }
            }
        }
        return DEFAULT_CHARSET;
    }
}
// Fetches the HTML of the page.
// Tags: java, scraping, web page, data
// (Blog page footer: latest recommended article published 2024-04-30 14:28:06)