网络编程(socket)最基本的应用——抓页面。抓个页面 happy 一下:
import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.net.URL;
import java.net.URLConnection;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
/**
 * Minimal page-fetching demo: opens a {@link URLConnection} to a fixed URL,
 * sends a {@code User-Agent} request header, reads the response body line by
 * line and writes it to the debug log.
 */
public class SocketTest {
    /** Logger for this class (category is this class, not an unrelated one). */
    private static final Log log = LogFactory.getLog(SocketTest.class);

    /** Value sent as the {@code User-Agent} request header; empty in this sample. */
    private static final String USER_AGENT = "";

    /**
     * Fetches the page and logs its content at debug level.
     *
     * @param args ignored
     * @throws IOException if the URL is malformed, the connection cannot be
     *                     opened, or reading the response fails
     */
    public static void main(String[] args) throws IOException {
        log.info("hello Molly");

        String protocol = "http://";
        String host = "images.google.cn";
        String path = "/images?hl=zh-CN&q=x&gbv=2&aq=f";
        URL url = new URL(protocol + host + path);

        URLConnection conn = url.openConnection();
        conn.addRequestProperty("User-Agent", USER_AGENT);

        StringBuilder document = new StringBuilder();
        // NOTE(review): the response is decoded with the platform default charset;
        // confirm that matches the charset the server actually sends.
        BufferedReader reader = new BufferedReader(
                new InputStreamReader(conn.getInputStream()));
        try {
            String line;
            while ((line = reader.readLine()) != null) {
                // readLine() strips the terminator, so re-add one per line.
                document.append(line).append('\n');
            }
        } finally {
            // Close even when readLine() throws, so the HTTP stream is not leaked.
            reader.close();
        }

        log.debug("\n" + document.toString());
    }
}
--------- 超华丽的分隔线 ---------
User-Agent:Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1) ; .NET CLR 2.0.50727)
User-Agent:Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1) ; .NET CLR 2.0.50727; MAXTHON 2.0)
User-Agent:Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.8.1.14) Gecko/20080404 Firefox/2.0.0.14
User-Agent:Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN) AppleWebKit/525.13 (KHTML, like Gecko) Version/3.1 Safari/525.13.3
User-Agent:Opera/9.27 (Windows NT 5.1; U; zh-cn)
--------- 超华丽的分隔线 ---------
User-Agent 有啥用? 你猜 - 3-