URLConnection得到的网页是乱码

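使用 URLConnection 读取网页时得到乱码,原因在于 baidu、google 等网站的响应采用了 gzip 压缩:当请求头 Accept-Encoding 中含有 gzip 时,服务器返回的是压缩后的数据,而程序直接把这些压缩字节当作文本读取,于是得到乱码。解决办法有两种:不发送含 gzip 的 Accept-Encoding 请求头(下面的示例没有发送该请求头),或者先用 GZIPInputStream 解压后再按字符集读取。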

import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.InetSocketAddress;
import java.net.Proxy;
import java.net.URL;
import java.net.URLConnection;
import java.net.UnknownHostException;
import java.util.zip.GZIPInputStream;

/**
 * Small demo that downloads a web page through an HTTP proxy and prints it
 * line by line to standard output.
 *
 * <p>The request deliberately does not send an {@code Accept-Encoding} header,
 * so the server is not asked for a compressed response. If the response is
 * nevertheless reported as {@code gzip}-encoded, it is decompressed before
 * being decoded as text; reading compressed bytes as text is what produces
 * garbled output.
 */
public class SessionFactory {

    /** Host of the HTTP proxy every request is routed through. */
    private static final String PROXY_HOST = "10.167.39.11";

    /** Port of the HTTP proxy. */
    private static final int PROXY_PORT = 8080;

    /**
     * Charset used to decode the response body.
     * NOTE(review): hard-coded; pages served in another charset will still
     * print garbled text - confirm against the target site's Content-Type.
     */
    private static final String PAGE_CHARSET = "gb2312";

    /**
     * Fetches a fixed URL and prints the page; I/O failures are reported as a
     * stack trace on standard error.
     *
     * @param args ignored
     */
    public static void main(String[] args) {
        String url = "http://www.baidu.com/";
        try {
            send(url);
        } catch (IOException e) {
            // UnknownHostException is a subclass of IOException, so a single
            // handler covers both failures declared by send().
            e.printStackTrace();
        }
    }

    /**
     * Requests {@code url} through the configured proxy, prints the response's
     * content encoding, then prints the body one line at a time.
     *
     * @param url absolute URL of the page to fetch
     * @return {@code true} once the whole body has been read and printed
     * @throws UnknownHostException if a host name cannot be resolved
     * @throws IOException if the URL is malformed, or connecting or reading fails
     */
    public static synchronized boolean send(String url)
            throws UnknownHostException, IOException {

        URL urlRoot = new URL(url);

        // Route the request through the HTTP proxy.
        InetSocketAddress addr = new InetSocketAddress(PROXY_HOST, PROXY_PORT);
        Proxy proxy = new Proxy(Proxy.Type.HTTP, addr);

        URLConnection conn = urlRoot.openConnection(proxy);
        conn.addRequestProperty(
                "User-Agent",
                "Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.9.1.8) Gecko/20100202 Firefox/3.5.8 GTB6");
        conn.addRequestProperty(
                "Accept",
                "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8");
        conn.addRequestProperty("Accept-Language", "en-us,en;q=0.5");
        // "Accept-Encoding: gzip,deflate" is intentionally NOT sent, so the
        // server is not invited to compress the response.
        conn.addRequestProperty("Accept-Charset",
                "ISO-8859-1,utf-8;q=0.7,*;q=0.7");
        conn.addRequestProperty("Keep-Alive", "300");
        conn.addRequestProperty("Proxy-Connection", "keep-alive");

        conn.connect();
        String contentEncoding = conn.getContentEncoding();
        System.out.println(contentEncoding);

        InputStream body = conn.getInputStream();
        try {
            // Decompress first when the response is gzip-encoded; otherwise
            // the compressed bytes would be decoded as text.
            if ("gzip".equalsIgnoreCase(contentEncoding)) {
                body = new GZIPInputStream(body);
            }
            BufferedReader in = new BufferedReader(
                    new InputStreamReader(body, PAGE_CHARSET));
            String line;
            while ((line = in.readLine()) != null) {
                System.out.println(line);
            }
        } finally {
            // Closing the outermost stream also closes the connection's stream,
            // even when reading fails part-way through.
            body.close();
        }

        return true;
    }
}
  • 1
    点赞
  • 1
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值