HttpClient乱码,网上有好多方法,在这,仅说下自己获取页面,出现乱码的情情况:
将数据流增加字符集,这样就可以解决这个问题:
如:“BufferedReader br = new BufferedReader(new InputStreamReader(in,"UTF-8"));”
源码如下:
private String getPage(String url,String encode){
//创建HttpClient实例
HttpClient httpClient=new HttpClient();
//设置编码参数
if (encode!=null){
httpClient.getParams().setParameter(HttpMethodParams.HTTP_CONTENT_CHARSET,encode);
}else{
httpClient.getParams().setParameter(HttpMethodParams.HTTP_CONTENT_CHARSET,"gbk");
}
//忽略Cookies
httpClient.getParams().setCookiePolicy(CookiePolicy.IGNORE_COOKIES);
//创建GetMethod实例访问指定URL
GetMethod getMethod = new GetMethod(url);
try{
//访问指定URL并取得返回状态码
int statusCode = httpClient.executeMethod(getMethod);
if (statusCode==200){//返回成功状态码200
//读取页面HTML源码
StringBuffer sb = new StringBuffer();
InputStream in = getMethod.getResponseBodyAsStream();
BufferedReader br = new BufferedReader(new InputStreamReader(in,"UTF-8"));
String line;
while((line=br.readLine())!=null){
sb.append(line);
}
if(br!=null)br.close();
return sb.toString();
}else{
return null;
}
}catch(Exception ex){
ex.printStackTrace();
return null;
}
}