#网页HTML的编码是gb2312
<meta http-equiv="Content-Type" content="text/html; charset=gb2312">
#Java用utf-8 读取汉字乱码,读取网页HTML内容后输出汉字乱码
// Open a connection to url and treat it as an HTTP connection.
URLConnection urlConnection = new URL(url).openConnection();
HttpURLConnection connection = (HttpURLConnection) urlConnection;
connection.setRequestMethod("GET");
// Connect
connection.connect();
// Decode the response body as UTF-8.
// NOTE(review): the page declares charset=gb2312 (see the meta tag above), so
// decoding its bytes as UTF-8 is the mismatch behind the garbled Chinese text
// this note describes.
BufferedReader bufferedReader = new BufferedReader(new InputStreamReader
(connection.getInputStream(), StandardCharsets.UTF_8));
// Buffer presumably meant to collect the page text; its use is outside this view.
StringBuilder bs = new StringBuilder();
// Receives each line returned by readLine() in the loop below.
String l;
while ((l = bufferedReader.readLine()) != null)