java 获取网页指定内容-2(实践+修改)

import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.util.Arrays;


/**
 * Downloads a web page and prints the text of one {@code <p class="wea">...</p>} element.
 *
 * <p>The page is read line by line as UTF-8. Every match of the pattern is collected, and the
 * seventh match counted from the end is written to standard output.
 */
public class Weather {
  /** Matches one {@code <p class="wea">} element; group 1 is its text. Compiled once. */
  private static final Pattern WEA_PATTERN = Pattern.compile("<p class=\"wea\">(.+?)</p>");

  /** Which match to print, counted from the end of the page (7 = seventh from last). */
  private static final int POSITION_FROM_END = 7;

  /** Address of the page to download. */
  String urlString;

  /** Text of the most recent match found by {@link #run()}. */
  String array;

  /** Text of every match found by the latest {@link #run()}, each followed by a comma. */
  StringBuffer sb = new StringBuffer("");

  /**
   * Runs the extraction against a fixed weather.com.cn page.
   *
   * @param args ignored
   * @throws Exception if the page cannot be downloaded or holds too few matches
   */
  public static void main(String[] args) throws Exception {
    Weather client = new Weather("http://www.weather.com.cn/weather/101181201.shtml");
    client.run();
  }

  /**
   * Creates a client for the given page.
   *
   * @param urlString address of the page to download
   */
  public Weather(String urlString) {
    this.urlString = urlString;
  }

  /**
   * Downloads the page, collects every {@code <p class="wea">} text and prints the seventh one
   * from the end.
   *
   * @throws java.io.IOException if the URL is malformed or the page cannot be read
   * @throws IllegalStateException if the page contains fewer than seven matches
   * @throws Exception declared for compatibility with existing callers
   */
  public void run() throws Exception {
    URL url = new URL(urlString);

    // Matches are kept in a list rather than re-split from the comma-joined buffer, so a match
    // that itself contains a comma cannot shift the index.
    java.util.List<String> matches = new java.util.ArrayList<String>();

    // Start from a clean buffer so a second run() does not mix in the previous page's matches.
    sb.setLength(0);

    // try-with-resources closes the reader (and the underlying connection stream) even when
    // reading fails part-way through.
    try (BufferedReader reader =
        new BufferedReader(new InputStreamReader(url.openStream(), "UTF-8"))) {
      String line;
      while ((line = reader.readLine()) != null) {
        Matcher m = WEA_PATTERN.matcher(line);
        while (m.find()) {
          array = m.group(1);
          matches.add(array);
          sb.append(array).append(',');
        }
      }
    }

    if (matches.size() < POSITION_FROM_END) {
      throw new IllegalStateException(
          "Expected at least " + POSITION_FROM_END + " <p class=\"wea\"> elements but found "
              + matches.size() + " at " + urlString);
    }
    System.out.println(matches.get(matches.size() - POSITION_FROM_END));
  }
}

 

UTF-8 编码格式(带注释的版本)

 

import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.HttpURLConnection;
import java.net.URL;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.util.Arrays;


/**
 * Downloads a web page and prints the text of one {@code <p class="wea">...</p>} element.
 *
 * <p>The page is read line by line as UTF-8. Every match of the pattern is collected, and the
 * seventh match counted from the end is written to standard output.
 */
public class Weather {
  /** Matches one {@code <p class="wea">} element; group 1 is its text. Compiled once. */
  private static final Pattern WEA_PATTERN = Pattern.compile("<p class=\"wea\">(.+?)</p>");

  /** Which match to print, counted from the end of the page (7 = seventh from last). */
  private static final int POSITION_FROM_END = 7;

  /** Address of the page to download. */
  String urlString;

  /** Text of the most recent match found by {@link #run()}. */
  String array;

  /** Text of every match found by the latest {@link #run()}, each followed by a comma. */
  StringBuffer sb = new StringBuffer("");

  /**
   * Runs the extraction against a fixed weather.com.cn page.
   *
   * @param args ignored
   * @throws Exception if the page cannot be downloaded or holds too few matches
   */
  public static void main(String[] args) throws Exception {
    Weather client = new Weather("http://www.weather.com.cn/weather/101181201.shtml");
    client.run();
  }

  /**
   * Creates a client for the given page.
   *
   * @param urlString address of the page to download
   */
  public Weather(String urlString) {
    this.urlString = urlString;
  }

  /**
   * Downloads the page, collects every {@code <p class="wea">} text and prints the seventh one
   * from the end.
   *
   * @throws java.io.IOException if the URL is malformed or the page cannot be read
   * @throws IllegalStateException if the page contains fewer than seven matches
   * @throws Exception declared for compatibility with existing callers
   */
  public void run() throws Exception {
    URL url = new URL(urlString);

    // Matches go into a list instead of being re-split from the comma-joined buffer, so a
    // match whose text contains a comma still counts as a single entry.
    java.util.List<String> matches = new java.util.ArrayList<String>();

    // Reset the buffer so repeated run() calls do not accumulate earlier results.
    sb.setLength(0);

    // The reader is closed automatically, releasing the connection stream on every path.
    try (BufferedReader reader =
        new BufferedReader(new InputStreamReader(url.openStream(), "UTF-8"))) {
      String line;
      while ((line = reader.readLine()) != null) {
        Matcher m = WEA_PATTERN.matcher(line);
        while (m.find()) {
          array = m.group(1);
          matches.add(array);
          // Data matching the pattern is also appended to sb, separated by commas.
          sb.append(array).append(',');
        }
      }
    }

    if (matches.size() < POSITION_FROM_END) {
      throw new IllegalStateException(
          "Expected at least " + POSITION_FROM_END + " <p class=\"wea\"> elements but found "
              + matches.size() + " at " + urlString);
    }
    // Take the seventh entry counted from the end.
    System.out.println(matches.get(matches.size() - POSITION_FROM_END));
  }
}

 

转载于:https://www.cnblogs.com/hellowzd/p/4991796.html

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值