如果出现正则内容出现东西过多,再增加一个(),group一下
完全原创,呕心沥血呀
package com.zzk.cn;
import java.awt.List;
import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.MalformedURLException;
import java.net.URL;
import java.net.URLConnection;
import java.util.ArrayList;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
public class TestSun {
public static void main(String[] args) {
URL url = null;
URLConnection conn = null;
InputStream in = null;
InputStreamReader isr = null;
BufferedReader br = null;
try {
url = new URL("http://www.weather.com.cn/weather/101010100.shtml");
conn = url.openConnection();
in = conn.getInputStream();
isr = new InputStreamReader(in,"utf8");
br = new BufferedReader(isr);
String line = "";
String info="";
while (null != (line = br.readLine())) {
//System.out.println(line);
info+=line;
}
//System.out.println(info);
Pattern p=Pattern.compile("div\\sclass=.weatherTopright.*?</div>");//正则获取网页大致信息
Matcher m=p.matcher(info);
String s1="";
while(m.find()) {
s1=m.group();
//System.out.println(s1);
}
String s2="";
Pattern p1=Pattern.compile("bold;.>(\\d+):(\\d+)</strong>");//正则获取网页日出日落信息
//Pattern p1=Pattern.compile("<(/?\\s?br\\b)>");
Matcher m1=p1.matcher(s1);
//System.out.println(s1);
ArrayList<String> a = new ArrayList<String>();
while(m1.find()) {
//m1.group(1);
String s=m1.group(1);
String s0=m1.group(2);
String result = s+":"+s0;
a.add(result);
}
System.out.println(a.get(0));
System.out.println(a.get(1));
// System.out.println(a.get(2));
// System.out.println(a.get(3));
Pattern p2=Pattern.compile("div\\sclass=.todayLiving.*?</div>");//正则获取网页大致信息
Matcher n=p2.matcher(info);
String t1="";
while(n.find()) {
t1=n.group();
//System.out.println(t1);
}
String t2="";
Pattern p3=Pattern.compile("<blockquote>\\s(.*?)\\s</blockquote>");//正则获取网页日出日落信息
//Pattern p1=Pattern.compile("<(/?\\s?br\\b)>");
ArrayList<String> b = new ArrayList<String>();
Matcher n1=p3.matcher(t1);
while(n1.find()) {
t2=n1.group();
//System.out.println(n1.group());
String detail=t2;
b.add(detail);
}
String guoming=b.get(0).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String wuran=b.get(1).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String ganmao=b.get(2).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String ziwaixian=b.get(3).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String chuanyi=b.get(4).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String shushi=b.get(5).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String huazhuang=b.get(6).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String meifa=b.get(7).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String xiche=b.get(8).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String lukuang=b.get(9).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String jiaotong=b.get(10).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String lvyou=b.get(11).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String yundong=b.get(12).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String chenlian=b.get(13).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String diaoyu=b.get(14).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String huachuan=b.get(15).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String yuehui=b.get(16).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String guangjie=b.get(17).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String liangshai=b.get(18).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String yusan=b.get(19).replaceAll("<blockquote>", "").replaceAll("</blockquote>", "").replaceAll(" ", "");
String t3="";
Pattern p4=Pattern.compile("<dt>(.*?)</dt>.*?target=.*?blank.*?>(.*?)<b\\sclass=.*?>(.*?)</b>");//正则获取网页日出日落信息
//Pattern p1=Pattern.compile("<(/?\\s?br\\b)>");
ArrayList<String> c = new ArrayList<String>();
Matcher n2=p4.matcher(t1);
while(n2.find()) {
t3=n2.group(2);
System.out.println(n2.group(3));
String index=t3;
c.add(index);
}
String iguoming=c.get(0).replaceAll(" ", "");
String iwuran=c.get(1).replaceAll(" ", "");
String iganmao=c.get(2).replaceAll(" ", "");
String iziwaixian=c.get(3).replaceAll(" ", "");
String ichuanyi=c.get(4).replaceAll(" ", "");
String ishushi=c.get(5).replaceAll(" ", "");
String ihuazhuang=c.get(6).replaceAll(" ", "");
String imeifa=c.get(7).replaceAll(" ", "");
String ixiche=c.get(8).replaceAll(" ", "");
String ilukuang=c.get(9).replaceAll(" ", "");
String ijiaotong=c.get(10).replaceAll(" ", "");
String ilvyou=c.get(11).replaceAll(" ", "");
String iyundong=c.get(12).replaceAll(" ", "");
String ichenlian=c.get(13).replaceAll(" ", "");
String idiaoyu=c.get(14).replaceAll(" ", "");
String ihuachuan=c.get(15).replaceAll(" ", "");
String iyuehui=c.get(16).replaceAll(" ", "");
String iguangjie=c.get(17).replaceAll(" ", "");
String iliangshai=c.get(18).replaceAll(" ", "");
String iyusan=c.get(19).replaceAll(" ", "");
//System.out.println(iguoming);
} catch (MalformedURLException e) {
e.printStackTrace();
} catch (IOException e) {
e.printStackTrace();
} finally {
try {
if (null != br) {
br.close();
}
} catch (IOException e) {
e.printStackTrace();
}
br = null;
try {
if (null != isr) {
isr.close();
}
} catch (IOException e) {
e.printStackTrace();
}
isr = null;
try {
if (null != in) {
in.close();
}
} catch (IOException e) {
e.printStackTrace();
}
in = null;
}
}
}
输出: 07:32
16:52
天气较好,您在出门的时候无须带雨伞。
极不易发
良
易发
弱
寒冷
较不舒适
保湿
一般
较适宜
干燥
良好
一般
较不宜
较不宜
不宜
不适宜
较不适宜
较不宜
基本适宜
不带伞
不带伞