因为项目中要用到天气信息，在网上找了一些免费的API，但它们不是有调用限制，就是返回的结果不令人满意。后来看了百度的天气信息，觉得比较合适，于是决定用爬虫把它抓取下来。
在百度上搜索"北京天气"，将浏览器地址栏中的地址复制下来，作为爬虫的请求地址。
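添加jar包（Maven依赖）：
<dependency>
    <groupId>org.jsoup</groupId>
    <artifactId>jsoup</artifactId>
    <version>1.10.3</version>
</dependency>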
抓取程序：
package com.orange.utils;
import java.io.IOException;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;
public class TestWeather {
private static String weatherUrl = "http://www.baidu.com/baidu?tn=monline_3_dg&ie=utf-8&wd=%E5%8C%97%E4%BA%AC%E5%A4%A9%E6%B0%94";
public static void getWeather() {
String userAgent = UserAgentUtil.getUserAgents();
try {
Document doc = Jsoup.connect(weatherUrl).userAgent(userAgent).timeout(5000).get();
Elements a = doc.getElementsByClass("op_weather4_twoicon").get(0).getElementsByTag("a");
for (Element element : a) {
String quality = "";
String current = "";
String today = "";
//只有当天才有实时温度
if (!element.getElementsByClass("op_weather4_twoicon_sh