(1)加入jar包
jsoup-1.6.1.jar
(2)测试文档
package com.jsoup.test;
import java.io.File;
import java.io.IOException;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.select.Elements;
/**
 * Minimal jsoup demo: parses a locally saved page and prints the text of
 * every element that carries the CSS class {@code ask-title}.
 */
public class JsoupTest {
    /**
     * Parses the saved file as UTF-8, selects the {@code ask-title} elements
     * and writes their combined text to standard output.
     *
     * @param args command-line arguments; not read
     * @throws IOException propagated from {@code Jsoup.parse} if the file cannot be loaded
     */
    public static void main(String[] args) throws IOException {
        File savedPage = new File("F:/webmagic/zhidao.baidu.com/2.json");
        // Third argument is the base URI handed to jsoup for this document.
        Document parsedPage = Jsoup.parse(savedPage, "UTF-8", "http://zhidao.baidu.com/");
        Elements titleElements = parsedPage.getElementsByClass("ask-title");
        String combinedText = titleElements.text();
        System.out.println("得到的结果是:" + combinedText);
    }
}
(3)文档结构