<dependency>
<groupId>org.jsoup</groupId>
<artifactId>jsoup</artifactId>
<version>1.11.3</version>
</dependency>
// Jsoup通过字符串读取html内容
Jsoup.parseBodyFragment(htmlContent)
// Load HTML from a URL: issue an HTTP GET and parse the response into a Document.
// `url` is expected to be provided by the surrounding code.
String browserUserAgent = "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/71.0.3578.98 Safari/537.36";
int timeoutMillis = 10000;
Document document = Jsoup.connect(url)
        .userAgent(browserUserAgent)  // send a desktop-Chrome User-Agent header
        .ignoreContentType(true)      // do not fail on responses whose Content-Type is not HTML/XML
        .timeout(timeoutMillis)
        .get();
// Jsoup获取元素举例:
Elements ps = Jsoup.parseBodyFragment(htmlContent).select("body").get(0).getElementsByTag("p");
document.select("div[class=category-content j-cover-overflow]").get(0);
document.select("div[id=j-course-outline]").get(0).select("div[class=outline]").get(0).select("div[class=f-richEditorText]").get(0).getElementsByTag("p");
// Example of reading the text content of an element.
// `p` is assumed to be a single <p> element, e.g. one entry of `ps` — TODO confirm.
// Element.select() may match the context element itself, so calling
// select("span").get(0) again on the first <span> returns that same <span>;
// one lookup is enough.
Element span = p.select("span").get(0);
String text = span.text();
Jsoup API reference: https://jsoup.org/apidocs/org/jsoup/Jsoup.html
Jsoup examples: https://www.javatpoint.com/jsoup-example-print-form-parameters