1. 引入 Maven 依赖
<!-- jsoup -->
<dependency>
<groupId>org.jsoup</groupId>
<artifactId>jsoup</artifactId>
<version>1.10.2</version>
</dependency>
2.代码
import java.io.BufferedReader;
import java.io.FileReader;
import java.io.IOException;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.select.Elements;
public class JsoupTest {
/**
* 读HTML文件
* @param path
* @return
*/
public static String readHtml(String path) {
StringBuffer buff = new StringBuffer();
// 建立一个对象,它把文件内容转成计算机能读懂的语言