package Dome01;

import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.io.OutputStreamWriter;
import java.net.MalformedURLException;
import java.net.URL;
import java.nio.charset.StandardCharsets;

/**
 * Fetches a web page with {@link java.net.URL} and saves a copy of it to a
 * local file, echoing every line to standard output along the way.
 *
 * <p>The page is decoded as UTF-8 and the copy is written as UTF-8. Because
 * the content is copied line by line, the saved file uses the platform line
 * separator regardless of the line endings served by the remote host.
 */
public class Test {

    /** Address of the page to fetch; change this to download a different page. */
    private static final String PAGE_URL = "http://www.w3cschool.cn/";

    /** Path of the file the page is saved to (relative to the working directory). */
    private static final String OUTPUT_FILE = "dome.html";

    /**
     * Downloads {@link #PAGE_URL}, prints each line to standard output and
     * writes it to {@link #OUTPUT_FILE}.
     *
     * <p>Failures are reported by printing the stack trace to standard error;
     * no exception propagates out of this method.
     *
     * @param args command-line arguments (unused)
     */
    public static void main(String[] args) {
        try {
            URL url = new URL(PAGE_URL);

            // try-with-resources closes both streams even when reading or
            // writing fails part-way through, and also closes the network
            // stream if the output file cannot be opened.
            try (BufferedReader reader = new BufferedReader(
                         new InputStreamReader(url.openStream(), StandardCharsets.UTF_8));
                 BufferedWriter writer = new BufferedWriter(
                         new OutputStreamWriter(new FileOutputStream(OUTPUT_FILE), StandardCharsets.UTF_8))) {
                String line;
                while ((line = reader.readLine()) != null) {
                    System.out.println(line);
                    writer.write(line);
                    // readLine() strips the line terminator, so add one back.
                    writer.newLine();
                }
            }
        } catch (MalformedURLException e) {
            // PAGE_URL is not a syntactically valid URL.
            e.printStackTrace();
        } catch (IOException e) {
            // Network failure, or the output file could not be written.
            e.printStackTrace();
        }
    }
}
使用 java.net.URL 类抓取网页
最新推荐文章于 2024-06-06 09:07:54 发布