1、该网站的PPT链接全部都在页面上,先用正则表达式手动提取所有链接,以txt文件的形式保存到指定位置,格式如下:
2、写一个Java类来处理这些链接,代码如下:
1 package platform; 2 3 import java.io.BufferedInputStream; 4 import java.io.BufferedOutputStream; 5 import java.io.BufferedReader; 6 import java.io.File; 7 import java.io.FileInputStream; 8 import java.io.FileNotFoundException; 9 import java.io.FileOutputStream; 10 import java.io.IOException; 11 import java.io.InputStreamReader; 12 import java.io.UnsupportedEncodingException; 13 import java.net.HttpURLConnection; 14 import java.net.URL; 15 import java.util.HashMap; 16 import java.util.Map; 17 18 import org.apache.http.HttpResponse; 19 import org.apache.http.client.ClientProtocolException; 20 import org.apache.http.client.methods.HttpPost; 21 import org.apache.http.impl.client.DefaultHttpClient; 22 23 public class TestQConDownload { 24 25 public static void main(String[] args) { 26 BufferedReader bufferedReader; 27 Str