// 这是java 用Jsoup 解析网页源码
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import java.io.BufferedReader;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.URL;
import java.net.URLConnection;
/**
 * Demo: downloads a web page and parses its HTML source with Jsoup.
 */
public class JavaDemo {

    /**
     * Downloads the resource at {@code url}, decodes it with {@code encoding},
     * prints the Jsoup-parsed document to standard output and returns the raw text.
     *
     * @param url      absolute URL of the page to fetch
     * @param encoding charset name used to decode the response bytes, e.g. {@code "utf-8"}
     * @return the page source with every line terminated by {@code '\n'}, or
     *         {@code null} if fetching, decoding or parsing failed (the stack
     *         trace is printed in that case)
     */
    public static String getContent(String url, String encoding) {
        StringBuilder buffer = new StringBuilder();
        try {
            URLConnection uc = new URL(url).openConnection();
            // The stream is declared as its own resource so it is closed even
            // when the reader cannot be created (e.g. unsupported charset name).
            try (InputStream inputStream = uc.getInputStream();
                 BufferedReader reader =
                         new BufferedReader(new InputStreamReader(inputStream, encoding))) {
                String line;
                while ((line = reader.readLine()) != null) {
                    // Append each line exactly once; readLine() strips the terminator.
                    buffer.append(line).append('\n');
                }
            }
            String content = buffer.toString();
            Document parse = Jsoup.parse(content);
            System.out.println(parse);
            return content;
        } catch (Exception e) {
            // Best-effort demo behaviour: report the failure and signal it with null.
            e.printStackTrace();
            return null;
        }
    }

    /** Fetches the Douban movie home page as UTF-8 and prints the parsed document. */
    public static void main(String[] args) {
        String url = "https://movie.douban.com";
        String encoding = "utf-8";
        getContent(url, encoding);
    }
}
# 这是python
import urllib.request

# Fetch the page; the context manager closes the HTTP response once the
# body has been read, instead of leaving the connection open.
with urllib.request.urlopen("https://movie.douban.com") as response:
    html = response.read().decode('utf-8')
print(html)
看完之后,视觉冲击还是很大的。尤其对懒人来说,能敲简短的代码是多么幸福的事情!
当然,这是拿 Python 的强项去和 Java 的弱项对比,而且上面的 Java 代码块中还考虑了效率的问题。Java 要简写也是可以的:
/**
 * Compact variant: downloads the resource at {@code url} and returns its text.
 *
 * @param url      absolute URL of the page to fetch
 * @param encoding charset name used to decode the response bytes, e.g. {@code "utf-8"}
 * @return the page source with every line terminated by {@code '\n'}
 * @throws Exception if the URL is malformed, the charset name is unsupported,
 *                   or the connection cannot be opened or read
 */
public static String getContent(String url, String encoding) throws Exception {
    StringBuilder content = new StringBuilder();
    // Open the connection once, outside the loop; re-opening it per iteration
    // would re-read the first line of the page forever.
    try (BufferedReader reader = new BufferedReader(
            new InputStreamReader(new URL(url).openConnection().getInputStream(), encoding))) {
        String line;
        while ((line = reader.readLine()) != null) {
            content.append(line).append('\n');
        }
    }
    return content.toString();
}