Java 爬取 27270 的代码 @wangfupeng
我就直接贴代码了。
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.scheduling.annotation.Scheduled;
import org.springframework.stereotype.Component;
import org.springframework.util.StringUtils;
@Component
public class FileSchedule {
public static final Logger logger = LoggerFactory.getLogger(FileSchedule.class);
@Autowired
Www27270comClientWrapper www27270comClientWrapper;
@Autowired
PictureCategoryService pictureCategoryService;
@Autowired
PictureService pictureService;
@Scheduled(cron="0 0 * * * ?")
public void getMethod() {
for (int page = 1; page < 200; page++) {
String meinvtupianString = www27270comClientWrapper.meinvtupian("list_11_" + page);
String meinvtupianBoxDiv = HtmlUtil.getHtmlString(meinvtupianString, "<div class=\"MeinvTuPianBox\">", "</div>", 1, 0);
String meinvtupianBoxDivUl = HtmlUtil.getHtmlString(meinvtupianBoxDiv, "<ul>", "</ul>", 1, 0);
String[] meinvtupianBoxDivUlLis = meinvtupianBoxDivUl.split("</li>");
for (int i = 0; i < meinvtupianBoxDivUlLis.length - 1; i++) {
String meinvtupianBoxDivUlLi = meinvtupianBoxDivUlLis[i];
String pictureUrl = HtmlUtil.getHtmlString(meinvt