问题：URL 不匹配，获取不到要爬取的网页。代码如下：
/**
 * Gecco bean describing a CSDN search-result page.
 *
 * <p>The {@code @Gecco} annotation on this class declares the URL template
 * {@code http://so.csdn.net/so/search/s.do?p={page}&q={keyword}} and names two pipelines,
 * {@code consolePipeline} and {@code CSDNSearchListPipeline}. The class also provides a
 * {@link #main(String[])} entry point that configures and runs a crawl for one search URL.
 */
@Gecco(matchUrl="http://so.csdn.net/so/search/s.do?p={page}&q={keyword}", pipelines={"consolePipeline","CSDNSearchListPipeline"})
public class CSDNSearchPage implements HtmlBean {

    private static final long serialVersionUID = -8768911729454034269L;

    /** Request associated with this page; marked {@code @Request} (presumably injected by Gecco). */
    @Request
    private HttpRequest request;

    /** Marked {@code @RequestParameter}; shares its name with the {@code {page}} placeholder in matchUrl. */
    @RequestParameter
    private String page;

    /** Marked {@code @RequestParameter}; shares its name with the {@code {keyword}} placeholder in matchUrl. */
    @RequestParameter
    private String keyword;

    /**
     * Marked {@code @RequestParameter}.
     *
     * <p>NOTE(review): matchUrl has no {@code {siteType}} placeholder, so it is not clear from
     * this file where a value for this field would come from; confirm it is still needed.
     */
    @RequestParameter
    private String siteType;

    /**
     * Content selected by the CSS path {@code .search-list}.
     *
     * <p>NOTE(review): this is declared as a raw {@code List}; the intended element type is not
     * visible in this file. Confirm whether Gecco needs a parameterized type here to render the
     * list elements.
     */
    @HtmlField(cssPath = ".search-list")
    private List articleList;

    /** @return the request associated with this page */
    public HttpRequest getRequest() {
        return request;
    }

    /** @param request the request associated with this page */
    public void setRequest(HttpRequest request) {
        this.request = request;
    }

    /** @return the list bound to the {@code .search-list} selector */
    public List getArticleList() {
        return articleList;
    }

    /** @param articleList the list bound to the {@code .search-list} selector */
    public void setArticleList(List articleList) {
        this.articleList = articleList;
    }

    /** @return the {@code page} request parameter */
    public String getPage() {
        return page;
    }

    /** @param page the {@code page} request parameter */
    public void setPage(String page) {
        this.page = page;
    }

    /** @return the {@code keyword} request parameter */
    public String getKeyword() {
        return keyword;
    }

    /** @param keyword the {@code keyword} request parameter */
    public void setKeyword(String keyword) {
        this.keyword = keyword;
    }

    /** @return the {@code siteType} request parameter */
    public String getSiteType() {
        return siteType;
    }

    /** @param siteType the {@code siteType} request parameter */
    public void setSiteType(String siteType) {
        this.siteType = siteType;
    }

    /**
     * Builds the start request, obtains the pipeline factory from Spring, and runs the engine.
     *
     * @param args command-line arguments (unused)
     */
    public static void main(String[] args) {
        // Seed request: first result page for the keyword "Java".
        HttpGetRequest start = new HttpGetRequest("http://so.csdn.net/so/search/s.do?p=1&q=Java");
        start.setCharset("UTF-8");

        // The pipeline factory is looked up by bean name in the Spring context.
        // NOTE(review): the context is not closed here; whether run() blocks until the crawl
        // finishes is not visible in this file, so closing it is left to the reviewer.
        ApplicationContext ctx = new ClassPathXmlApplicationContext("applicationContext.xml");
        PipelineFactory springPipelineFactory = (PipelineFactory) ctx.getBean("springPipelineFactory");

        GeccoEngine.create()
                .pipelineFactory(springPipelineFactory)
                .classpath("com.wz.article")
                .start(start)
                .mobile(false)
                .run();
    }
}
报错信息:
希望大神指点迷津,不胜感激~