/**
 * Scrape one article page and store each of its paragraphs as a record.
 *
 * Downloads the page, converts it from GB2312 to UTF-8, strips list
 * numbering of the form "12、", then passes every non-empty <p>...</p> body
 * to $this->rhesis->addInfo(), using the first <h2>...</h2> body as the
 * 'author' field. Progress and failures are reported by echoing HTML.
 *
 * @return void
 */
public function fetchingData() {
    header('Content-Type: text/html; charset=utf-8');

    // NOTE(review): the host ends in ".com.com", which looks like a typo;
    // confirm the intended URL before relying on this scraper.
    $url = "http://www.itheima.com.com/2017/0329/23.html";

    // Fetch the page; file_get_contents() returns false on failure.
    $ret = file_get_contents($url);
    if ($ret === false) {
        echo 'Failed to fetch ' . $url;
        return;
    }

    // Convert the page from GB2312 to UTF-8; iconv() returns false when it
    // meets bytes it cannot convert.
    $ret = iconv('GB2312', 'UTF-8', $ret);
    if ($ret === false) {
        echo 'Failed to convert ' . $url . ' to UTF-8';
        return;
    }

    // NOTE(review): the original also called str_replace('', '', $ret) here,
    // which is a no-op (empty search string). The intended search text is not
    // recoverable from this file, so the call was dropped.

    // Strip list numbering such as "12、".
    $ret = preg_replace("/(\d+)、/", "", $ret);
    if (!is_string($ret)) {
        echo 'Failed to clean the content of ' . $url;
        return;
    }

    // Capture paragraph bodies. The original pattern escaped the opening
    // parenthesis and left an unmatched ")", so it never compiled; the lazy
    // quantifier keeps several paragraphs on one line as separate items.
    $pattern = '/<p>(.*?)<\/p>/i';
    $matches = [];
    preg_match_all($pattern, $ret, $matches);

    // Capture the first heading; fall back to an empty string when the page
    // has none instead of reading an undefined index.
    $titlePattern = '/<h2>(.*?)<\/h2>/i';
    $match = [];
    $title = '';
    if (preg_match($titlePattern, $ret, $match) === 1) {
        $title = $match[1];
    }

    if (empty($matches[1])) {
        return;
    }

    // Store each non-empty paragraph.
    foreach (array_filter($matches[1]) as $item) {
        $data = [
            'source'   => 'http://www.itcast.com',
            'author'   => $title,
            'content'  => $item,
            'add_time' => time(),
        ];

        $id = $this->rhesis->addInfo($data);
        if ($id > 0) {
            // $item is remote content, so escape it before echoing into the
            // HTML response. The original followed this with echo "" (a
            // no-op), so messages ran together; a line break separates them.
            echo htmlspecialchars($item, ENT_QUOTES | ENT_SUBSTITUTE, 'UTF-8')
                . ' add successful!<br/>';
        }
    }
}