PHP 模拟登录与网络爬虫

/**
 * Logs in to a remote site with the user's credentials, fetches a page
 * using the resulting session cookies, scrapes every `table.items` entry
 * from it and wraps the result in a "news" reply.
 *
 * @param mixed $data Unused by this method; kept for interface compatibility.
 * @param object $msg  Incoming message; must provide getToUsername(),
 *                     getFromUsername() and getCreateTime().
 * @param array $user  Must contain the keys "patron_barcode" and
 *                     "patron_password", which are posted as the login form.
 *
 * @return back Reply whose payload is array("data" => list of items), each
 *              item having the keys "Title", "Url", "Description", "PicUrl".
 *              The list is empty when the page could not be fetched or
 *              contains no matching table.
 */
private function findBook($data,$msg,$user){
	// NOTE(review): passing an array to CURLOPT_POSTFIELDS makes cURL send the
	// form as multipart/form-data; kept as in the original request.
	$post_fields = array(
		"bor_id" => $user["patron_barcode"],
		"bor_verification" => $user["patron_password"]
	);
	// NOTE(review): both URLs are blank in this snippet and must be filled in
	// with the real login / result-page addresses before this can work.
	$login_url = "";
	$data_url = '';
	$cookie_file = tempnam('temp','cookie');

	// Step 1: simulate the login so the session cookies land in the cookie jar.
	$ch = curl_init($login_url);
	curl_setopt($ch, CURLOPT_HEADER, 0);
	curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
	curl_setopt($ch, CURLOPT_POST, 1);
	curl_setopt($ch, CURLOPT_POSTFIELDS, $post_fields);
	curl_setopt($ch, CURLOPT_COOKIEJAR, $cookie_file);
	curl_exec($ch);
	// The cookie jar is only written out when the handle is released, so
	// release it explicitly before the second request reads the file.
	// (On PHP 8+ curl_close() is a no-op; unset() drops the handle there.)
	curl_close($ch);
	unset($ch);

	// Step 2: fetch the data page with the cookies obtained above.
	$ch = curl_init($data_url);
	curl_setopt($ch, CURLOPT_HEADER, 0);
	curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
	curl_setopt($ch, CURLOPT_COOKIEFILE, $cookie_file);
	$contents = curl_exec($ch);
	curl_close($ch);
	unset($ch);

	// The cookie file holds the user's session; do not leave it on disk.
	if (is_string($cookie_file) && is_file($cookie_file)) {
		unlink($cookie_file);
	}

	$back = array("data"=>array());
	$type = "news";

	// curl_exec() returns false on failure; only parse a real response body.
	if (is_string($contents) && $contents !== '') {
		$html = new simple_html_dom();
		$html->load($contents);

		foreach ($html->find('table[class=items]') as $item) {
			$tit = $item->find('div.itemtitle a',0);
			$des = $item->find('td.col2 table tbody tr',0);
			$mes = $item->find('td.libs a',0);
			$img = $item->find('td img',-1); // -1 selects the last image in the row

			// Any of the lookups may find nothing; fall back to empty strings
			// instead of dereferencing a missing node.
			$title = is_object($tit) ? str_replace(" ","",$tit->plaintext) : '';
			$libs  = is_object($mes) ? $mes->plaintext : '';

			$back['data'][] = array (
				"Title" => $title."\n".$libs,
				"Url" => is_object($tit) ? $tit->href : '',
				"Description" => is_object($des) ? str_replace(" ","",$des->plaintext) : '',
				"PicUrl" => is_object($img) ? $img->src : ''
			);
		}

		// Release the parsed DOM tree once the items have been extracted.
		$html->clear();
	}

	return new back($msg->getToUsername(),$msg->getFromUsername(),$back, $type, $msg->getCreateTime(),0);
}


HTML 解析使用的是 PHP Simple HTML DOM Parser。

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值