爬取360指数三部曲
- 获取360用户的token
- 通过账号、密码、token模拟登录，获取cookie
- 设置cookie,爬取360指数
代码实现
<?php
class CrawlerOf360Data
{
private $curl;
/**
 * Builds the crawler by delegating cURL handle setup to init_curl_client().
 */
public function __construct()
{
    // All handle configuration lives in init_curl_client().
    $this->init_curl_client();
}
/**
 * Creates the cURL handle stored in $this->curl and applies its default options.
 *
 * The handle initially targets https://login.360.cn/, uses a 60 second timeout,
 * reads and writes cookies in cookie.txt next to this file, and returns
 * response bodies as strings instead of printing them.
 *
 * @throws \RuntimeException if curl_init() fails to create a handle.
 */
function init_curl_client() {
    $handle = curl_init();
    if ($handle === false) {
        // Fail loudly here instead of passing `false` to every curl_setopt() call below.
        throw new \RuntimeException('Unable to initialise a cURL handle');
    }

    $cookiePath = dirname(__FILE__).'/cookie.txt';

    $options = array(
        CURLOPT_URL => "https://login.360.cn/",
        CURLOPT_TIMEOUT => 60,
        // The same file is used as jar and source so cookies written by one
        // request are sent with the following ones.
        CURLOPT_COOKIEJAR => $cookiePath,
        CURLOPT_COOKIEFILE => $cookiePath,
        // NOTE(review): TLS host and peer verification are switched off here.
        // Kept as-is for compatibility, but confirm whether this is still
        // needed; it leaves the connection open to interception.
        CURLOPT_SSL_VERIFYHOST => 0,
        CURLOPT_SSL_VERIFYPEER => 0,
        CURLOPT_RETURNTRANSFER => 1,
    );

    // Options are applied one by one, in the original order, so a single
    // rejected option does not prevent the remaining ones from being set.
    foreach ($options as $option => $value) {
        curl_setopt($handle, $option, $value);
    }

    $this->curl = $handle;
}
function get360Data($name) {
$_tokenPostFields = array(
'callback' => 'jQuery18309010124561026427_1524021670433',
'src'=> 'pcw_360index',
'from'=> 'pcw_360index',
'charset'=> 'UTF-8',
'requestScema'=> 'https',
'o'=>