参考链接:
http://phantomjs.org/examples.html
PhantomJS是一个无界面(headless)浏览器,可用于网页截图和前端自动化测试。它基于WebKit内核(Safari使用的内核;Chrome早期也基于WebKit,后来改用其分支Blink),通过编写JavaScript脚本来请求、浏览和操作页面。学习时可参考官方示例: http://phantomjs.org/examples.html
1、安装phantomjs
从官网下载PhantomJS,选择自己需要的版本即可。我是在Windows下使用的,下载后直接解压,并将phantomjs.exe所在的目录添加到了环境变量PATH中,这样后续可以直接在命令行中调用phantomjs。
安装完成后在cmd里面输入phantomjs --version即可查看phantomjs版本信息。
2、python中使用phantomjs
import os
import collections
import logging
import subprocess
import posixpath
# Example job description passed to screenshot(). All values are placeholders.
page_info = dict(
    # Base URL; screenshot() joins it with 'page' to build the address to render.
    url='http://xxx.com/dashboard',
    # Path appended to 'url'.
    page='file/data_analyze.json',
    # Used as the base name of the output image (<subject>.png) and in log messages.
    subject='data_analyze',
    # Cookie settings forwarded to render.js as cname / cvalue / cdomain.
    cookie_name='xxx',
    cookie_value='xxx',
    cookie_domain='xxx',
)
def screenshot(page_info):
    """Render a page to ``<subject>.png`` by running PhantomJS with render.js.

    Args:
        page_info: Mapping with the keys 'url', 'page', 'subject',
            'cookie_name', 'cookie_value' and 'cookie_domain'.

    Returns:
        True when phantomjs exits with status 0. False when it exits with any
        other status or cannot be started; the failure is logged.
    """
    page = page_info['page']
    subject = page_info['subject']
    image_file = subject + '.png'

    # Delete any existing image with the same name before rendering.
    if os.path.exists(image_file):
        os.remove(image_file)

    # Ordered so the key=value arguments reach render.js in a fixed order.
    params = collections.OrderedDict()
    params['url'] = posixpath.join(page_info['url'], page)
    params['width'] = 1200
    params['height'] = 4096
    params['png'] = image_file
    params['cname'] = page_info['cookie_name']
    params['cvalue'] = page_info['cookie_value']
    params['cdomain'] = page_info['cookie_domain']

    # Adjust the phantomjs and render.js paths for the real environment.
    # The command is an argument list run without a shell, so characters such
    # as '&', ';', spaces or quotes in the URL or cookie values are passed to
    # render.js verbatim instead of being interpreted by the shell.
    cmd = [
        'phantomjs',
        '--ignore-ssl-errors=true',
        '--web-security=false',
        'render.js',
    ]
    cmd.extend('%s=%s' % (key, value) for key, value in params.items())

    try:
        status = subprocess.call(cmd)
    except OSError as exc:
        # Without a shell, a missing executable raises instead of returning a
        # non-zero status; report it the same way as any other failure.
        logging.error('screenshot for subject=%s could not start phantomjs: %s',
                      subject, exc)
        return False

    if status != 0:
        logging.error('screenshot for subject=%s with status=%s', subject, status)
        return False
    return True
if __name__ == '__main__':
    # Exit with a non-zero status when the screenshot fails, so a calling
    # script or scheduler can detect the failure.
    raise SystemExit(0 if screenshot(page_info) else 1)
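3、render.js的实现
PhantomJS官网有很多这样的例子,这里贴出官方示例rasterize.js的实现作为参考。注意:rasterize.js按位置接收参数(URL、输出文件名、尺寸、缩放比例),而上面的Python代码是以key=value的形式(url、width、height、png、cname、cvalue、cdomain)向render.js传参的,因此实际的render.js需要在此基础上自行解析这些参数,并根据cname/cvalue/cdomain设置cookie。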
"use strict";
/*
 * rasterize.js - PhantomJS script that opens a URL and renders it to a file.
 *
 * Usage: rasterize.js URL filename [paperwidth*paperheight|paperformat] [zoom]
 *
 * This runs under PhantomJS, not Node.js: the `webpage` and `system` modules
 * and the global `phantom` object come from the PhantomJS runtime, and the
 * code therefore sticks to ES5 syntax.
 *
 * Exit status: 0 after rendering, 1 on bad arguments or a failed page load.
 */
var page = require('webpage').create(),
    system = require('system'),
    // Pause between a successful load and rendering (presumably to let late
    // layout/painting settle before the snapshot is taken).
    RENDER_DELAY_MS = 200;

/** Print the command-line help. */
function printUsage() {
    console.log('Usage: rasterize.js URL filename [paperwidth*paperheight|paperformat] [zoom]');
    console.log(' paper (pdf output) examples: "5in*7.5in", "10cm*20cm", "A4", "Letter"');
    console.log(' image (png/jpg output) examples: "1920px" entire page, window width 1920px');
    console.log(' "800px*600px" window, clipped to 800x600');
}

/**
 * Parse a pixel dimension such as "800px".
 * Returns the positive integer value, or null when the text has none.
 */
function parseDimension(text) {
    var value = parseInt(text, 10);
    return (isNaN(value) || value <= 0) ? null : value;
}

/**
 * Apply the optional size argument to the page.
 *
 * For ".pdf" output the argument is a paper size ("W*H") or a paper format.
 * Otherwise an argument ending in "px" sets the viewport: "W*H" also clips
 * the rendering to that rectangle, while a single width renders the entire
 * page with a 4:3 viewport. Any other argument is ignored.
 *
 * Returns true on success, false when a pixel size cannot be parsed.
 */
function applySize(sizeArg, outputFile) {
    var parts = sizeArg.split('*'),
        width,
        height;

    if (outputFile.substr(-4) === ".pdf") {
        page.paperSize = parts.length === 2
            ? { width: parts[0], height: parts[1], margin: '0px' }
            : { format: sizeArg, orientation: 'portrait', margin: '1cm' };
        return true;
    }

    if (sizeArg.substr(-2) !== "px") {
        // Not a pixel size: keep the default viewport.
        return true;
    }

    if (parts.length === 2) {
        width = parseDimension(parts[0]);
        height = parseDimension(parts[1]);
        if (width === null || height === null) {
            return false;
        }
        page.viewportSize = { width: width, height: height };
        page.clipRect = { top: 0, left: 0, width: width, height: height };
        return true;
    }

    console.log("size:", sizeArg);
    width = parseDimension(sizeArg);
    if (width === null) {
        return false;
    }
    height = Math.floor(width * 3 / 4); // it's as good an assumption as any
    console.log("pageHeight:", height);
    page.viewportSize = { width: width, height: height };
    return true;
}

/**
 * Entry point: validate the arguments, configure the page, then load and
 * render it. Every phantom.exit() is followed by a return so the rest of
 * the function is not executed after exit has been requested.
 */
function main(args) {
    var address,
        output,
        zoom;

    if (args.length < 3 || args.length > 5) {
        printUsage();
        phantom.exit(1);
        return;
    }

    address = args[1];
    output = args[2];
    page.viewportSize = { width: 600, height: 600 };

    if (args.length > 3 && !applySize(args[3], output)) {
        console.log('Invalid size: ' + args[3]);
        phantom.exit(1);
        return;
    }

    if (args.length > 4) {
        // Command-line arguments are strings; zoomFactor is set as a number.
        zoom = parseFloat(args[4]);
        if (isNaN(zoom) || zoom <= 0) {
            console.log('Invalid zoom: ' + args[4]);
            phantom.exit(1);
            return;
        }
        page.zoomFactor = zoom;
    }

    page.open(address, function (status) {
        if (status !== 'success') {
            console.log('Unable to load the address!');
            phantom.exit(1);
            return;
        }
        window.setTimeout(function () {
            page.render(output);
            phantom.exit();
        }, RENDER_DELAY_MS);
    });
}

main(system.args);