依赖
-- Data definition: global list of crawl targets.
-- Each entry carries three string fields: `url`, `selector` and `content`.
-- NOTE(review): presumably these feed SpiderProc(url, selector, contentname);
-- confirm against the caller.
SpiderWebs = {
  {
    url = 'https://www.oschina.net',
    selector = 'a.news-link',
    content = 'div.content',
  },
}
-- Crawl a URL.
-- Example values (the same ones stored in SpiderWebs[1]):
--   url:      'https://www.oschina.net'
--   selector: 'a.news-link'
--   content:  'div.content'
function SpiderProc(url, selector, contentname)
local htmlparser = require('htmlparser')
local ret,text = ExecuteURL(math.random(1,10), url, true)
local root = htmlparser.parse(text,10000)
print(" chapters")
local sel, chapters = root(selector), {}
for k,v in pairs(sel) do
local href = v.attributes['href']
if not SpiderUrl[href] then
local title = v.attributes['title']
--print(k,v.name, href)
local ret,resp = ExecuteU