nodejs做小爬虫 nodejs 学习 day3

最新推荐文章于 2024-05-04 09:56:38 发布

菜鸟啊啊啊啊21

最新推荐文章于 2024-05-04 09:56:38 发布

阅读量238

点赞数

分类专栏： jquery nodejs 文章标签： nodejs 爬虫

jquery 同时被 2 个专栏收录

15 篇文章 0 订阅

订阅专栏

nodejs

4 篇文章 0 订阅

订阅专栏

源码：

var http = require('http')
var cheerio = require('cheerio')
// Address of the page requested by the http.get call in this script.
var url = 'http://www.imooc.com/learn/348'

/**
 * Extracts the chapter/video outline from a course page.
 *
 * Result shape:
 *   [{
 *     chaptertitle: '',
 *     videos: [{ title: '', id: '' }]
 *   }]
 *
 * Each `.chapter` element yields one entry; its title is the text of the
 * `strong` descendants, and its videos come from the `li` children of the
 * `.video` descendants. A video's `id` is whatever follows `video/` in the
 * link's href (undefined when the href has no such segment).
 *
 * @param {string} html - Markup handed to cheerio.load.
 * @returns {Array<{chaptertitle: string, videos: Array<{title: string, id: (string|undefined)}>}>}
 *   Chapters in the order cheerio iterates them.
 */
function filechapters (html){
  var $ = cheerio.load(html)
  var coursedata = []

  $('.chapter').each(function(){
    var chapter = $(this)
    var chapterdata = {
      chaptertitle: chapter.find('strong').text(),
      videos: []
    }

    chapter.find('.video').children('li').each(function(){
      var video = $(this).find('.J-media-item')
      var href = video.attr('href')

      // An <li> without a linked media item has no href; calling .split on
      // undefined would throw and abort the whole scrape, so skip the entry.
      if (typeof href !== 'string') {
        return
      }

      chapterdata.videos.push({
        title: video.text(),
        id: href.split('video/')[1]
      })
    })

    coursedata.push(chapterdata)
  })

  return coursedata
}
/**
 * Writes a course outline to the console.
 *
 * For every chapter the title is logged followed by a newline character,
 * then one "[id]title" line is logged per video in that chapter.
 *
 * @param {Array<{chaptertitle: string, videos: Array<{title: string, id: string}>}>} coursedata
 *   Chapters to print, in order.
 */
function printcouseinfo (coursedata){
  // Logs a single video as "[id]title".
  function logVideo (video){
    console.log('[' + video.id + ']' + video.title)
  }

  // Logs the chapter heading, then each of its videos.
  function logChapter (chapter){
    console.log(chapter.chaptertitle + '\n')
    chapter.videos.forEach(logVideo)
  }

  coursedata.forEach(logChapter)
}

// Download the course page, then parse it with filechapters and print the
// resulting outline with printcouseinfo.
http.get(url, function(res){
  // Anything outside 2xx (redirect, error page) is not the course markup,
  // so report it instead of parsing it.
  if (res.statusCode < 200 || res.statusCode >= 300) {
    console.error('请求失败，状态码：' + res.statusCode)
    // Discard the body so the response stream is consumed.
    res.resume()
    return
  }

  // Decode at the stream level: appending raw Buffer chunks to a string
  // decodes each chunk separately and corrupts any multi-byte UTF-8
  // character that is split across two chunks.
  res.setEncoding('utf8')

  var html = ''
  res.on('data', function(data){
    html += data
  })
  res.on('end', function(){
    var coursedata = filechapters (html)
    printcouseinfo (coursedata)
  })
}).on('error', function(err){
  // Include the underlying reason rather than only a generic notice.
  console.error('出现错误', err.message)
})

菜鸟啊啊啊啊21

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
nodejs做小爬虫 nodejs 学习 day3

源码：var http = require('http');var url = 'http://www.imooc.com/learn/637';http.get(url,function(res){var html = '';res.on('data',function(data){html += data ;})res.on('end',functi
复制链接

扫一扫