-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathcrawler.js
More file actions
54 lines (50 loc) · 1.31 KB
/
Copy pathcrawler.js
File metadata and controls
54 lines (50 loc) · 1.31 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
var http = require('http')
var cheerio = require('cheerio')
// Address of the course page that is fetched, parsed into chapters and printed below.
var url = 'http://www.imooc.com/learn/348'
/**
 * Extracts the chapter/video outline from the HTML of a course page.
 *
 * Every `.chapter` element yields one entry whose title is the trimmed text
 * of its `strong` descendants. Each `li` directly under a `.video` element
 * yields one video, read from its `.J-media-item` link.
 *
 * @param {string} html - Markup of the course page.
 * @returns {Array<{chapterTitle: string, videos: Array<{videoId: (string|undefined), videoTitle: string}>}>}
 *   Chapters in document order. `videoId` is whatever follows `video/` in the
 *   link's href (undefined when the href does not contain that segment).
 */
function filterChapters(html) {
  var $ = cheerio.load(html)
  var courseData = []

  $('.chapter').each(function () {
    var chapterNode = $(this)
    var chapter = {
      chapterTitle: chapterNode.find('strong').text().trim(),
      videos: []
    }

    chapterNode.find('.video').children('li').each(function () {
      var link = $(this).find('.J-media-item')
      var href = link.attr('href')

      // A list item without a media link (or a link without an href) has no
      // id to extract. Skip it instead of calling .split on undefined, which
      // would throw and abort parsing of the whole page.
      if (typeof href !== 'string') {
        return
      }

      chapter.videos.push({
        videoId: href.split('video/')[1],
        videoTitle: link.text().trim()
      })
    })

    courseData.push(chapter)
  })

  return courseData
}
/**
 * Writes a course outline to the console: each chapter title on its own
 * line, followed by one line per video showing its id and title.
 *
 * @param {Array<{chapterTitle: string, videos: Array<{videoId: string, videoTitle: string}>}>} courseData
 *   Chapters to print, in order.
 */
function printCourseInfo(courseData) {
  // Prints a single video entry beneath its chapter heading.
  function logVideo(entry) {
    console.log(' 【' + entry.videoId + '】' + entry.videoTitle + '\n')
  }

  // Prints the chapter heading, then every video it contains.
  function logChapter(chapter) {
    console.log(chapter.chapterTitle + '\n')
    chapter.videos.forEach(logVideo)
  }

  courseData.forEach(logChapter)
}
// Download the course page, then parse it into chapters and print the outline.
http.get(url, function (res) {
  var statusCode = res.statusCode

  // Anything other than a 2xx response is not the course page; report it and
  // drain the body so the socket is released instead of parsing an error page.
  if (statusCode < 200 || statusCode >= 300) {
    console.log('获取课程内容出错!')
    console.error('Unexpected HTTP status: ' + statusCode)
    res.resume()
    return
  }

  // Decode as UTF-8 at the stream level so a multi-byte character that is
  // split across two chunks is reassembled rather than corrupted by
  // stringifying each Buffer separately.
  res.setEncoding('utf8')

  var html = ''
  res.on('data', function (chunk) {
    html += chunk
  })
  res.on('end', function () {
    var courseData = filterChapters(html)
    printCourseInfo(courseData)
  })
}).on('error', function (err) {
  console.log('获取课程内容出错!')
  // Surface the underlying cause (DNS failure, refused connection, ...).
  console.error(err)
})