forked from grant/npm-crawler
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathindex.js
57 lines (48 loc) · 1.15 KB
/
index.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
var jsdom = require('jsdom'),
request = require('request'),
url = require('url'),
npm = require("npm");
var configObject = {
"dev": false,
"loglevel": "error"
};
getData(0);
function getData(j) {
request({
uri: 'https://npmjs.org/browse/all/' + j
}, function (err, response, body) {
if (err && response.statusCode !== 200) {
console.log('Request error.');
}
npm.load(configObject, function (er, npm) {
jsdom.env({
html: body,
scripts: ['http://code.jquery.com/jquery-1.6.min.js'],
done: function (err, window) {
var $ = window.jQuery;
var $rows = $('body').find('.row');
if ($rows.length > 1) {
$rows.each(function (i, item) {
var $a = $(item).find('a');
var module = $a.html();
crawled(module);
});
getData(j + 1);
}
}
});
});
});
}
var modules = [];
var i = 0;
var fs = require('fs');
function crawled(module) {
modules.push(module);
if (i % 100 === 0) {
fs.writeFile("modules.txt", modules, function(err) {
console.log('saved!');
});
}
++i;
}