-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsubmissions.js
62 lines (48 loc) · 1.33 KB
/
submissions.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
var request = require("request"),
data = require(__dirname + "/data.js"),
utils = require(__dirname + "/utils.js");
/**
* Monitors the most recent 30 submissions for analysis. On
* the first run it scrapes the most recent 1000.
*/
var url = "http://api.thriftdb.com/api.hnsearch.com/items/_search" +
"?sortby=create_ts+desc" +
"&filter[fields][type]=submission";
var firsttime = false;
var offset = 0;
setTimeout(function() {
var scrape = arguments.callee;
if(!data.ready()) {
return setTimeout(scrape, 1000);
}
var options = {
url: url
}
if(firsttime) {
options.url += "&start=" + offset + "&limit=100";
} else {
options.url += "&limit=30";
}
request(options, function (error, response, body) {
if (error) {
console.log("scrape.error (submissions.js#36) " + error);
return setTimeout(scrape, 1000);
};
var jbody = JSON.parse(body);
if(jbody.results && jbody.results.length > 0) {
for(var i=0; i<jbody.results.length; i++) {
var item = jbody.results[i].item;
var domain = utils.baseurl(item.url || "selfpost")
data.queueDomain(domain);
data.queueUser(item.username, null, true);
}
}
if(firsttime && offset != 900) {
offset += 100;
return setTimeout(scrape, 1000);
}
firsttime = false;
offset = 0;
return setTimeout(scrape, 60000);
});
}, 1000);