-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathindex.js
149 lines (134 loc) · 5.14 KB
/
index.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
const Twitter = require('twitter');
const config = require('config');
const phantom = require('phantom');
const queue = require('queue');
const path = require('path');
let q = queue({
concurrency: config.get('archival.parallel'),
autostart: true,
});
const User = require(path.join(__dirname, 'lib', 'schemas', 'userSchema'));
const Tweet = require(path.join(__dirname, 'lib', 'schemas', 'tweetSchema'));
const twitter = new Twitter(config.get('twitter'));
const trackTweets = (_user) => {
const findUser = (user) => {
User.findOne({id_str: user.id_str}, (err, result) => {
if (err) return console.error(err);
if (result
&& (result.screen_name != user.screen_name
|| result.name != user.name
|| result.description != user.description
|| result.url != user.url
|| result.location != user.location
|| result.verified != user.verified)) return updateUser(user);
if (result) return startInterval(result);
createUser(user);
});
};
const createUser = (user) => {
new User({
id_str: user.id_str,
screen_name: user.screen_name,
name: user.name,
description: user.description,
url: user.url,
location: user.location,
verified: user.verified,
created_at: user.created_at,
}).save((err, result) => {
if (err || !result) return console.error(`Failed to create database entry for user '${user.screen_name}'!`);
findUser(user);
});
};
const updateUser = (user) => {
User.where({
id_str: user.id_str
}).update({
screen_name: user.screen_name,
name: user.name,
description: user.description,
url: user.url,
location: user.location,
verified: user.verified
}, (err, result) => {
if (err) console.error(err);
findUser(user);
})
};
const fetchTweets = (user) => {
Tweet.findOne({_user: user._id})
.sort({created_at: -1})
.exec((err, result) => {
if (err) return;
if (!result) result = {id_str: '0'};
twitter.get('statuses/user_timeline', {user_id: _user.id_str, since_id: parseInt(result.id_str), count: 200}, (error, result, response) => {
if (error || !result) return;
result.forEach((tweet) => {
if (tweet.user.id_str != user.id_str || !tweet || !tweet.id_str) return;
Tweet.findOne({id_str: tweet.id_str}, (err, result) => {
if (err) return console.error(err);
if (result) return;
new Tweet({
id_str: tweet.id_str,
coordinates: tweet.coordinates,
created_at: tweet.created_at,
possibly_sensitive: tweet.possibly_sensitive,
source: tweet.source,
scopes: tweet.scopes,
text: tweet.text,
_user: user._id,
}).save((err, result) => {
if (err) return console.error(`Failed to save new tweet from user '${user.screen_name}'!`);
console.log(`Saved new tweet from user '${user.screen_name}'!`);
q.push((cb) => {
(async function() {
console.log(`Archiving tweet ${tweet.id_str}...`);
const instance = await phantom.create();
const page = await instance.createPage();
await page.on("onResourceRequested", function(requestData) {
//console.info('Requesting', requestData.url)
});
const status = await page.open(`https://web.archive.org/save/https://twitter.com/${user.screen_name}/status/${tweet.id_str}`);
//console.log(status);
const content = await page.property('content');
//console.log(content);
await instance.exit();
Tweet.where({id_str: tweet.id_str}).update({
archive_link: `https://web.archive.org/web/https://twitter.com/${user.screen_name}/status/${tweet.id_str}`
}, (err, result) => {
if (err) return cb();
console.log(`Saved archive link for tweet ${tweet.id_str}.`);
cb();
});
}());
});
});
});
});
});
});
};
const calculateInterval = () => {
const userCount = config.get('trackedUsers').length;
const interval = Math.ceil(((60 * 15) / 1450) * userCount) * 1000;
return Math.max(5000, interval);
};
const startInterval = (user) => {
fetchTweets(user);
setInterval(() => {
fetchTweets(user);
}, calculateInterval());
};
findUser(_user);
};
if (config.get('web.enabled')) require(path.join(__dirname, 'server', 'server.js'));
if (config.get('archival.enabled')) process.nextTick(() => {
config.get('trackedUsers').forEach((user) => {
twitter.get('users/lookup', {screen_name: user}, (error, result, response) => {
if (error || !result ) console.error(`Failed to lookup user '${user}'!`);
result.forEach((user) => {
trackTweets(user);
});
});
});
});