-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathserver.js
445 lines (375 loc) · 13.2 KB
/
server.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
var express = require('express');
var bodyParser = require('body-parser');
var http = require('http');
var request = require('request');
var axios = require('axios');
var cheerio = require('cheerio');
var sleep = require('sleep');
var fs = require('fs');
var config = require('config');
// Express application instance; the route handlers further down are registered on it.
let app = express();
app.use(bodyParser.json()); // for parsing application/json
app.use(bodyParser.urlencoded({ extended: true })); // for parsing application/x-www-form-urlencoded
// In-memory store of scraped users, keyed by username (filled by addOrgToUser and
// addCreateDateMembershipsAndPledgeStatus).
const USERS = {};
// In-memory store of scraped organizations, keyed by organization name
// (filled by addOrgWithDateAndMembers).
const ORGANIZATIONS = {};
// Set from `recordsTotal` of the organization list response in getPartialOrgList;
// undefined until the first successful list request.
var totalUsers;
// Session id read from the `sessid` configuration key; setupHeaders sends it as
// the `authsessid` cookie.
var sessid = config.get('sessid')
// Flipped to true by setupHeaders once the axios default headers are in place.
var configured = false
// Refuse to start while the configuration still holds the placeholder value.
if (sessid.toString() === "REPLACEME") {
console.log("You have not configured your sessid yet!")
console.log("Quitting...")
process.exit()
}
// helper fns
/**
 * Builds the community-site URL for an organization.
 *
 * Names that contain at least one space are first passed through
 * urlizeName; any other name is used exactly as given.
 *
 * @param {string} name - Organization name or slug.
 * @returns {string} Absolute URL of the organization page.
 */
function orgNameToURL(name) {
  const hasSpaces = name.split(' ').length > 1;
  const slug = hasSpaces ? urlizeName(name) : name;
  return `https://community.dualthegame.com/organization/${slug}`;
}
/**
 * Appends one line to `log.txt` in the current working directory.
 *
 * Several call sites pass more than one argument, console.log style. Every
 * argument is written, separated by single spaces, so none of them is
 * silently dropped. A single-argument call produces the same line as before.
 *
 * @param {*} output - First value to log.
 * @param {...*} rest - Optional further values appended to the same line.
 */
function writeLog(output, ...rest) {
  const line = [output, ...rest].map(String).join(' ');
  fs.appendFile('log.txt', line + '\n', function (err) {
    // Logging is best-effort: report the failure on the console, never throw.
    if (err) {
      console.log(err);
    }
  });
}
/**
 * Records that `user` belongs to `org` in the in-memory USERS store.
 *
 * A user record may already exist without an `organizations` map (records
 * created by addCreateDateMembershipsAndPledgeStatus start out that way), so
 * the map and the `user` field are back-filled instead of assumed.
 *
 * @param {string} user - Username; key into USERS.
 * @param {string} org - Organization name; key into the user's organizations.
 * @param {string} joinDate - Join date text as scraped.
 * @param {string} status - Membership status text as scraped.
 */
function addOrgToUser(user, org, joinDate, status) {
  if (USERS[user] === undefined) {
    USERS[user] = { user: user, organizations: {} };
  }
  const record = USERS[user];
  if (record.user === undefined) {
    record.user = user;
  }
  if (record.organizations === undefined) {
    record.organizations = {};
  }
  record.organizations[org] = { joinDate, status };
}
/**
 * Stores an organization and its members in the in-memory ORGANIZATIONS store.
 *
 * The organization entry (with its date) is created only on first sight; on
 * later calls the existing date is kept and members are added or overwritten.
 *
 * @param {string} org - Organization name; key into ORGANIZATIONS.
 * @param {string} date - Date stored on a newly created entry.
 * @param {Array<Object>} membersArray - Members carrying `name`, `joinDate`,
 *   `status` and `createdDate` properties.
 */
function addOrgWithDateAndMembers(org, date, membersArray) {
  if (ORGANIZATIONS[org] === undefined) {
    ORGANIZATIONS[org] = { date, members: {} };
  }
  membersArray.forEach((member) => {
    const entry = {
      joinDate: member.joinDate,
      status: member.status,
      createdDate: member.createdDate,
    };
    ORGANIZATIONS[org].members[member.name] = entry;
  });
}
/**
 * Stores a user's account creation date and pledge status in USERS.
 *
 * A record created here carries the `user` field, matching records created by
 * addOrgToUser, so getFormattedUsers never emits a nameless user.
 * `organizations` is deliberately left unset: the /user routes treat a record
 * without it as "not fully loaded yet".
 *
 * @param {string} username - Username; key into USERS.
 * @param {string} createdDate - Account creation date text as scraped.
 * @param {string} pledgeStatus - Pledge badge name, or 'none'.
 */
function addCreateDateMembershipsAndPledgeStatus(username, createdDate, pledgeStatus) {
  if (USERS[username] === undefined) {
    USERS[username] = { user: username };
  }
  USERS[username].createdDate = createdDate;
  USERS[username].pledgeStatus = pledgeStatus;
}
// Root of the community site; getUsersFromOrgName builds organization page URLs from it.
const BASE_URL = 'https://community.dualthegame.com';
/**
 * Flattens an array by one level.
 *
 * Array items are spliced into the result; any other item is appended as-is.
 *
 * @param {Array} arr - Array whose items may themselves be arrays.
 * @returns {Array} New array, one level flatter than `arr`.
 */
function flatMap(arr) {
  let flattened = [];
  arr.forEach((item) => {
    flattened = flattened.concat(item);
  });
  return flattened;
}
/**
 * Turns a display name into a URL slug: lower-cased, with every space
 * replaced by a hyphen.
 *
 * @param {string|undefined} name - Name to convert.
 * @returns {string|undefined} The slug, or undefined (after reporting on
 *   stderr) when `name` is undefined.
 */
function urlizeName(name) {
  if (name === undefined) {
    console.error('Sad face');
    return undefined;
  }
  const lowered = name.toLowerCase();
  return lowered.replace(/ /g, '-');
}
/**
 * Creates a builder for the form-encoded body of organization list requests.
 *
 * Each generator keeps its own `draw` counter. It is incremented on every
 * call, so successive requests carry draw=1, draw=2, ... (the counter was
 * previously pinned to 1 by an assignment where an increment was meant).
 *
 * @returns {function(number): string} Builder taking the `start` offset and
 *   returning the request body for a page of length 10, ordered by column 4
 *   descending.
 */
function dataStringFnGenerator() {
  let count = 0;
  return function (start) {
    count += 1;
    return `draw=${count}&order%5B0%5D%5Bcolumn%5D=4&order%5B0%5D%5Bdir%5D=desc&start=${start}&length=10`;
  };
}
/**
 * Pulls the CSRF token out of a Set-Cookie response header.
 *
 * Prefers the cookie literally named `csrftoken`; if none is found, falls
 * back to the value of the first cookie in the header.
 *
 * @param {string|string[]|undefined} setCookieHeader - Raw header value(s).
 * @returns {string} The token value.
 * @throws {Error} When the response carried no Set-Cookie header at all.
 */
function extractCsrfToken(setCookieHeader) {
  if (setCookieHeader === undefined || setCookieHeader === null) {
    throw new Error('response carried no Set-Cookie header');
  }
  const cookies = Array.isArray(setCookieHeader) ? setCookieHeader : [setCookieHeader];
  for (const cookie of cookies) {
    const match = /^\s*csrftoken=([^;]*)/.exec(String(cookie));
    if (match) {
      return match[1];
    }
  }
  // No cookie named csrftoken: take the first cookie's value instead.
  const joined = String(setCookieHeader);
  const startIndex = joined.indexOf('=') + 1;
  const endIndex = joined.indexOf(';');
  return endIndex === -1 ? joined.slice(startIndex) : joined.slice(startIndex, endIndex);
}

/**
 * Fetches the organizations page to obtain a CSRF token, then installs the
 * cookie, CSRF and browser-like headers as axios defaults and marks the
 * module as configured.
 *
 * Failures are best-effort: the reason is written to the log and the
 * returned promise resolves to undefined instead of rejecting, so callers
 * can chain `.then` without their own error handling.
 *
 * @returns {Promise<string|undefined>} The CSRF token, or undefined on failure.
 */
function setupHeaders() {
  return axios.get('https://community.dualthegame.com/organizations').then(resp => {
    const csrfToken = extractCsrfToken(resp.headers['set-cookie']);
    let cookieHeader = `cookieconsent_dismissed=yes; csrftoken=${csrfToken};`;
    if (sessid !== undefined) {
      cookieHeader += 'authsessid=' + sessid + ';';
    } else {
      writeLog('No authsessid. Functionality limited to organization related data only.');
    }
    const defaults = axios.defaults.headers.common;
    defaults['Cookie'] = cookieHeader;
    defaults['X-CSRFToken'] = csrfToken;
    defaults['X-Requested-With'] = 'XMLHttpRequest';
    defaults['Host'] = 'community.dualthegame.com';
    defaults['Referer'] = 'https://community.dualthegame.com/organizations';
    defaults['Origin'] = 'https://community.dualthegame.com';
    configured = true;
    return csrfToken;
  }).catch(err => {
    const reason = err && err.message ? err.message : String(err);
    writeLog('Problem setting up request headers: ' + reason);
  });
}
/**
 * Downloads the complete organization list, ten entries per request.
 *
 * The first page is requested on its own because getPartialOrgList records
 * the server-reported total (`totalUsers`) as a side effect. Only then are
 * the remaining pages requested, in parallel, up to that total. Previously
 * every page was queued synchronously, before any response could set the
 * total, so 140 requests were always sent and anything past offset 1400 was
 * silently skipped.
 *
 * @param {Object} res - Express response, handed through to getPartialOrgList.
 * @returns {Promise<Array>} Resolves to one entry per page, in page order;
 *   each entry is whatever getPartialOrgList resolved to for that page.
 */
function buildOrgList(res) {
  const PAGE_SIZE = 10;
  // Used only when the first page did not yield a total (e.g. it failed).
  const FALLBACK_LIMIT = 1400;
  const dataStringBuilder = dataStringFnGenerator();

  return getPartialOrgList(res, dataStringBuilder(0)).then(firstPage => {
    const limit = totalUsers === undefined ? FALLBACK_LIMIT : totalUsers;
    const pages = [firstPage];
    for (let start = PAGE_SIZE; start < limit; start += PAGE_SIZE) {
      pages.push(getPartialOrgList(res, dataStringBuilder(start)));
    }
    return Promise.all(pages);
  });
}
/**
 * Requests one page of the organization list and extracts the organization
 * slugs from it.
 *
 * Side effect: stores the response's `recordsTotal` in the module-level
 * `totalUsers`.
 *
 * On failure the error is logged, the HTTP response is ended with 'fail',
 * and the promise resolves to an empty array, so callers that flatten the
 * pages never receive an undefined entry.
 *
 * @param {Object} res - Express response, ended with 'fail' on error.
 * @param {string} data - Form-encoded request body (see dataStringFnGenerator).
 * @returns {Promise<string[]>} Organization slugs of this page; [] on failure.
 */
function getPartialOrgList(res, data) {
  return axios.post('https://community.dualthegame.com/organizations/list_ajax', data).then(resp => {
    totalUsers = resp.data.recordsTotal;
    return resp.data.data.map(org => {
      // NOTE(review): assumes `org.name` is an anchor of the form
      // <a href="/organization/slug">; the first 10 characters (up to and
      // including the leading slash) and everything from the last quote on
      // are cut away - confirm against a live response.
      const hrefPath = org.name.slice(10, org.name.lastIndexOf('"'));
      return hrefPath.slice(hrefPath.indexOf('/') + 1);
    });
  }).catch(err => {
    writeLog(err);
    res.end('fail');
    return [];
  });
}
/**
 * Scrapes an organization page, records its members in USERS and
 * ORGANIZATIONS, and returns the distinct usernames found.
 *
 * On failure the URL and the reason are logged and the promise resolves to
 * an empty array. The reason is the HTTP status text when the server
 * answered, otherwise the error itself (timeouts and parsing errors carry no
 * `response`, which previously made the error handler itself throw).
 *
 * @param {string} name - Organization name; converted with urlizeName.
 * @returns {Promise<string[]>} Distinct member usernames; [] on failure.
 */
function getUsersFromOrgName(name) {
  name = urlizeName(name);
  const orgUrl = BASE_URL + '/organization/' + name;
  return axios.get(orgUrl, { timeout: 90000 }).then(resp => {
    const $ = cheerio.load(resp.data);

    // NOTE(review): join dates and statuses are matched to member links
    // purely by position; this presumes the three selectors yield one entry
    // per member in the same order - confirm against the page markup.
    const joinDates = $('#all_members').find('td:contains("-")')
      .map((i, el) => $(el).text())
      .get();
    const statuses = $('#all_members').find('tr > td + td')
      .map((i, el) => $(el).text())
      .get()
      .map(text => text.trim())
      .filter(text => text.includes('Member') || text.includes('Legate'));

    const uniqueUsers = {};
    const usersArray = $('#all_members td > a').map((index, el) => {
      const href = el.attribs.href;
      const username = href.slice(href.lastIndexOf('/') + 1);
      if (username.length > 0) {
        uniqueUsers[username] = true;
      }
      addOrgToUser(username, name, joinDates[index], statuses[index]);
      return { name: username, organization: name, joinDate: joinDates[index], status: statuses[index] };
    }).get();

    // Organization creation date: the 11 characters following "d:" in the
    // small print of the centered header.
    let created = $('div.text-center > p > small').text();
    const dateStart = created.indexOf('d:') + 2;
    created = created.slice(dateStart, dateStart + 11);
    addOrgWithDateAndMembers(name, created, usersArray);

    return Object.keys(uniqueUsers);
  }).catch(err => {
    const reason = err && err.response ? err.response.statusText : String(err);
    writeLog('URL FAIL: ' + orgUrl + '\n' + reason);
    return [];
  });
}
/**
 * Scrapes a user's profile page and stores the creation date and pledge
 * status in USERS.
 *
 * Always returns a promise, including for an undefined name, so callers can
 * chain `.then` unconditionally. Failures are logged together with the
 * username and reason, and the promise resolves to undefined.
 *
 * @param {string|undefined} name - Username as used in the profile URL.
 * @returns {Promise<{name: string, createdDate: string, pledgeStatus: string,
 *   organizations: string[]}|undefined>} Profile data, or undefined when the
 *   name is missing or the request/parsing failed.
 */
function getUserInfo(name) {
  if (name === undefined) {
    writeLog('getUserInfo fail. name undefined');
    return Promise.resolve(undefined);
  }
  return axios.get('https://community.dualthegame.com/accounts/profile/' + name).then(resp => {
    const $ = cheerio.load(resp.data);

    // Pledge status is the badge image's file name without its extension.
    let pledgeStatus = 'none';
    if ($('div.pledge_badge_anchor').length > 0) {
      const src = $('div.pledge_badge_anchor > img.pledge_badge').get(0).attribs.src;
      pledgeStatus = src.slice(src.lastIndexOf('/') + 1, src.lastIndexOf('.'));
    }

    // Account creation date: the text following "Joined:".
    const createdDate = $(`small:contains('Joined:')`).text().slice('Joined:'.length);

    // Organization names are only used for individual requests (/user/:username).
    const organizations = $('div.col-md-8 ul > li > a').map((i, el) => $(el).text()).get();

    addCreateDateMembershipsAndPledgeStatus(name, createdDate, pledgeStatus);
    return { name, createdDate, pledgeStatus, organizations };
  }).catch(err => {
    const reason = err && err.message ? err.message : String(err);
    writeLog('Problem getting user info. ' + name + ': ' + reason);
  });
}
// ======================================
// Begin ExpressJS Server / Endpoints
// ======================================
// use '/scrape' to scrape all orgs/users and fill database
// takes about 90s -- once completed, /stats will show summary
// /orgs & /users work only after /scrape
// Landing page: (re)configures the request headers, then tells the caller
// whether scraping can start. The handler previously never sent a response,
// leaving the browser hanging until it timed out.
app.get('/', (req, res) => {
  const failurePage = '<html>Could not configure request headers. See log.txt for details.</html>';
  setupHeaders()
    .then(() => {
      if (configured) {
        res.end(`<html>Request headers configured. <button onclick="document.location.href='/scrape';">Start scraping...</button></html>`);
      } else {
        res.end(failurePage);
      }
    })
    .catch(err => {
      writeLog('Problem configuring request headers: ' + err);
      res.end(failurePage);
    });
});
// Plain-text summary of how many users and organizations are currently held
// in the in-memory stores.
app.get('/stats', (req, res) => {
  const userCount = Object.keys(USERS).length;
  const orgCount = Object.keys(ORGANIZATIONS).length;
  res.end(`Number of users: ${userCount}\nNumber of Orgs: ${orgCount}`);
});
// Full scrape: CSRF setup -> organization list -> members of every
// organization -> profile of every distinct member. Responds once all stages
// have finished.
//
// The stages form one flat promise chain with a single rejection handler, so
// a failure in any stage is logged and answered instead of leaving the
// request hanging. The headless export to orgs.json / users.json runs only
// after the data has been collected (it used to run immediately, before any
// request had completed, and wrote empty files).
app.get('/scrape', (req, res) => {
  if (sessid === "REPLACEME" || sessid === undefined) {
    res.redirect('/');
    return;
  }

  // Message logged if the chain rejects; updated as the stages advance.
  let failureMessage = 'Problem loading organization data.';

  writeLog('Getting CSRF token...');
  setupHeaders()
    .then(() => {
      writeLog('Complete!\nBuilding list of organizations...');
      return buildOrgList(res);
    })
    .then(orgPages => {
      writeLog('Complete!\nBuilding master user list...');
      // Pages that failed to load may show up as undefined; skip them.
      const orgs = flatMap(orgPages).filter(org => org !== undefined);
      return Promise.all(orgs.map(org => getUsersFromOrgName(org)));
    })
    .then(usersPerOrg => {
      writeLog('Complete!\nScraping user data...');
      failureMessage = 'Problem loading user data.';
      const seen = {};
      flatMap(usersPerOrg).forEach(username => {
        if (username !== undefined) {
          seen[username] = true;
        }
      });
      return Promise.all(Object.keys(seen).map(username => getUserInfo(username)));
    })
    .then(() => {
      const userCount = Object.keys(USERS).length;
      writeLog('Complete!\n***\n' + userCount + ' users added.');
      const headless = config.get('headless');
      if (headless === true || headless === 'true') {
        getFormattedOrgs();
        getFormattedUsers();
      }
      // getPartialOrgList may already have ended the response with 'fail'.
      if (!res.headersSent) {
        res.end('Scraping complete. ' + userCount + ' users added.');
      }
    })
    .catch(err => {
      writeLog(failureMessage + ' ' + err);
      if (!res.headersSent) {
        res.end('Scraping failed. ' + failureMessage);
      }
    });
});
/**
 * Converts the ORGANIZATIONS store into an array of plain records and writes
 * that array, as JSON, to ./orgs.json (asynchronously; write errors are
 * logged).
 *
 * @returns {Array<{name: string, createdDate: *, members: Array<{name: string,
 *   joinDate: *, status: *}>}>} One record per organization, in store order.
 */
function getFormattedOrgs() {
  const betterORGANIZATIONS = Object.keys(ORGANIZATIONS).map((orgName) => {
    const stored = ORGANIZATIONS[orgName];
    // An organization stored without a members map yields an empty list.
    const roster = stored.members
      ? Object.keys(stored.members).map((memberName) => ({
          name: memberName,
          joinDate: stored.members[memberName].joinDate,
          status: stored.members[memberName].status
        }))
      : [];
    return { name: orgName, createdDate: stored.date, members: roster };
  });

  fs.writeFile("./orgs.json", JSON.stringify(betterORGANIZATIONS), (err) => {
    if (err) {
      writeLog(err);
    }
  });

  return betterORGANIZATIONS;
}
// Dumps every scraped organization: a "// Orgs: <count>" header line followed
// by the JSON array produced by getFormattedOrgs (which also rewrites
// ./orgs.json as a side effect).
app.get('/orgs', (req, res) => {
  if (!configured) {
    setupHeaders();
  }
  const orgRecords = getFormattedOrgs();
  const orgCount = Object.keys(orgRecords).length;
  res.end(`// Orgs: ${orgCount}\n${JSON.stringify(orgRecords)}`);
});
/**
 * Converts the USERS store into an array of plain records and writes that
 * array, as JSON, to ./users.json (asynchronously; write errors are logged).
 *
 * @returns {Array<{user: *, createdDate: *, pledgeStatus: *,
 *   organizations: Array<{orgname: string, joinDate: *, status: *}>}>}
 *   One record per user, in store order.
 */
function getFormattedUsers() {
  const betterUSERS = Object.keys(USERS).map((username) => {
    const stored = USERS[username];
    // A user stored without an organizations map yields an empty list.
    const memberships = stored.organizations
      ? Object.keys(stored.organizations).map((orgName) => ({
          orgname: orgName,
          joinDate: stored.organizations[orgName].joinDate,
          status: stored.organizations[orgName].status
        }))
      : [];
    return {
      user: stored.user,
      createdDate: stored.createdDate,
      pledgeStatus: stored.pledgeStatus,
      organizations: memberships
    };
  });

  fs.writeFile("./users.json", JSON.stringify(betterUSERS), (err) => {
    if (err) {
      writeLog(err);
    }
  });

  return betterUSERS;
}
// Dumps every scraped user: a "// Users: <count>" header line followed by the
// JSON array produced by getFormattedUsers (which also rewrites ./users.json
// as a side effect).
app.get('/users', (req, res) => {
  if (!configured) {
    setupHeaders();
  }
  const userRecords = getFormattedUsers();
  const userCount = Object.keys(userRecords).length;
  res.end(`// Users: ${userCount}\n${JSON.stringify(userRecords)}`);
});
//app.post('/sessid', (req,res) => {
//sessid = req.body.sessid;
//res.end('<a href="/scrape">Start scraping...</a><small>browser will hang</small>');
//});
// HTML view of a single user. Served from the USERS store when the user has
// already been scraped together with organizations; otherwise the profile is
// fetched on demand.
//
// All values are HTML-escaped before being written: they come from the
// request path and from scraped pages, neither of which is trusted.
app.get('/user/:user', (req, res) => {
  const escapeHtml = (value) => String(value)
    .replace(/&/g, '&amp;')
    .replace(/</g, '&lt;')
    .replace(/>/g, '&gt;')
    .replace(/"/g, '&quot;')
    .replace(/'/g, '&#39;');

  const displayUser = (user) => {
    if (user === undefined || user === null) {
      res.write('No data available for this user.<br />');
      return;
    }
    for (const key in user) {
      const value = user[key];
      if (key === 'organizations' && value !== null && typeof value === 'object') {
        // Freshly fetched profiles carry an array of names; stored users
        // carry an object keyed by organization name.
        const orgNames = Array.isArray(value) ? value : Object.keys(value);
        const liLinks = orgNames
          .map(name => `<li><a href="${escapeHtml(orgNameToURL(name))}">${escapeHtml(name)}</a></li>`)
          .join('');
        res.write(`<ul>${liLinks}</ul>`);
      } else {
        res.write(escapeHtml(key) + ': ' + escapeHtml(value) + '<br />');
      }
    }
  };

  // Own-property check so names such as "constructor" are not resolved
  // through the prototype chain.
  const isStored = Object.prototype.hasOwnProperty.call(USERS, req.params.user);
  const userInDb = isStored ? USERS[req.params.user] : undefined;

  res.write('<html>');
  if (userInDb === undefined || userInDb.organizations === undefined) {
    console.log('Sending getUserInfo request...');
    setupHeaders()
      .then(() => getUserInfo(req.params.user))
      .then(userObj => {
        writeLog('Complete!');
        displayUser(userObj);
        res.end('</html>');
      })
      .catch(err => {
        writeLog('Problem displaying user: ' + err);
        res.end('</html>');
      });
  } else {
    displayUser(userInDb);
    res.end('</html>');
  }
});
// JSON view of a single user. Served from the USERS store when the user has
// already been scraped together with organizations; otherwise the profile is
// fetched on demand.
//
// The stored record is serialized before it is sent: passing the object
// itself to res.end() throws, because a response body must be a string or a
// Buffer.
app.get('/api/user/:user', (req, res) => {
  // Own-property check so names such as "constructor" are not resolved
  // through the prototype chain.
  const isStored = Object.prototype.hasOwnProperty.call(USERS, req.params.user);
  const userInDb = isStored ? USERS[req.params.user] : undefined;

  if (userInDb === undefined || userInDb.organizations === undefined) {
    writeLog('Sending getUserInfo request...');
    setupHeaders()
      .then(() => getUserInfo(req.params.user))
      .then(userObj => {
        console.log('Complete!');
        res.end(JSON.stringify(userObj));
      })
      .catch(err => {
        writeLog('Problem getting user info: ' + err);
        res.statusCode = 500;
        res.end(JSON.stringify({ error: 'Problem getting user info.' }));
      });
  } else {
    res.end(JSON.stringify(userInDb));
  }
});
// Start the HTTP server on port 3000. Once it is listening, make sure the
// request headers have been set up and note the start in the log.
app.listen(3000, function onListening() {
  if (!configured) {
    setupHeaders();
  }
  writeLog('Listening on port 3000...');
});