bigly-caret/site.js

148 lines
3.8 KiB
JavaScript
Raw Normal View History

2025-01-30 07:59:30 -05:00
2025-01-30 21:00:26 -05:00
import { writeFile, readFile } from "fs/promises";
2025-01-30 07:59:30 -05:00
import { rankCalc } from "./rank.js";
2025-01-30 08:20:17 -05:00
let cache = {};
2025-01-30 08:42:27 -05:00
let site = process.env.site || 'darflen';
2025-01-31 17:39:47 -05:00
let route = process.env.route || './test.txt';
2025-01-31 17:58:09 -05:00
let pageLimit = process.env.pageLimit || Infinity;
2025-01-30 21:00:26 -05:00
let hh;
async function textCollector(word, path, file) {
2025-01-31 17:39:47 -05:00
if (!hh) hh = await readFile(file, 'utf8');
2025-01-30 21:00:26 -05:00
hh = hh.toLowerCase();
2025-01-31 17:39:47 -05:00
let words = hh.split(/[\n.]+/g).filter(x => word.length == 0 || ` ${x} `.includes(` ${word} `));
2025-01-30 21:00:26 -05:00
words = words.join(' ').split(/[^a-zA-Z0-9']+/g);
words = [...new Set(words)];
return words;
}
2025-01-30 07:59:30 -05:00
2025-01-31 18:05:21 -05:00
async function siteCollector(user, path, site, useLimit) {
2025-01-30 08:20:17 -05:00
let users = [];
2025-01-30 08:34:59 -05:00
let i = 1;
2025-01-30 20:17:43 -05:00
let out = [];
2025-01-30 21:00:26 -05:00
2025-01-31 17:39:47 -05:00
if (site == 'file') {
return await textCollector(user, path, route);
2025-01-30 21:00:26 -05:00
}
2025-01-30 07:59:30 -05:00
while (true) {
2025-01-30 08:42:27 -05:00
let p;
if (site == 'darflen') {
p = `https://api.darflen.com/users/${user}/${path}/${i}`;
} else if (site == 'scratch') {
2025-01-30 09:37:33 -05:00
p = `https://api.scratch.mit.edu/users/${user}/${path}/?limit=40&offset=${i * 40}`;
2025-01-30 08:42:27 -05:00
} else {
throw 'That site is not supported.';
}
2025-01-30 08:34:59 -05:00
let j1 = cache[p];
2025-01-30 08:20:17 -05:00
if (!j1) {
let h1 = await fetch(p);
2025-01-30 08:42:27 -05:00
try {
j1 = await h1.json();
2025-01-30 12:40:55 -05:00
} catch (err) {
2025-01-30 08:42:27 -05:00
j1 = [];
}
2025-01-30 08:20:17 -05:00
}
cache[p] = j1;
2025-01-30 07:59:30 -05:00
2025-01-31 18:05:21 -05:00
if (!j1.map || (i > pageLimit && useLimit)) break;
2025-01-31 17:56:05 -05:00
2025-01-30 08:42:27 -05:00
let users2;
if (site == 'darflen') {
users2 = j1[path].map(x => x.profile.username);
} else if (site == 'scratch') {
users2 = j1.map(x => x.username);
}
2025-01-30 07:59:30 -05:00
2025-01-30 20:17:43 -05:00
users.push(users2);
2025-01-30 07:59:30 -05:00
if (users2.length == 0) break;
i++;
2025-01-30 08:20:17 -05:00
console.log(`User ${user} has ${i} pages calculated`);
2025-01-30 07:59:30 -05:00
}
2025-01-30 20:17:43 -05:00
out = out.concat(...users);
return out;
2025-01-30 08:20:17 -05:00
}
(async function () {
2025-01-30 12:40:55 -05:00
let penv = process.env.user || 'paradock';
2025-01-31 17:42:18 -05:00
penv = penv.split(',');
2025-01-30 12:40:55 -05:00
2025-01-31 18:11:28 -05:00
let users = [...penv];
2025-01-31 18:05:21 -05:00
let legal = [];
2025-01-31 18:11:07 -05:00
let depth = process.env.depth || 1;
for (let i = 0; i < depth; i++) {
2025-01-31 18:12:03 -05:00
let b = [...users];
for (let u of b) {
2025-01-31 18:11:07 -05:00
let ca = await siteCollector(u, 'followers', site);
users = users.concat(ca);
legal = legal.concat(ca);
users = users.concat(await siteCollector(u, 'following', site));
}
users = [...new Set(users)];
2025-01-30 12:40:55 -05:00
}
2025-01-30 08:20:17 -05:00
2025-01-30 07:59:30 -05:00
let data = {};
let p = [];
2025-01-30 09:37:33 -05:00
let congested = [];
2025-01-30 07:59:30 -05:00
for (let u of users) {
2025-01-31 18:05:21 -05:00
let inLegal = legal.indexOf(u) != -1;
2025-01-30 09:37:33 -05:00
let it = 0;
2025-01-30 09:42:04 -05:00
while (p.length >= (process.env.maxRate || 15)) {
2025-01-30 09:37:33 -05:00
p = p.filter(x => x != 'hi');
2025-01-30 09:40:21 -05:00
if (p.length == 0) break;
2025-01-30 09:37:33 -05:00
let pv = await Promise.any(p);
it++;
if (it > 10) {
console.warn(`Promises got congested. Moving to another array...`)
congested = congested.concat(p);
p = [];
break;
}
2025-01-30 07:59:30 -05:00
}
2025-01-31 17:39:47 -05:00
data[u] = { followers: [], following: [] };
2025-01-30 20:17:43 -05:00
p.push(async function (k) {
2025-01-31 18:05:21 -05:00
let j1 = await siteCollector(u, 'followers', site,inLegal);
2025-01-30 07:59:30 -05:00
2025-01-30 20:17:43 -05:00
data[u].followers = j1;
console.log(`User ${u} followers fully calculated`);
2025-01-30 07:59:30 -05:00
2025-01-30 20:17:43 -05:00
p[k] = 'hi';
}(p.length));
p.push(async function (k) {
2025-01-31 18:05:21 -05:00
let j1 = await siteCollector(u, 'following', site,inLegal);
2025-01-30 20:17:43 -05:00
data[u].following = j1;
console.log(`User ${u} following fully calculated`);
2025-01-30 12:40:55 -05:00
2025-01-30 20:17:43 -05:00
p[k] = 'hi';
}(p.length));
2025-01-30 07:59:30 -05:00
}
2025-01-30 09:37:33 -05:00
p = p.concat(congested);
2025-01-30 07:59:30 -05:00
await Promise.all(p);
2025-01-31 17:42:18 -05:00
let dat = Object.entries(rankCalc(data, 100, penv));
2025-01-30 07:59:30 -05:00
dat = dat.sort((a, b) => a[1] - b[1]);
let dat2 = {};
for (let d of dat) {
dat2[d[0]] = d[1] * 100 + "%";
}
let srz = JSON.stringify(dat2);
await writeFile(`./users.json`, srz, 'utf8');
})()