// awesome-docker/buildMetadata.js
const fs = require('fs');
const { promisify } = require('util');
const fetch = require('node-fetch');
const dayjs = require('dayjs');
require('draftlog').into(console);
// Logs promise rejections that no handler caught.
// A rejection reason can be any value (a string, `undefined`, ...), not only
// an Error, so `.message` is read only when the reason actually carries one;
// otherwise the raw reason is logged.
process.on('unhandledRejection', error => {
  const hasMessage = error != null && error.message !== undefined;
  console.log('unhandledRejection', hasMessage ? error.message : error);
});
// Every GitHub request made by this script sends the token, so stop right
// away when the TOKEN environment variable is unset or empty.
if (process.env.TOKEN === undefined || process.env.TOKEN === '') {
  throw new Error('no github token found');
}
// --- ENV VAR ---
/**
 * Reads an integer setting from the environment.
 *
 * @param {string} name - Environment variable to read.
 * @param {number} fallback - Value used when the variable is unset, is not a
 *   number, or is smaller than `min`.
 * @param {number} min - Smallest accepted value.
 * @returns {number} The parsed value, or `fallback`.
 */
const envInt = (name, fallback, min) => {
  const parsed = Number.parseInt(process.env[name], 10);
  return Number.isNaN(parsed) || parsed < min ? fallback : parsed;
};
// Number of repositories requested in parallel. Must be at least 1: the batch
// loop advances by this amount, so zero or a negative value would never finish.
const BATCH_SIZE = envInt('BATCH_SIZE', 10, 1);
// Pause between two batches, in milliseconds. 0 is accepted and disables it.
const DELAY = envInt('DELAY', 3000, 0);
// --- FILENAME ---
// Markdown file that is scanned for GitHub repository links.
const README = 'README.md';
// Output file for the metadata fetched by this run. The name embeds the time
// at which the script started, with dots between hours, minutes and seconds.
const GITHUB_METADATA_FILE = `data/${dayjs().format(
  'YYYY-MM-DDTHH.mm.ss',
)}-fetched_repo_data.json`;
// Pointer file: its content is the path of the most recent metadata file.
const LATEST_FILENAME = 'data/latest';
// Output file listing every repository URL found in the README.
const GITHUB_REPOS = 'data/list_repos.json';
// --- HTTP ---
// Base URL of the GitHub API. Request paths are appended to it directly, so
// the trailing slash is required.
const API = 'https://api.github.com/';
// Default fetch settings. `get` spreads these into every request and lets its
// own `opt` argument override them.
const options = {
method: 'GET',
headers: {
'User-Agent': 'awesome-docker script listing',
'Content-Type': 'application/json',
// Token read from the TOKEN environment variable.
Authorization: `token ${process.env.TOKEN}`,
},
};
/**
 * Turns a repository URL into its `owner/repo` path by cutting off as many
 * leading characters as `https://github.com/` is long.
 * The prefix itself is not checked.
 *
 * @param {string} x - Repository URL.
 * @returns {string} Everything after the host prefix.
 */
const removeHost = x => {
  const hostPrefix = 'https://github.com/';
  return x.slice(hostPrefix.length);
};
// Promise-returning versions of the callback-style fs functions, so they can
// be awaited. The wrapper supplies the callback itself; callers pass only the
// regular arguments.
const readFile = promisify(fs.readFile);
const writeFile = promisify(fs.writeFile);
/**
 * Prints an error to stderr with a marker in front of it.
 * Falsy values are not printed and are handed back unchanged, which makes the
 * function usable as a Node-style callback (`null` means "no error").
 *
 * @param {*} err - Error to report, or a falsy value for "nothing to report".
 * @returns {*} The falsy input, or the result of `console.error`.
 */
const printError = err => {
  if (!err) return err;
  return console.error('❌ ERROR', err);
};
// Console line used for the progress bar. `console.draft` is not a built-in;
// it is presumably added by the require('draftlog').into(console) call above.
// ProgressBar later calls barLine(text) with the bar to display.
const barLine = console.draft('Starting batch...');
/**
 * Waits for a given time.
 *
 * @param {number} ms - Time to wait, in milliseconds.
 * @returns {Promise<undefined>} Resolves, without a value, once the timer fires.
 */
const delay = ms => new Promise(done => setTimeout(done, ms));
/**
 * Requests `repos/<path>` from the GitHub API and parses the JSON answer.
 *
 * The returned promise never rejects: a transport failure or a non-2xx status
 * is reported once through `printError`, and the promise then resolves to
 * whatever `printError` returns.
 *
 * @param {string} path - Repository path in `owner/repo` form.
 * @param {object} [opt] - Extra fetch options; they override the defaults.
 * @returns {Promise<object|undefined>} Parsed response body, or `undefined`
 *   when the request failed.
 */
const get = (path, opt) =>
  fetch(`${API}repos/${path}`, {
    ...options,
    ...opt,
  })
    .then(response => {
      if (response.ok) return response.json();
      throw new Error(
        `Network response was not ok. (${response.status} ${path})`,
      );
    })
    // One handler for both failure kinds. Catching before the `.then` would
    // hand it `undefined` and cause a second, misleading TypeError report.
    .catch(printError);
/**
 * Starts one `get` request per path, all at once, and waits for every one.
 *
 * @param {string[]} batch - Repository paths to request.
 * @returns {Promise<Array>} Results in the same order as `batch`.
 */
const fetchAll = batch => {
  const pending = batch.map(async repoPath => get(repoPath));
  return Promise.all(pending);
};
/**
 * Collects the GitHub repository URLs mentioned in a markdown text.
 * Only the `https://github.com/<owner>/<repo>` part of a link is kept, and
 * each URL is returned once, in order of first appearance.
 *
 * @param {string} markdown - Text to scan.
 * @returns {string[]} Distinct repository URLs; empty when there are none.
 */
const extractAllRepos = markdown => {
  const repoUrlPattern = /https:\/\/github\.com\/([a-zA-Z0-9-._]+)\/([a-zA-Z0-9-._]+)/g;
  const urls = markdown.match(repoUrlPattern);
  if (urls === null) return [];
  return Array.from(new Set(urls));
};
/**
 * Redraws the progress line as a 50-character bar, a percentage and a counter.
 *
 * @param {number} i - Number of items handled so far; shown after the `#`.
 * @param {number} batchSize - Unused; kept so existing calls stay valid.
 * @param {number} total - Number of items to handle overall.
 * @returns {*} Whatever `barLine` returns.
 */
const ProgressBar = (i, batchSize, total) => {
  const BAR_WIDTH = 50;
  // With nothing to do the job counts as finished; this also avoids the
  // division by zero that used to print "NaN%". The ratio is clamped because
  // String.prototype.repeat throws on a negative count when i exceeds total.
  const ratio = total > 0 ? Math.min(Math.max(i / total, 0), 1) : 1;
  const progress = Math.round(ratio * 100);
  const units = Math.round(progress / 2);
  return barLine(
    `[${'='.repeat(units)}${' '.repeat(BAR_WIDTH - units)}] ${progress}% - # ${i}`,
  );
};
/**
 * Fetches the metadata of every repository, BATCH_SIZE repositories at a time.
 *
 * Batches run one after another with a pause of DELAY milliseconds between
 * them; the requests inside one batch run in parallel.
 *
 * @param {string[]} githubRepos - Repository URLs.
 * @returns {Promise<Array>} One entry per URL, in input order, holding
 *   whatever `fetchAll` resolved for it.
 */
async function batchFetchRepoMetadata(githubRepos) {
  const repos = githubRepos.map(url => removeHost(url));
  const metadata = [];
  /* eslint-disable no-await-in-loop */
  for (let i = 0; i < repos.length; i += BATCH_SIZE) {
    const batch = repos.slice(i, i + BATCH_SIZE);
    if (process.env.DEBUG) console.log({ batch });
    const res = await fetchAll(batch);
    metadata.push(...res);
    // Report what is finished, not where the batch started.
    const done = Math.min(i + BATCH_SIZE, repos.length);
    ProgressBar(done, BATCH_SIZE, repos.length);
    // poor man's rate limiting so GitHub doesn't ban us; no request follows
    // the last batch, so there is nothing to wait for after it
    if (done < repos.length) await delay(DELAY);
  }
  /* eslint-enable no-await-in-loop */
  // Also draws the bar when the list was empty and the loop never ran.
  ProgressBar(repos.length, BATCH_SIZE, repos.length);
  return metadata;
}
/**
 * Runs the whole job:
 *   1. reads the README and extracts the GitHub repository URLs,
 *   2. saves that list to GITHUB_REPOS,
 *   3. fetches the metadata of every repository,
 *   4. saves the metadata to GITHUB_METADATA_FILE,
 *   5. records that file's path in LATEST_FILENAME.
 *
 * Any failure stops the remaining steps and is reported through `printError`;
 * the returned promise itself does not reject for those failures.
 *
 * @returns {Promise<void>}
 */
async function main() {
  try {
    const markdown = await readFile(README, { encoding: 'utf8' });
    const githubRepos = extractAllRepos(markdown);
    // `writeFile` is the promisified version: its optional third argument is
    // `options`, not a callback. Failures surface as rejections and are
    // handled by the catch below.
    await writeFile(GITHUB_REPOS, JSON.stringify(githubRepos, null, 2));

    const metadata = await batchFetchRepoMetadata(githubRepos);

    await writeFile(GITHUB_METADATA_FILE, JSON.stringify(metadata, null, 2));
    console.log('✅ metadata saved');

    // save the latest; awaited so a failure here reaches the catch below and
    // main() only settles once the pointer file has been written
    await writeFile(LATEST_FILENAME, GITHUB_METADATA_FILE);
  } catch (err) {
    printError(err);
  }
}
// Script entry point. main() catches its own failures and reports them with
// printError, so the returned promise is not awaited here.
main();