Rinser/gather.js

174 lines
4.2 KiB
JavaScript
Raw Normal View History

2018-06-14 08:07:51 +00:00
const RssBraider = require('rss-braider');
const fs = require('fs');
const ejs = require(
'ejs');
const read = require('fs').readFileSync;
const join = require('path').join;
const cron = require('node-cron');
2018-06-18 23:10:50 +00:00
const util = require('util')
const fs_writeFile = util.promisify(fs.writeFile)
2018-06-14 08:07:51 +00:00
const str = read(
join(__dirname, '/templates/rss.ejs'),
'utf8');
const feeds = {};
const log4js = require('log4js');
const logger = log4js.getLogger();
logger.level = 'trace';
// Pull feeds from config files: ,
// feeds.simple_test_feed = require("./config/feed").feed;
// Or define in-line
feeds.news = require('./feeds/news.json');
feeds.jobsSpecial = require('./feeds/jobs-special.json');
feeds.jobsLocal = require('./feeds/jobs-local.json');
feeds.lifestyle = require('./feeds/lifestyle.json');
feeds.paleo = require('./feeds/paleo.json');
feeds.tech = require('./feeds/tech.json');
feeds.fit = require('./feeds/fit.json');
2018-06-18 22:01:32 +00:00
feeds.bored = require('./feeds/bored.json');
2018-06-14 08:07:51 +00:00
const braider_options = {
feeds: feeds,
indent: ' ',
date_sort_order: 'desc', // Newest first
log_level: 'warn',
dedupe_fields: ['link', 'guid'],
plugins_directories: [__dirname + '/plugins/']
};
const rss_braider = RssBraider.createClient(braider_options);
// Override logging level (debug, info, warn, err, off)
//rss_braider.logger.level('off');
2018-06-18 22:30:26 +00:00
function gatherV2(feedName, fileName, mode) {
return new Promise((resolve, reject) => {
2018-06-18 23:10:50 +00:00
const modeSuffix = {'rss': '.xml', 'json': '.json'};
logger.info(`Gathering ${feedName} as ${modeSuffix[mode]}...`);
rss_braider.processFeed(feedName, mode, (err, data) => {
if (err) {
logger.error(err);
return reject(err);
}
2018-06-18 22:30:26 +00:00
2018-06-18 23:10:50 +00:00
fs_writeFile(`${__dirname}/dist/${fileName}${modeSuffix[mode]}`, data).then(function(){
return resolve(`${feedName} saved`);
});
});
2018-06-18 22:30:26 +00:00
});
}
2018-06-14 08:07:51 +00:00
async function gather(feedName, fileName) {
logger.info(`Gathering ${feedName}...`);
rss_braider.processFeed(feedName, 'json', function (err, data) {
console.log('A');
if (err) {
logger.error(err);
return err;
}
console.log('B');
const j = JSON.parse(data);
console.log('C');
const ejsOutput = ejs.compile(str)(j);
console.log('D');
fs.writeFile(__dirname + '/dist/' + fileName + '.html',
ejsOutput,
function (err) {
if (err) {
logger.error(err);
return console.error(err);
}
console.log('The file was saved!');
});
fs.writeFile(__dirname + '/dist/' + fileName + '.json',
data,
function (err) {
if (err) {
logger.error(err);
return console.error(err);
}
console.log('The file was saved!');
});
});
}
async function gatherXML(feedName, fileName) {
2018-06-18 22:30:26 +00:00
rss_braider.processFeed(feedName, 'rss', function (err, data) {
2018-06-14 08:07:51 +00:00
if (err) {
return console.log(err);
}
2018-06-18 22:30:26 +00:00
console.log('Saving', __dirname + '/dist/' + fileName + '.xml');
fs.writeFile(__dirname + '/dist/' + fileName + '.xml', data, function (err) {
2018-06-14 08:07:51 +00:00
if (err) {
return console.log(err);
}
2018-06-18 22:30:26 +00:00
console.log('The file was saved!');
2018-06-14 08:07:51 +00:00
});
});
}
async function main() {
2018-06-18 22:30:26 +00:00
await gatherV2('jobsSpecial', 'jobs-special', 'rss').then((d) => {
2018-06-18 23:10:50 +00:00
logger.debug(d);
2018-06-18 22:30:26 +00:00
}).catch((e) => {
logger.error(e);
});
await gatherV2('news', 'news', 'json').then((d) => {
logger.info(d);
}).catch((e) => {
logger.error(e);
});
await gatherV2('lifestyle', 'lifestyle', 'json').then((d) => {
logger.info(d);
}).catch((e) => {
logger.error(e);
});
await gatherV2('paleo', 'paleo', 'json').then((d) => {
logger.info(d);
}).catch((e) => {
logger.error(e);
});
await gatherV2('tech', 'tech', 'json').then((d) => {
logger.info(d);
}).catch((e) => {
logger.error(e);
});
await gatherV2('fit', 'fit', 'json').then((d) => {
logger.info(d);
}).catch((e) => {
logger.error(e);
});
await gatherV2('bored', 'bored', 'json').then((d) => {
logger.info(d);
}).catch((e) => {
logger.error(e);
2018-06-18 22:01:32 +00:00
});
2018-06-18 22:30:26 +00:00
// await gatherXML('jobsLocal','jobs-local');
2018-06-14 08:07:51 +00:00
}
2018-06-18 22:01:32 +00:00
cron.schedule('3 * * * *', function () {
2018-06-14 08:07:51 +00:00
main();
return -1;
});
2018-06-18 22:13:29 +00:00
2018-06-18 23:10:50 +00:00
// main();