const Slimbot = require('slimbot'); const config = require('./config.json'); const bot = new Slimbot(config.TELEGRAM_API_KEY); bot.startPolling(); function logMessageToAdmin(message, type='Error') { bot.sendMessage(config.ADMIN_USER, `<b>${type}</b>\n<code>${message}</code>`, { parse_mode: 'HTML' }); } function postVacancy(message) { bot.sendMessage(config.TARGET_CHANNEL, message, { parse_mode: 'HTML', disable_web_page_preview: true, disable_notification: true }); } module.exports = { postVacancy, logMessageToAdmin };
const feed = require("feed-read"); const config = require('./config.json'); const HhAdapter = require('./adapters/hh'); const MoikrugAdapter = require('./adapters/moikrug'); const bot = require('./bot'); const { FeedItemModel } = require('./lib/models'); function processFeed(articles, adapter) { articles.forEach(article => { if (adapter.isValid((article))) { const key = adapter.getKey(article); new FeedItemModel({ key, data: article }).save().then( model => adapter.parseItem(article).then(bot.postVacancy), () => {} ); } }); } setInterval(() => { feed(config.HH_FEED, function (err, articles) { if (err) { bot.logMessageToAdmin(err); return; } processFeed(articles, HhAdapter); }); feed(config.MOIKRUG_FEED, function (err, articles) { if (err) { bot.logMessageToAdmin(err); return; } processFeed(articles, MoikrugAdapter); }); }, config.REQUEST_PERIOD_TIME);
const request = require('superagent'); const jsdom = require('jsdom'); const { JSDOM } = jsdom; const { getTags } = require('../lib/tagger'); const { getJobType } = require('../lib/jobType'); const { render } = require('../lib/render'); function parseItem(item) { return new Promise((resolve, reject) => { request .get(item.link) .end(function(err, res) { if(err) { console.log(err); reject(err); return; } const dom = new JSDOM(res.text); const element = dom.window.document.querySelector(".vacancy_description"); const salaryElem = dom.window.document.querySelector(".footer_meta .salary"); const salary = salaryElem ? salaryElem.textContent : ' .'; const locationElem = dom.window.document.querySelector(".footer_meta .location"); const location = locationElem && locationElem.textContent; const title = dom.window.document.querySelector(".company_name").textContent; const titleFooter = dom.window.document.querySelector(".footer_meta").textContent; const pureContent = element.textContent; resolve(render({ tags: getTags(pureContent), salary: `: ${salary}`, location, title, link: item.link, description: element.innerHTML, jobType: getJobType(titleFooter), important: Array.from(element.querySelectorAll('strong')).map(e => e.textContent) })) }); }); } function getKey(item) { return item.link; } function isValid() { return true } module.exports = { getKey, isValid, parseItem };
const request = require('superagent'); const jsdom = require('jsdom'); const { JSDOM } = jsdom; const { getTags } = require('../lib/tagger'); const { getJobType } = require('../lib/jobType'); const { render } = require('../lib/render'); function parseItem(item) { const splited = item.content.split(/\n<p>|<\/p><p>|<\/p>\n/).filter(i => i); const [ title, date, region, salary ] = splited; return new Promise((resolve, reject) => { request .get(item.link) .end(function(err, res) { if(err) { console.log(err); reject(err); return; } const dom = new JSDOM(res.text); const element = dom.window.document.querySelector('.b-vacancy-desc-wrapper'); const title = dom.window.document.querySelector('.companyname').textContent; const pureContent = element.textContent; const tags = getTags(pureContent); resolve(render({ title, location: region.split(': ')[1] || region, salary: `: ${salary.split(': ')[1] || salary}`, tags, description: element.innerHTML, link: item.link, jobType: getJobType(pureContent), important: Array.from(element.querySelectorAll('strong')).map(e => e.textContent) })) }); }); } function getKey(item) { return item.link; } function isValid() { return true } module.exports = { getKey, isValid, parseItem };
li
in lists, you have to cheat a little: const htmlToText = require('html-to-text'); const whiteSpaceRegex = /^\s*$/; function render({ title, location, salary, tags, description, link, important = [], jobType='' }) { let formattedDescription = htmlToText .fromString(description, { wordwrap: null, noLinkBrackets: true, hideLinkHrefIfSameAsText: true, format: { unorderedList: function formatUnorderedList(elem, fn, options) { let result = ''; const nonWhiteSpaceChildren = (elem.children || []).filter( c => c.type !== 'text' || !whiteSpaceRegex.test(c.data) ); nonWhiteSpaceChildren.forEach(function(elem) { result += ' <b>β</b> ' + fn(elem.children, options) + '\n'; }); return '\n' + result + '\n'; } } }) .replace(/\n\s*\n/g, '\n'); important.filter(text => text.includes(':')).forEach(text => { formattedDescription = formattedDescription.replace( new RegExp(text, 'g'), `<b>${text}</b>` ) }); const formattedTags = tags.map(t => '#' + t).join(' '); const locationFormatted = location ? `#${location.replace(/ |-/g, '_')} `: ''; return `<b>${title}</b>\n${locationFormatted}#${jobType}\n<b>${salary}</b>\n${formattedTags}\n${formattedDescription}\n${link}`; } module.exports = { render };
const Az = require('az'); const namesMap = require('../resources/tagNames.json'); function onlyUnique(value, index, self) { return self.indexOf(value) === index; } function getTags(pureContent) { const tokens = Az.Tokens(pureContent).done(); const tags = tokens.filter(t => t.type.toString() === 'WORD') .map(t => t.toString().toLowerCase().replace('-', '_')) .map(name => namesMap[name]) .filter(t => t) .filter(onlyUnique); return tags; } module.exports = { getTags };
{ "js": "JS", "javascript": "JS", "sql": "SQL", "": "Angular", "angular": "Angular", "angularjs": "Angular", "react": "React", "reactjs": "React", "": "React", "node": "NodeJS", "nodejs": "NodeJS", "linux": "Linux", "ubuntu": "Ubuntu", "unix": "UNIX", "windows": "Windows" .... }
#!/usr/bin/env bash # rs - rsync ./ rs:/var/www/js_jobs_bot --delete -r --exclude=node_modules ssh rs " . ~/.nvm/nvm.sh cd /var/www/js_jobs_bot/ mv prod-config.json config.json npm i && pm2 restart processes.json "
Source: https://habr.com/ru/post/337940/
All Articles