From da03107d96c4805a4a08574f9fd91f99d87f406c Mon Sep 17 00:00:00 2001 From: Martin Donnelly Date: Mon, 1 Jun 2020 09:25:13 +0100 Subject: [PATCH] added scraper test --- scrapers/cwjobs.js | 1 + scrapers/indeed.js | 2 ++ scrapers/totaljobs.js | 1 + test/indeed.js | 17 ++--------------- 4 files changed, 6 insertions(+), 15 deletions(-) diff --git a/scrapers/cwjobs.js b/scrapers/cwjobs.js index 41f0018..71db3e2 100644 --- a/scrapers/cwjobs.js +++ b/scrapers/cwjobs.js @@ -27,6 +27,7 @@ class CwjobsScraper extends TotaljobsScraper { // https://www.indeed.co.uk/jobs?as_and=&as_phr=&as_any=Html+Web+Sql+Delphi+Vb+Vbscript+Php+Ajax+Mysql+Sqlserver+Javascript+Nodejs+vuejs+sveltejs&as_not=React&as_ttl=&as_cmp=&jt=contract&st=&as_src=&salary=&radius=0&l=glasgow&fromage=1&limit=50&sort=&psf=advsrch&from=advancedsearch await this.processSite(); + console.log(`CWJobs ${location} completed`); } } diff --git a/scrapers/indeed.js b/scrapers/indeed.js index 4402b3e..db4513f 100644 --- a/scrapers/indeed.js +++ b/scrapers/indeed.js @@ -143,6 +143,8 @@ class IndeedScraper extends MasterScraper { // https://www.indeed.co.uk/jobs?as_and=&as_phr=&as_any=Html+Web+Sql+Delphi+Vb+Vbscript+Php+Ajax+Mysql+Sqlserver+Javascript+Nodejs+vuejs+sveltejs&as_not=React&as_ttl=&as_cmp=&jt=contract&st=&as_src=&salary=&radius=0&l=glasgow&fromage=1&limit=50&sort=&psf=advsrch&from=advancedsearch await this.processSite(); + + console.log(`Indeed ${location} completed`); } } diff --git a/scrapers/totaljobs.js b/scrapers/totaljobs.js index 2d45ba9..4ad06b0 100644 --- a/scrapers/totaljobs.js +++ b/scrapers/totaljobs.js @@ -131,6 +131,7 @@ class TotaljobsScraper extends MasterScraper { // https://www.indeed.co.uk/jobs?as_and=&as_phr=&as_any=Html+Web+Sql+Delphi+Vb+Vbscript+Php+Ajax+Mysql+Sqlserver+Javascript+Nodejs+vuejs+sveltejs&as_not=React&as_ttl=&as_cmp=&jt=contract&st=&as_src=&salary=&radius=0&l=glasgow&fromage=1&limit=50&sort=&psf=advsrch&from=advancedsearch await this.processSite(); + console.log(`TotalJobs ${location} completed`); } } diff --git a/test/indeed.js b/test/indeed.js index a478ad5..2df1b2d 100644 --- a/test/indeed.js +++ b/test/indeed.js @@ -21,7 +21,7 @@ const indeedScraper = new IndeedScraper(); const page = fs.readFileSync('data/indeed/page2.html'); test.test('Test Indeed scraper', async t => { - /*const $ = cheerio.load(page); + const $ = cheerio.load(page); indeedScraper.loadPage($); @@ -35,20 +35,7 @@ test.test('Test Indeed scraper', async t => { await indeedScraper.filterAdverts(); - // await indeedScraper.addToDB();*/ - - await indeedScraper.go('london'); - await totaljobsScraper.go('london'); - await cwjobsScraper.go('london'); - await indeedScraper.go('glasgow'); - await totaljobsScraper.go('glasgow'); - await cwjobsScraper.go('glasgow'); - await indeedScraper.go('edinburgh'); - await totaljobsScraper.go('edinburgh'); - await cwjobsScraper.go('edinburgh'); - await indeedScraper.go('milton keynes'); - await totaljobsScraper.go('milton keynes'); - await cwjobsScraper.go('milton keynes'); + // await indeedScraper.addToDB(); t.end(); });