From 9a70ea47c7573d07e276b66d412768e11106a369 Mon Sep 17 00:00:00 2001 From: Martin Donnelly Date: Wed, 31 May 2017 16:39:06 +0100 Subject: [PATCH] does xml now too --- jobs-corpus.js | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/jobs-corpus.js b/jobs-corpus.js index a4716d6..17a7b02 100644 --- a/jobs-corpus.js +++ b/jobs-corpus.js @@ -287,11 +287,13 @@ function processJson(j) { for (let item of j.items) { console.log(item.title); let description = striptags(item.description); + + description = description.replace(/( )/ig, ' '); let stripped = getNoneStopWords(description); //console.log(stripped); let score = scoreEntry(stripped); console.log(`Score ${score}`); - item.description = `
Score ${score}
` + item.description; + item.description = `
Score ${score}
` + description; } return j;