75 lines
2.4 KiB
JavaScript
75 lines
2.4 KiB
JavaScript
/*
|
|
* decaffeinate suggestions:
|
|
* DS102: Remove unnecessary code created because of implicit returns
|
|
* Full docs: https://github.com/decaffeinate/decaffeinate/blob/master/docs/suggestions.md
|
|
*/
|
|
/**
|
|
Keyword analysis for HackMyResume.
|
|
@license MIT. See LICENSE.md for details.
|
|
@module inspectors/keyword-inspector
|
|
*/
|
|
|
|
/**
|
|
Analyze the resume's use of keywords.
|
|
TODO: BUG: Keyword search regex is inaccurate, especially for one or two
|
|
letter keywords like "C" or "CLI".
|
|
@class keywordInspector
|
|
*/
|
|
module.exports = {
|
|
|
|
/** A unique name for this inspector. */
|
|
moniker: 'keyword-inspector',
|
|
|
|
/**
|
|
Run the Keyword Inspector on a resume.
|
|
@method run
|
|
@return An collection of statistical keyword data.
|
|
*/
|
|
run( rez ) {
|
|
|
|
// "Quote" or safely escape a keyword so it can be used as a regex. For
|
|
// example, if the keyword is "C++", yield "C\+\+".
|
|
// http://stackoverflow.com/a/2593661/4942583
|
|
const regex_quote = str => (str + '').replace(/[.?*+^$[\]\\(){}|-]/ig, '\\$&');
|
|
|
|
// Create a searchable plain-text digest of the resume
|
|
// TODO: BUG: Don't search within keywords for other keywords. Job A
|
|
// declares the "foo" keyword. Job B declares the "foo & bar" keyword. Job
|
|
// B's mention of "foobar" should not count as a mention of "foo".
|
|
// To achieve this, remove keywords from the search digest and treat them
|
|
// separately.
|
|
let searchable = '';
|
|
rez.transformStrings(['imp', 'computed', 'safe'], ( key, val ) => searchable += ` ${val}`);
|
|
|
|
// Assemble a regex skeleton we can use to test for keywords with a bit
|
|
// more
|
|
const prefix = `(?:${['^', '\\s+', '[\\.,]+'].join('|')})`;
|
|
const suffix = `(?:${['$', '\\s+', '[\\.,]+'].join('|')})`;
|
|
|
|
return rez.keywords().map(function(kw) {
|
|
|
|
// 1. Using word boundary or other regex class is inaccurate
|
|
//
|
|
// var regex = new RegExp( '\\b' + regex_quote( kw )/* + '\\b'*/, 'ig');
|
|
//
|
|
// 2. Searching for the raw keyword is inaccurate ("C" will match any
|
|
// word containing a 'c'!).
|
|
//
|
|
// var regex = new RegExp( regex_quote( kw ), 'ig');
|
|
//
|
|
// 3. Instead, use a custom regex with special delimeters.
|
|
|
|
const regex_str = prefix + regex_quote( kw ) + suffix;
|
|
const regex = new RegExp( regex_str, 'ig');
|
|
let count = 0;
|
|
while (regex.exec( searchable ) !== null) {
|
|
count++;
|
|
}
|
|
return {
|
|
name: kw,
|
|
count
|
|
};
|
|
});
|
|
}
|
|
};
|