Compare commits

...

4 Commits

Author SHA1 Message Date
moos 51c412e82e fix tests 2020-12-08 20:01:29 -08:00
moos 280bf22ad8 Merge branch 'master' of https://github.com/moos/wordpos 2020-12-08 19:42:29 -08:00
moos e331746994 Fix #41 2020-12-08 19:41:34 -08:00
Moos 6db40c8fa6
Fix link to WordNet lexNames docs. 2020-10-21 19:40:14 -07:00
8 changed files with 184 additions and 9 deletions

View File

@ -1,5 +1,10 @@
**2.0.0**
2.1.0
- Fix CLI script when used without specific POS (#41)
- :boom: Stopwords are now case-insensitive, i.e., "The", "And", "Him", etc. are all filtered out.
2.0.0
- Support for running wordpos in the **browser** (no breaking change for node environment)
- Dropped support for node 4.x.

View File

@ -206,7 +206,7 @@ wordpos.lookupAdjective('awesome', console.log);
```
In this case only one lookup was found, but there could be several.
Version 1.1 adds the `lexName` parameter, which maps the lexFilenum to one of [45 lexicographer domains](https://wordnet.princeton.edu/wordnet/man/lexnames.5WN.html).
Version 1.1 adds the `lexName` parameter, which maps the lexFilenum to one of [45 lexicographer domains](https://wordnet.princeton.edu/documentation/lexnames5wn).
#### seek(offset, pos, callback)

View File

@ -269,4 +269,3 @@ function sprint(results) {
},'');
}
}

View File

@ -1,6 +1,6 @@
{
"name": "wordpos",
"version": "2.0.0",
"version": "2.1.0",
"description": "wordpos is a set of part-of-speech utilities for Node.js & browser using the WordNet database.",
"author": "Moos <mooster@42at.com>",
"keywords": [

View File

@ -160,12 +160,12 @@ function get(isFn) {
words = this.parse(text),
results = [],
self = this,
first = words.shift();
first = words[0];
// test one first & check for error, otherwise
// map is inoccuous to errors!
return exec(first)
.then(() => Promise.all(words.map(exec)))
.then(() => Promise.all(words.slice(1).map(exec)))
.then(done)
.catch(err => {
// done(); // callback signature is same! // FIXME
@ -224,13 +224,13 @@ function getPOS(text, callback) {
var args = [data];
var matches = uniq(flat(Object.values(data)));
data.rest = diff(words, matches);
profile && args.push(new Date() - start);
nextTick(callback, args);
return data;
}
function error(err) {
console.log('Error >>> ', err);
nextTick(callback, []);
throw err;
}

View File

@ -33,7 +33,7 @@ function normalize(word) {
}
function isStopword(stopwordsStr, word) {
return stopwordsStr.indexOf(' '+word+' ') >= 0;
return stopwordsStr.indexOf(' '+ word.toLowerCase() +' ') >= 0;
}
function tokenizer(str) {

171
test/cli_test.js Normal file
View File

@ -0,0 +1,171 @@
/**
* cli_test.js
*
* Test CLI script
*
* Copyright (c) 2012-2020 mooster@42at.com
* https://github.com/moos/wordpos
*
* Released under MIT license
*/
var
chai = require('chai'),
assert = chai.assert,
exec = require('child_process').exec,
testStr = 'The angry bear chased the frightened little squirrel',
cmd = 'node ' + __dirname + '/../bin/wordpos-cli ',
gDone;
// compare two list of words independent of word order
function cmp(act, exp) {
assert.equal(act.trim().split(' ').sort().join(), exp.split(' ').sort().join());
}
describe('CLI tests', function() {
this.slow(300);
describe('Test CLI get', function() {
it('should get nouns', done => {
exec(cmd + '-n -b get ' + testStr, (error, stdout) => {
assert.isNull(error);
cmp(stdout, 'bear chased squirrel little');
done();
});
});
it('should get adjectives', done => {
exec(cmd + '-a -b get ' + testStr, (error, stdout) => {
assert.isNull(error);
cmp(stdout, 'angry frightened little');
done();
});
});
it('should get verbs', done => {
exec(cmd + '-v -b get ' + testStr, (error, stdout) => {
assert.isNull(error);
cmp(stdout, 'bear');
done();
});
});
it('should get adverbs', done => {
exec(cmd + '-r -b get ' + testStr, (error, stdout) => {
assert.isNull(error);
cmp(stdout, 'little');
done();
});
});
it('should get POS', done => {
exec(cmd + '-b get ' + testStr, (error, stdout, stderr) => {
assert.isNull(error);
cmp(stdout, 'bear chased squirrel little \n' +
'angry frightened little \n' +
'bear \n' +
'little');
done();
});
});
it('should get POS (single word)', done => {
exec(cmd + '-b get angry', (error, stdout, stderr) => {
assert.isNull(error);
assert.equal(stdout.trim(), 'angry');
done();
});
});
it('should get counts', done => {
exec(cmd + '-b -c get ' + testStr, (error, stdout, stderr) => {
assert.isNull(error);
assert.equal(stdout.trim(), '4 3 1 1 6');
done();
});
});
});
describe('Test CLI def', function() {
it('should define word', done => {
exec(cmd + 'def angry', (error, stdout) => {
assert.isNull(error);
assert(stdout.trim().startsWith('angry (def)\n a: feeling or showing anger;'));
done();
});
});
});
describe('Test CLI syn', function() {
it('should get synonyms', done => {
exec(cmd + 'syn angry', (error, stdout) => {
assert.isNull(error);
assert(stdout.trim().startsWith('angry (syn)\n a: angry'));
done();
});
});
});
describe('Test CLI exp', function() {
it('should get exmpale', done => {
exec(cmd + 'exp angry', (error, stdout) => {
assert.isNull(error);
assert(stdout.trim().startsWith('angry (exp)\n a: "angry at the weather"'));
done();
});
});
});
describe('Test CLI seek', function() {
it('should seek by offset', done => {
exec(cmd + '-a seek 00114629', (error, stdout) => {
assert.isNull(error);
assert(/lemma/.test(stdout), 'found lemma');
assert(/angry/.test(stdout), 'found angry');
done();
});
});
});
describe('Test CLI rand', function() {
it('should get a random word', done => {
exec(cmd + 'rand', (error, stdout) => {
assert.isNull(error);
assert(stdout.length > 1, 'got answer')
done();
});
});
it('should get a random word starting with...', done => {
exec(cmd + '-b rand angr', (error, stdout) => {
assert.isNull(error);
assert.equal(stdout.substr(0,4), 'angr');
done();
});
});
});
describe('Test CLI parse', function() {
it('should parse input', done => {
exec(cmd + '-b parse ' + testStr, (error, stdout) => {
assert.isNull(error);
assert.equal(stdout.trim(), 'angry bear chased frightened little squirrel');
done();
});
});
});
describe('Test CLI stopwords', function() {
let WordPOS = require('../src/wordpos');
it('should list stopwords', done => {
exec(cmd + '-j stopwords ' + testStr, (error, stdout) => {
assert.isNull(error);
assert.equal(stdout.trim(), JSON.stringify(WordPOS.stopwords));
done();
});
});
});
});

View File

@ -56,7 +56,7 @@ var str = "The angry bear chased the frightened little squirrel",
verbs: [ 'bear' ],
adjectives: [ 'little', 'angry', 'frightened' ],
adverbs: [ 'little' ],
rest: [ 'The' ]
rest: []
},
garble = 'garblegarble', // expect not to find word
offset = 1285602;