Permalink
Browse files

ticked 0.1.10

  • Loading branch information...
1 parent d1ec5dc commit e368c4348463f525e1e8aad21813b9e23a40be19 @chrisumbel chrisumbel committed May 26, 2012
Showing with 7 additions and 14 deletions.
  1. +6 −2 README.md
  2. +0 −11 io_spec/wordnet_spec.js
  3. +1 −1 package.json
@@ -12,7 +12,7 @@ Note that many algorithms from Rob Ellis's [node-nltools](https://github.com/Nat
being merged in to this project and will be maintained here going forward.
At the moment most algorithms are English-specific but long-term some diversity
-is in order.
+is in order. Thanks to Polyakov Vladimir, Russian stemming has been added!
Aside from this README the only documentation is [this DZone article](http://www.dzone.com/links/r/using_natural_a_nlp_module_for_nodejs.html) and [here on my blog](http://www.chrisumbel.com/article/node_js_natural_language_porter_stemmer_lancaster_bayes_naive_metaphone_soundex) which is a bit older.
@@ -103,7 +103,7 @@ Output
Stemmers
--------
-Currently stemming is supported via the Porter and Lancaster (Paice/Husk)
+Currently stemming is supported via the Porter (English and Russian) and Lancaster (Paice/Husk)
algorithms.
var natural = require('natural');
@@ -112,6 +112,10 @@ this example uses a porter stemmer. "word" is returned.
console.log(natural.PorterStemmer.stem("words")); // stem a single word
+and in Russian:
+
+ console.log(natural.PorterStemmerRu.stem("падший"));
+
attach() patches stem() and tokenizeAndStem() to String as a shortcut to
PorterStemmer.stem(token). tokenizeAndStem() breaks text up into single words
and returns an array of stemmed tokens.
View
@@ -55,17 +55,6 @@ describe('wordnet', function() {
asyncSpecWait();
});
- it('should resize buffer for large returns', function() {
- var wordnet = new WordNet('./io_spec/test_data/wordnet/download/', 'http://wordnet.naturalnode.com/');
-
- wordnet.lookupSynonyms('hot', function(records) {
- expect(records.length).toBe(53);
- asyncSpecDone();
- });
-
- asyncSpecWait();
- });
-
it('should lookup synonyms give a synset offset and a pos', function() {
var wordnet = new WordNet('./io_spec/test_data/wordnet/download/', 'http://wordnet.naturalnode.com/');
View
@@ -1,7 +1,7 @@
{
"name": "natural",
"description": "General natural language (tokenizing, stemming, classification, inflection, phonetics, tfidf, WordNet, jaro-winkler, Levenshtein distance, Dice's Coefficient) facilities for node.",
- "version": "0.1.9",
+ "version": "0.1.10",
"homepage": "https://github.com/NaturalNode/natural",
"engines": {
"node": ">=0.4.10"

0 comments on commit e368c43

Please sign in to comment.