You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nlpcraft.apache.org by ar...@apache.org on 2022/12/23 18:10:52 UTC
[incubator-nlpcraft] 01/02: WIP
This is an automated email from the ASF dual-hosted git repository.
aradzinski pushed a commit to branch NLPCRAFT-520
in repository https://gitbox.apache.org/repos/asf/incubator-nlpcraft.git
commit f3bfcbc3356498054838d7276a1aa5c7b03b89c4
Author: Aaron Radzinski <ar...@datalingvo.com>
AuthorDate: Fri Dec 23 10:10:39 2022 -0800
WIP
---
.../scala/org/apache/nlpcraft/nlp/parsers/NCNLPEntityParser.scala | 4 ++--
.../main/scala/org/apache/nlpcraft/nlp/stemmer/NCEnStemmer.scala | 2 --
.../src/main/scala/org/apache/nlpcraft/nlp/stemmer/NCStemmer.scala | 7 ++-----
3 files changed, 4 insertions(+), 9 deletions(-)
diff --git a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/parsers/NCNLPEntityParser.scala b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/parsers/NCNLPEntityParser.scala
index e5f62254..2a748616 100644
--- a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/parsers/NCNLPEntityParser.scala
+++ b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/parsers/NCNLPEntityParser.scala
@@ -25,13 +25,13 @@ import java.util.stream.Collectors
/**
* [[NCNLPEntityParser]] helper.
*/
-object NCNLPEntityParser:
+private object NCNLPEntityParser:
private val id: String = "nlp:entity"
import org.apache.nlpcraft.nlp.parsers.NCNLPEntityParser.*
/**
- * NLP data [[NCEntityParser entity parser]].
+ * NLP data [[NCEntityParser entity parser]].
*
* This parser converts list of input [[NCToken]] instances to list of [[NCEntity]] instances with ID **nlp:entity**.
* All [[NCEntity]] instances contain following mandatory [[NCPropertyMap metadata]] properties:
diff --git a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/stemmer/NCEnStemmer.scala b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/stemmer/NCEnStemmer.scala
index b794f931..81dd782a 100644
--- a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/stemmer/NCEnStemmer.scala
+++ b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/stemmer/NCEnStemmer.scala
@@ -23,8 +23,6 @@ import org.apache.nlpcraft.nlp.parsers.*
/**
* Stemmer implementation for the English language that delegates to
* [[https://opennlp.apache.org/ OpenNLP]] Porter Stemmer.
- *
- * @see More information about this stemmer algorithm can be found at [[https://tartarus.org/martin/PorterStemmer]].
*/
class NCEnStemmer extends NCStemmer:
private val stemmer = new PorterStemmer
diff --git a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/stemmer/NCStemmer.scala b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/stemmer/NCStemmer.scala
index 0009bab6..8a35f12e 100644
--- a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/stemmer/NCStemmer.scala
+++ b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/stemmer/NCStemmer.scala
@@ -21,13 +21,10 @@ import org.apache.nlpcraft.nlp.parsers.*
/**
* Trait defining a general stemmer. Stemming is the process of reducing inflected (or sometimes derived)
- * words to their word stem, base or root form—generally a written word form. Stemmer is used by some of the
- * built-in pipeline components. Stemmer is used by several built-in pipeline components.
+ * words to their word stem, base or root form—generally a written word form. Note that the stemmer is used by
+ * several built-in pipeline components.
*
* Read more about stemming at [[https://en.wikipedia.org/wiki/Stemming]].
- *
- * @see [[org.apache.nlpcraft.nlp.enrichers.NCEnStopWordsTokenEnricher]]
- * @see [[NCSemanticEntityParser]]
*/
trait NCStemmer:
/**