You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nlpcraft.apache.org by se...@apache.org on 2022/02/25 15:55:00 UTC
[incubator-nlpcraft] branch NLPCRAFT-483 updated: EN adapters added.
This is an automated email from the ASF dual-hosted git repository.
sergeykamov pushed a commit to branch NLPCRAFT-483
in repository https://gitbox.apache.org/repos/asf/incubator-nlpcraft.git
The following commit(s) were added to refs/heads/NLPCRAFT-483 by this push:
new 315ec01 EN adapters added.
315ec01 is described below
commit 315ec01534224b54b7ad5bf2cc9fa40b845b82b2
Author: Sergey Kamov <sk...@gmail.com>
AuthorDate: Fri Feb 25 18:54:51 2022 +0300
EN adapters added.
---
.../org/apache/nlpcraft/nlp/NCENDefaultPipeline.java | 20 ++++++++++----------
.../nlpcraft/nlp/NCENSemanticEntityParser.java | 2 +-
2 files changed, 11 insertions(+), 11 deletions(-)
diff --git a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/NCENDefaultPipeline.java b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/NCENDefaultPipeline.java
index d679ed9..c504e78 100644
--- a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/NCENDefaultPipeline.java
+++ b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/NCENDefaultPipeline.java
@@ -34,12 +34,13 @@ import java.util.Collections;
import java.util.List;
/**
- *
+ * Default EN pipeline implementation based on the OpenNLP token parser and a set of built-in token enrichers, including the stopword enricher.
+ * At least one entity parser must also be provided.
*/
public class NCENDefaultPipeline implements NCModelPipeline {
private static final NCResourceReader reader = new NCResourceReader();
- private final NCTokenParser tp = new NCOpenNLPTokenParser(
+ private final NCTokenParser tokParser = new NCOpenNLPTokenParser(
reader.getPath("opennlp/en-token.bin"),
reader.getPath("opennlp/en-pos-maxent.bin"),
reader.getPath("opennlp/en-lemmatizer.dict")
@@ -51,17 +52,16 @@ public class NCENDefaultPipeline implements NCModelPipeline {
new NCQuotesTokenEnricher(),
new NCDictionaryTokenEnricher(),
new NCBracketsTokenEnricher()
-
);
- private final List<NCEntityParser> parsers;
+ private final List<NCEntityParser> entParsers;
/**
*
- * @param parsers
+ * @param entParsers
*/
- public NCENDefaultPipeline(List<NCEntityParser> parsers) {
- this.parsers = parsers;
+ public NCENDefaultPipeline(List<NCEntityParser> entParsers) {
+ this.entParsers = entParsers;
}
/**
@@ -69,17 +69,17 @@ public class NCENDefaultPipeline implements NCModelPipeline {
* @param parser
*/
public NCENDefaultPipeline(NCEntityParser parser) {
- this.parsers = Collections.singletonList(parser);
+ this.entParsers = Collections.singletonList(parser);
}
@Override
public NCTokenParser getTokenParser() {
- return tp;
+ return tokParser;
}
@Override
public List<NCEntityParser> getEntityParsers() {
- return parsers;
+ return entParsers;
}
@Override
diff --git a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/NCENSemanticEntityParser.java b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/NCENSemanticEntityParser.java
index 9a099dd..7cf3d55 100644
--- a/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/NCENSemanticEntityParser.java
+++ b/nlpcraft/src/main/scala/org/apache/nlpcraft/nlp/NCENSemanticEntityParser.java
@@ -29,7 +29,7 @@ import java.util.List;
import java.util.Map;
/**
- *
+ * Wrapper around {@link NCSemanticEntityParser} that uses the OpenNLP token parser (the same one as {@link NCENDefaultPipeline}) and a built-in EN stemmer.
*/
public class NCENSemanticEntityParser extends NCSemanticEntityParser {
private static final NCResourceReader reader = new NCResourceReader();