You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ma...@apache.org on 2016/03/02 06:42:20 UTC

[11/20] tika git commit: fix for TIKA-1876 contributed by manalishah

fix for TIKA-1876 contributed by manalishah


Project: http://git-wip-us.apache.org/repos/asf/tika/repo
Commit: http://git-wip-us.apache.org/repos/asf/tika/commit/a13369b0
Tree: http://git-wip-us.apache.org/repos/asf/tika/tree/a13369b0
Diff: http://git-wip-us.apache.org/repos/asf/tika/diff/a13369b0

Branch: refs/heads/master
Commit: a13369b098bea09421e35023c131adc092dcb6e4
Parents: 6c595fb
Author: manali <ma...@gmail.com>
Authored: Fri Feb 26 18:21:15 2016 -0800
Committer: manali <ma...@gmail.com>
Committed: Fri Feb 26 18:21:15 2016 -0800

----------------------------------------------------------------------
 .../org/apache/tika/parser/ner/nltk/NLTKNERecogniser.java   | 9 ---------
 .../org/apache/tika/parser/ner/nltk/NLTKServer.properties   | 2 +-
 .../apache/tika/parser/ner/nltk/NLTKNERecogniserTest.java   | 2 +-
 3 files changed, 2 insertions(+), 11 deletions(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/tika/blob/a13369b0/tika-parsers/src/main/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniser.java
----------------------------------------------------------------------
diff --git a/tika-parsers/src/main/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniser.java b/tika-parsers/src/main/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniser.java
index eddddcb..1edfe28 100644
--- a/tika-parsers/src/main/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniser.java
+++ b/tika-parsers/src/main/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniser.java
@@ -45,15 +45,6 @@ public class NLTKNERecogniser implements NERecogniser {
      * some common entities identified by NLTK
      */
     public static final Set<String> ENTITY_TYPES = new HashSet<String>(){{
-        add(PERSON);
-        add(TIME);
-        add(LOCATION);
-        add(ORGANIZATION);
-        add(MONEY);
-        add(PERCENT);
-        add(DATE);
-        add(FACILITY);
-        add(GPE);
         add("NAMES");
     }};
 

http://git-wip-us.apache.org/repos/asf/tika/blob/a13369b0/tika-parsers/src/main/resources/org/apache/tika/parser/ner/nltk/NLTKServer.properties
----------------------------------------------------------------------
diff --git a/tika-parsers/src/main/resources/org/apache/tika/parser/ner/nltk/NLTKServer.properties b/tika-parsers/src/main/resources/org/apache/tika/parser/ner/nltk/NLTKServer.properties
index 24f5a2e..5909b69 100644
--- a/tika-parsers/src/main/resources/org/apache/tika/parser/ner/nltk/NLTKServer.properties
+++ b/tika-parsers/src/main/resources/org/apache/tika/parser/ner/nltk/NLTKServer.properties
@@ -13,4 +13,4 @@
 #  See the License for the specific language governing permissions and
 #  limitations under the License.
 
-nltk.server.url=http://localhost:5000
+nltk.server.url=http://localhost:8881

http://git-wip-us.apache.org/repos/asf/tika/blob/a13369b0/tika-parsers/src/test/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniserTest.java
----------------------------------------------------------------------
diff --git a/tika-parsers/src/test/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniserTest.java b/tika-parsers/src/test/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniserTest.java
index a40ec24..5c1307f 100644
--- a/tika-parsers/src/test/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniserTest.java
+++ b/tika-parsers/src/test/java/org/apache/tika/parser/ner/nltk/NLTKNERecogniserTest.java
@@ -36,7 +36,7 @@ import static org.junit.Assert.assertTrue;
 public class NLTKNERecogniserTest {
     @Test
     public void testGetEntityTypes() throws Exception {
-        String text = "America";
+        String text = "America is a big country.";
         System.setProperty(NamedEntityParser.SYS_PROP_NER_IMPL, NLTKNERecogniser.class.getName());
         Tika tika = new Tika(new TikaConfig(NamedEntityParser.class.getResourceAsStream("tika-config.xml")));
         Metadata md = new Metadata();