You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@opennlp.apache.org by jo...@apache.org on 2014/02/28 17:38:45 UTC

svn commit: r1572991 - /opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java

Author: joern
Date: Fri Feb 28 16:38:45 2014
New Revision: 1572991

URL: http://svn.apache.org/r1572991
Log:
OPENNLP-658 Added an interface for the sequence coding. And implementations for IOB2 and BILOU coding 

Added:
    opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java

Added: opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java
URL: http://svn.apache.org/viewvc/opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java?rev=1572991&view=auto
==============================================================================
--- opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java (added)
+++ opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java Fri Feb 28 16:38:45 2014
@@ -0,0 +1,84 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package opennlp.tools.namefind;
+
+import java.util.ArrayList;
+import java.util.List;
+
+import opennlp.tools.util.SequenceCodec;
+import opennlp.tools.util.SequenceValidator;
+import opennlp.tools.util.Span;
+
+/**
+ * Checks whether an outcome may follow the outcomes already assigned to the
+ * preceding tokens when names are tagged with start, continue, last, unit and
+ * other outcomes (BILOU coding).
+ * <p>
+ * Rules enforced by {@link #validSequence(int, String[], String[], String)}:
+ * <ul>
+ * <li>a continue or last outcome is only accepted directly after a start or
+ * continue outcome whose name type, as reported by
+ * {@code NameFinderME.extractNameType}, equals its own;</li>
+ * <li>a continue or last outcome is rejected at the first position and
+ * directly after an other, unit or last outcome, because no name is open
+ * there;</li>
+ * <li>an other outcome is rejected directly after a start or continue
+ * outcome, because the open name was never closed with a last outcome.</li>
+ * </ul>
+ */
+public class BilouNameFinderSequenceValidator implements
+    SequenceValidator<String> {
+
+  /**
+   * Decides whether {@code outcome} is a valid successor of the outcomes
+   * assigned so far.
+   *
+   * @param i index of the token being labelled; not used by this implementation
+   * @param inputSequence the tokens being labelled; not used by this implementation
+   * @param outcomesSequence the outcomes assigned so far; only the last element
+   *     is inspected, and an empty array means the first token is being labelled
+   * @param outcome the candidate outcome for the current token
+   * @return {@code true} if the candidate may follow the previous outcome,
+   *     {@code false} otherwise
+   */
+  public boolean validSequence(int i, String[] inputSequence,
+      String[] outcomesSequence, String outcome) {
+
+    // Outcome of the directly preceding token; null when there is none.
+    String previous = null;
+    if (outcomesSequence.length > 0) {
+      previous = outcomesSequence[outcomesSequence.length - 1];
+    }
+
+    if (outcome.endsWith(NameFinderME.CONTINUE) || outcome.endsWith(BilouCodec.LAST)) {
+
+      if (previous == null) {
+        // Nothing has been started yet, so there is nothing to continue or end.
+        return false;
+      }
+
+      if (previous.endsWith(NameFinderME.OTHER)
+          || previous.endsWith(BilouCodec.UNIT)
+          || previous.endsWith(BilouCodec.LAST)) {
+        // No name is open after an other, unit or last outcome. The last case
+        // was previously let through, which allowed continuing a closed name.
+        return false;
+      }
+
+      if (previous.endsWith(NameFinderME.CONTINUE)
+          || previous.endsWith(NameFinderME.START)) {
+        // A name is open; the candidate must carry the same name type.
+        String previousNameType = NameFinderME.extractNameType(previous);
+        String nameType = NameFinderME.extractNameType(outcome);
+        if (previousNameType != null || nameType != null) {
+          return nameType != null && nameType.equals(previousNameType);
+        }
+        // Neither outcome carries a name type: fall through and accept.
+      }
+    }
+
+    // An open name must not be followed by other. The old guard
+    // (length - 1 > 0) skipped this check when exactly one outcome preceded.
+    if (previous != null && outcome.endsWith(NameFinderME.OTHER)) {
+      if (previous.endsWith(NameFinderME.START)
+          || previous.endsWith(NameFinderME.CONTINUE)) {
+        return false;
+      }
+    }
+
+    return true;
+  }
+
+  /**
+   * Ad-hoc debug entry point: decodes a fixed four-outcome sequence with a
+   * {@code BilouCodec} and prints an empty line. The decoded spans are not
+   * inspected.
+   *
+   * @param args ignored
+   */
+  // NOTE(review): looks like a leftover manual experiment; consider moving it
+  // into a unit test and removing it from the production class.
+  public static void main(String[] args) {
+
+    SequenceCodec codec = new BilouCodec();
+
+    List<String> outcomes = new ArrayList<String>();
+    outcomes.add("default-start");
+    outcomes.add("default-cont");
+    outcomes.add("default-last");
+    outcomes.add("default-unit");
+
+    // Result intentionally unused; the call only exercises the codec.
+    Span[] spans = codec.decode(outcomes);
+
+    System.out.println();
+  }
+}
\ No newline at end of file