You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@opennlp.apache.org by jo...@apache.org on 2014/02/28 17:38:45 UTC
svn commit: r1572991 -
/opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java
Author: joern
Date: Fri Feb 28 16:38:45 2014
New Revision: 1572991
URL: http://svn.apache.org/r1572991
Log:
OPENNLP-658 Added an interface for the sequence coding. And implementations for IOB2 and BILOU coding
Added:
opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java
Added: opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java
URL: http://svn.apache.org/viewvc/opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java?rev=1572991&view=auto
==============================================================================
--- opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java (added)
+++ opennlp/trunk/opennlp-tools/src/main/java/opennlp/tools/namefind/BilouNameFinderSequenceValidator.java Fri Feb 28 16:38:45 2014
@@ -0,0 +1,84 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package opennlp.tools.namefind;
+
+import java.util.ArrayList;
+import java.util.List;
+
+import opennlp.tools.util.SequenceCodec;
+import opennlp.tools.util.SequenceValidator;
+import opennlp.tools.util.Span;
+
+/**
+ * Validates outcome sequences for the BILOU coding, in which a name is either
+ * a single unit token or a start, any number of cont tokens and a last token.
+ */
+public class BilouNameFinderSequenceValidator implements
+    SequenceValidator<String> {
+
+  /**
+   * Decides whether {@code outcome} may follow the outcomes chosen so far.
+   *
+   * @param i index of the current token (not used)
+   * @param inputSequence the input tokens (not used)
+   * @param outcomesSequence outcomes already assigned to the preceding tokens
+   * @param outcome candidate outcome for the current token
+   * @return {@code true} if the candidate keeps the sequence well formed
+   */
+  public boolean validSequence(int i, String[] inputSequence,
+      String[] outcomesSequence, String outcome) {
+    // A name is open when the preceding outcome is a start or cont.
+    boolean nameOpen = false;
+    String previous = null;
+    if (outcomesSequence.length > 0) {
+      previous = outcomesSequence[outcomesSequence.length - 1];
+      nameOpen = previous.endsWith(NameFinderME.START)
+          || previous.endsWith(NameFinderME.CONTINUE);
+    }
+
+    if (!outcome.endsWith(NameFinderME.CONTINUE) && !outcome.endsWith(BilouCodec.LAST)) {
+      // Anything but cont/last (start, unit, other) must not interrupt an open name.
+      return !nameOpen;
+    }
+    if (!nameOpen) {
+      // cont/last cannot open a sentence or follow other, unit or last.
+      return false;
+    }
+
+    // cont/last must carry the type of the open name; two outcomes without a
+    // type (extractNameType returned null for both) count as matching.
+    String previousNameType = NameFinderME.extractNameType(previous);
+    String nameType = NameFinderME.extractNameType(outcome);
+    return nameType == null ? previousNameType == null : nameType.equals(previousNameType);
+  }
+
+  /**
+   * Smoke test: decodes a small BILOU outcome sequence and prints the spans.
+   * @param args ignored
+   */
+  public static void main(String[] args) {
+    List<String> outcomes = new ArrayList<String>();
+    outcomes.add("default-start");
+    outcomes.add("default-cont");
+    outcomes.add("default-last");
+    outcomes.add("default-unit");
+    for (Span span : new BilouCodec().decode(outcomes)) {
+      System.out.println(span);
+    }
+  }
+}
\ No newline at end of file