You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@opennlp.apache.org by jo...@apache.org on 2012/07/13 11:46:20 UTC

svn commit: r1361129 - in /opennlp/trunk/opennlp-tools/lang/fr: ./ tokenizer/ tokenizer/fr-detokenizer.xml

Author: joern
Date: Fri Jul 13 09:46:20 2012
New Revision: 1361129

URL: http://svn.apache.org/viewvc?rev=1361129&view=rev
Log:
OPENNLP-523 Initial check in of the French detokenizer dictionary.

Added:
    opennlp/trunk/opennlp-tools/lang/fr/
    opennlp/trunk/opennlp-tools/lang/fr/tokenizer/
    opennlp/trunk/opennlp-tools/lang/fr/tokenizer/fr-detokenizer.xml   (with props)

Added: opennlp/trunk/opennlp-tools/lang/fr/tokenizer/fr-detokenizer.xml
URL: http://svn.apache.org/viewvc/opennlp/trunk/opennlp-tools/lang/fr/tokenizer/fr-detokenizer.xml?rev=1361129&view=auto
==============================================================================
--- opennlp/trunk/opennlp-tools/lang/fr/tokenizer/fr-detokenizer.xml (added)
+++ opennlp/trunk/opennlp-tools/lang/fr/tokenizer/fr-detokenizer.xml Fri Jul 13 09:46:20 2012
@@ -0,0 +1,225 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements.  See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership.  The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License.  You may obtain a copy of the License at
+
+http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied.  See the License for the
+specific language governing permissions and limitations
+under the License.
+-->
+
+<!--
+French detokenizer dictionary. Each entry names a token and the operation
+the detokenizer applies to it when re-joining tokens into text:
+  MOVE_LEFT            attach the token to the token on its left
+  MOVE_RIGHT           attach the token to the token on its right
+  RIGHT_LEFT_MATCHING  attach to the right on the first occurrence and
+                       to the left on the second (paired quote marks)
+-->
+
+<dictionary>
+  <!-- Quote marks that open and close with the same character. -->
+  <entry operation="RIGHT_LEFT_MATCHING">
+    <token>"</token>
+  </entry>
+  <entry operation="RIGHT_LEFT_MATCHING">
+    <token>'</token>
+  </entry>
+  <!-- Punctuation, brackets and symbols. -->
+  <entry operation="MOVE_LEFT">
+    <token>.</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>?</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>!</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>,</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>;</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>:</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>(</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>)</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>}</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>{</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>]</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>[</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>``</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>''</token>
+  </entry>
+  <entry operation="MOVE_LEFT">
+    <token>%</token>
+  </entry>
+  <!-- Elided forms ending in an apostrophe; they attach to the following word. -->
+  <entry operation="MOVE_RIGHT">
+    <token>L'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>l'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>D'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>d'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>S'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>s'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>N'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>n'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>C'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>c'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>M'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>m'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>J'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>j'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>T'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>t'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Z'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>z'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Qu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>qu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Ma'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>ma'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Jusqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>jusqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>AUJOURD'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Aujourd'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>aujourd'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Lorsqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>lorsqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Puisqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>puisqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Presqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>presqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Prud'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>prud'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Quelqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>quelqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Quoiqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>quoiqu'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>dizaï'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Optim'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Demak'</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>Automobil'</token>
+  </entry>
+  <!-- Miscellaneous tokens. -->
+  <entry operation="MOVE_LEFT">
+    <token>s</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>ex-</token>
+  </entry>
+  <entry operation="MOVE_RIGHT">
+    <token>#</token>
+  </entry>
+</dictionary>

Propchange: opennlp/trunk/opennlp-tools/lang/fr/tokenizer/fr-detokenizer.xml
------------------------------------------------------------------------------
    svn:mime-type = text/plain