You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@lenya.apache.org by mi...@apache.org on 2005/11/16 16:24:54 UTC
svn commit: r345035 - in /lenya/trunk/src/webapp/WEB-INF: analyzer/
analyzer/stopword/ xconf/
Author: michi
Date: Wed Nov 16 07:24:44 2005
New Revision: 345035
URL: http://svn.apache.org/viewcvs?rev=345035&view=rev
Log:
more lucene stuff of Robert Goene added
Added:
lenya/trunk/src/webapp/WEB-INF/analyzer/
lenya/trunk/src/webapp/WEB-INF/analyzer/perfieldconf.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Danish_da.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Dutch_nl.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/English_en.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Finnish_fi.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/French_fr.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/German_de.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Italian_it.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Norwegian_no.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Polish_pl.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Portuguese_pt.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Spanish_es.xml
lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Swedish_sv.xml
lenya/trunk/src/webapp/WEB-INF/xconf/
lenya/trunk/src/webapp/WEB-INF/xconf/lucene2.xconf
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/perfieldconf.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/perfieldconf.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/perfieldconf.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/perfieldconf.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+<!-- Allows analyzing multi-language documents. -->
+ <config defaultAnalyzer="stopword_fr">
+ <field name="description_en" analyzer="stopword_en"/>
+ <field name="subject" analyzer="stopword_en"/>
+ </config>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Danish_da.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Danish_da.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Danish_da.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Danish_da.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,66 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>af</stopword>
+ <stopword>aldrig</stopword>
+ <stopword>alle</stopword>
+ <stopword>altid</stopword>
+ <stopword>bagved</stopword>
+ <stopword>de</stopword>
+ <stopword>der</stopword>
+ <stopword>du</stopword>
+ <stopword>efter</stopword>
+ <stopword>eller</stopword>
+ <stopword>en</stopword>
+ <stopword>endnu</stopword>
+ <stopword>et</stopword>
+ <stopword>fjernt</stopword>
+ <stopword>for</stopword>
+ <stopword>foran</stopword>
+ <stopword>fra</stopword>
+ <stopword>få</stopword>
+ <stopword>gennem</stopword>
+ <stopword>god</stopword>
+ <stopword>han</stopword>
+ <stopword>her</stopword>
+ <stopword>hos</stopword>
+ <stopword>hvorfor</stopword>
+ <stopword>hun</stopword>
+ <stopword>hurtig</stopword>
+ <stopword>hvad</stopword>
+ <stopword>hvem</stopword>
+ <stopword>hvornår</stopword>
+ <stopword>hvor</stopword>
+ <stopword>hvordan</stopword>
+ <stopword>hvorhen</stopword>
+ <stopword>i</stopword>
+ <stopword>imod</stopword>
+ <stopword>ja</stopword>
+ <stopword>jeg</stopword>
+ <stopword>langsom</stopword>
+ <stopword>lidt</stopword>
+ <stopword>mange</stopword>
+ <stopword>med</stopword>
+ <stopword>meget</stopword>
+ <stopword>mellem</stopword>
+ <stopword>mere</stopword>
+ <stopword>mindre</stopword>
+ <stopword>måske</stopword>
+ <stopword>nede</stopword>
+ <stopword>nej</stopword>
+ <stopword>nok</stopword>
+ <stopword>nu</stopword>
+ <stopword>når</stopword>
+ <stopword>og</stopword>
+ <stopword>oppe</stopword>
+ <stopword>på</stopword>
+ <stopword>rask</stopword>
+ <stopword>sammen</stopword>
+ <stopword>temmelig</stopword>
+ <stopword>til</stopword>
+ <stopword>uden</stopword>
+ <stopword>udenfor</stopword>
+ <stopword>under</stopword>
+ <stopword>ved</stopword>
+ <stopword>vi</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Dutch_nl.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Dutch_nl.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Dutch_nl.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Dutch_nl.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,264 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>aan</stopword>
+ <stopword>aangaande</stopword>
+ <stopword>aangezien</stopword>
+ <stopword>achter</stopword>
+ <stopword>achterna</stopword>
+ <stopword>afgelopen</stopword>
+ <stopword>al</stopword>
+ <stopword>aldaar</stopword>
+ <stopword>aldus</stopword>
+ <stopword>alhoewel</stopword>
+ <stopword>alias</stopword>
+ <stopword>alle</stopword>
+ <stopword>allebei</stopword>
+ <stopword>alleen</stopword>
+ <stopword>alsnog</stopword>
+ <stopword>altijd</stopword>
+ <stopword>altoos</stopword>
+ <stopword>ander</stopword>
+ <stopword>andere</stopword>
+ <stopword>anders</stopword>
+ <stopword>anderszins</stopword>
+ <stopword>behalve</stopword>
+ <stopword>behoudens</stopword>
+ <stopword>beide</stopword>
+ <stopword>beiden</stopword>
+ <stopword>ben</stopword>
+ <stopword>beneden</stopword>
+ <stopword>bent</stopword>
+ <stopword>bepaald</stopword>
+ <stopword>betreffende</stopword>
+ <stopword>bij</stopword>
+ <stopword>binnen</stopword>
+ <stopword>binnenin</stopword>
+ <stopword>boven</stopword>
+ <stopword>bovenal</stopword>
+ <stopword>bovendien</stopword>
+ <stopword>bovengenoemd</stopword>
+ <stopword>bovenstaand</stopword>
+ <stopword>bovenvermeld</stopword>
+ <stopword>buiten</stopword>
+ <stopword>daar</stopword>
+ <stopword>daarheen</stopword>
+ <stopword>daarin</stopword>
+ <stopword>daarna</stopword>
+ <stopword>daarnet</stopword>
+ <stopword>daarom</stopword>
+ <stopword>daarop</stopword>
+ <stopword>daarvanlangs</stopword>
+ <stopword>dan</stopword>
+ <stopword>dat</stopword>
+ <stopword>de</stopword>
+ <stopword>die</stopword>
+ <stopword>dikwijls</stopword>
+ <stopword>dit</stopword>
+ <stopword>door</stopword>
+ <stopword>doorgaand</stopword>
+ <stopword>dus</stopword>
+ <stopword>echter</stopword>
+ <stopword>eer</stopword>
+ <stopword>eerdat</stopword>
+ <stopword>eerder</stopword>
+ <stopword>eerlang</stopword>
+ <stopword>eerst</stopword>
+ <stopword>elk</stopword>
+ <stopword>elke</stopword>
+ <stopword>en</stopword>
+ <stopword>enig</stopword>
+ <stopword>enigszins</stopword>
+ <stopword>enkel</stopword>
+ <stopword>er</stopword>
+ <stopword>erdoor</stopword>
+ <stopword>even</stopword>
+ <stopword>eveneens</stopword>
+ <stopword>evenwel</stopword>
+ <stopword>gauw</stopword>
+ <stopword>gedurende</stopword>
+ <stopword>geen</stopword>
+ <stopword>gehad</stopword>
+ <stopword>gekund</stopword>
+ <stopword>geleden</stopword>
+ <stopword>gelijk</stopword>
+ <stopword>gemoeten</stopword>
+ <stopword>gemogen</stopword>
+ <stopword>geweest</stopword>
+ <stopword>gewoon</stopword>
+ <stopword>gewoonweg</stopword>
+ <stopword>haar</stopword>
+ <stopword>had</stopword>
+ <stopword>hadden</stopword>
+ <stopword>hare</stopword>
+ <stopword>heb</stopword>
+ <stopword>hebben</stopword>
+ <stopword>hebt</stopword>
+ <stopword>heeft</stopword>
+ <stopword>hem</stopword>
+ <stopword>hen</stopword>
+ <stopword>het</stopword>
+ <stopword>hierbeneden</stopword>
+ <stopword>hierboven</stopword>
+ <stopword>hij</stopword>
+ <stopword>hoe</stopword>
+ <stopword>hoewel</stopword>
+ <stopword>hun</stopword>
+ <stopword>hunne</stopword>
+ <stopword>ik</stopword>
+ <stopword>ikzelf</stopword>
+ <stopword>in</stopword>
+ <stopword>inmiddels</stopword>
+ <stopword>inzake</stopword>
+ <stopword>is</stopword>
+ <stopword>jezelf</stopword>
+ <stopword>jij</stopword>
+ <stopword>jijzelf</stopword>
+ <stopword>jou</stopword>
+ <stopword>jouw</stopword>
+ <stopword>jouwe</stopword>
+ <stopword>juist</stopword>
+ <stopword>jullie</stopword>
+ <stopword>kan</stopword>
+ <stopword>klaar</stopword>
+ <stopword>kon</stopword>
+ <stopword>konden</stopword>
+ <stopword>krachtens</stopword>
+ <stopword>kunnen</stopword>
+ <stopword>kunt</stopword>
+ <stopword>later</stopword>
+ <stopword>liever</stopword>
+ <stopword>maar</stopword>
+ <stopword>mag</stopword>
+ <stopword>meer</stopword>
+ <stopword>met</stopword>
+ <stopword>mezelf</stopword>
+ <stopword>mij</stopword>
+ <stopword>mijn</stopword>
+ <stopword>mijnent</stopword>
+ <stopword>mijner</stopword>
+ <stopword>mijzelf</stopword>
+ <stopword>misschien</stopword>
+ <stopword>mocht</stopword>
+ <stopword>mochten</stopword>
+ <stopword>moest</stopword>
+ <stopword>moesten</stopword>
+ <stopword>moet</stopword>
+ <stopword>moeten</stopword>
+ <stopword>mogen</stopword>
+ <stopword>na</stopword>
+ <stopword>naar</stopword>
+ <stopword>nadat</stopword>
+ <stopword>net</stopword>
+ <stopword>niet</stopword>
+ <stopword>noch</stopword>
+ <stopword>nog</stopword>
+ <stopword>nogal</stopword>
+ <stopword>nu</stopword>
+ <stopword>of</stopword>
+ <stopword>ofschoon</stopword>
+ <stopword>om</stopword>
+ <stopword>omdat</stopword>
+ <stopword>omhoog</stopword>
+ <stopword>omlaag</stopword>
+ <stopword>omstreeks</stopword>
+ <stopword>omtrent</stopword>
+ <stopword>omver</stopword>
+ <stopword>onder</stopword>
+ <stopword>ondertussen</stopword>
+ <stopword>ongeveer</stopword>
+ <stopword>ons</stopword>
+ <stopword>onszelf</stopword>
+ <stopword>onze</stopword>
+ <stopword>ook</stopword>
+ <stopword>op</stopword>
+ <stopword>opnieuw</stopword>
+ <stopword>opzij</stopword>
+ <stopword>over</stopword>
+ <stopword>overeind</stopword>
+ <stopword>overigens</stopword>
+ <stopword>pas</stopword>
+ <stopword>precies</stopword>
+ <stopword>reeds</stopword>
+ <stopword>rond</stopword>
+ <stopword>rondom</stopword>
+ <stopword>sedert</stopword>
+ <stopword>sinds</stopword>
+ <stopword>sindsdien</stopword>
+ <stopword>slechts</stopword>
+ <stopword>sommige</stopword>
+ <stopword>spoedig</stopword>
+ <stopword>steeds</stopword>
+ <stopword>tamelijk</stopword>
+ <stopword>tenzij</stopword>
+ <stopword>terwijl</stopword>
+ <stopword>thans</stopword>
+ <stopword>tijdens</stopword>
+ <stopword>toch</stopword>
+ <stopword>toen</stopword>
+ <stopword>toenmaals</stopword>
+ <stopword>toenmalig</stopword>
+ <stopword>tot</stopword>
+ <stopword>totdat</stopword>
+ <stopword>tussen</stopword>
+ <stopword>uit</stopword>
+ <stopword>uitgezonderd</stopword>
+ <stopword>vaak</stopword>
+ <stopword>van</stopword>
+ <stopword>vandaan</stopword>
+ <stopword>vanuit</stopword>
+ <stopword>vanwege</stopword>
+ <stopword>veeleer</stopword>
+ <stopword>verder</stopword>
+ <stopword>vervolgens</stopword>
+ <stopword>vol</stopword>
+ <stopword>volgens</stopword>
+ <stopword>voor</stopword>
+ <stopword>vooraf</stopword>
+ <stopword>vooral</stopword>
+ <stopword>vooralsnog</stopword>
+ <stopword>voorbij</stopword>
+ <stopword>voordat</stopword>
+ <stopword>voordezen</stopword>
+ <stopword>voordien</stopword>
+ <stopword>voorheen</stopword>
+ <stopword>voorop</stopword>
+ <stopword>vooruit</stopword>
+ <stopword>vrij</stopword>
+ <stopword>vroeg</stopword>
+ <stopword>waar</stopword>
+ <stopword>waarom</stopword>
+ <stopword>wanneer</stopword>
+ <stopword>want</stopword>
+ <stopword>waren</stopword>
+ <stopword>was</stopword>
+ <stopword>wat</stopword>
+ <stopword>weer</stopword>
+ <stopword>weg</stopword>
+ <stopword>wegens</stopword>
+ <stopword>wel</stopword>
+ <stopword>weldra</stopword>
+ <stopword>welk</stopword>
+ <stopword>welke</stopword>
+ <stopword>wie</stopword>
+ <stopword>wiens</stopword>
+ <stopword>wier</stopword>
+ <stopword>wij</stopword>
+ <stopword>wijzelf</stopword>
+ <stopword>zal</stopword>
+ <stopword>ze</stopword>
+ <stopword>zelfs</stopword>
+ <stopword>zichzelf</stopword>
+ <stopword>zij</stopword>
+ <stopword>zijn</stopword>
+ <stopword>zijne</stopword>
+ <stopword>zo</stopword>
+ <stopword>zodra</stopword>
+ <stopword>zonder</stopword>
+ <stopword>zou</stopword>
+ <stopword>zouden</stopword>
+ <stopword>zowat</stopword>
+ <stopword>zulke</stopword>
+ <stopword>zullen</stopword>
+ <stopword>zult</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/English_en.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/English_en.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/English_en.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/English_en.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,80 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>a</stopword>
+ <stopword>about</stopword>
+ <stopword>after</stopword>
+ <stopword>all</stopword>
+ <stopword>also</stopword>
+ <stopword>an</stopword>
+ <stopword>and</stopword>
+ <stopword>any</stopword>
+ <stopword>are</stopword>
+ <stopword>as</stopword>
+ <stopword>at</stopword>
+ <stopword>be</stopword>
+ <stopword>because</stopword>
+ <stopword>been</stopword>
+ <stopword>but</stopword>
+ <stopword>by</stopword>
+ <stopword>can</stopword>
+ <stopword>co</stopword>
+ <stopword>corp</stopword>
+ <stopword>could</stopword>
+ <stopword>for</stopword>
+ <stopword>from</stopword>
+ <stopword>had</stopword>
+ <stopword>has</stopword>
+ <stopword>have</stopword>
+ <stopword>he</stopword>
+ <stopword>her</stopword>
+ <stopword>his</stopword>
+ <stopword>if</stopword>
+ <stopword>in</stopword>
+ <stopword>inc</stopword>
+ <stopword>into</stopword>
+ <stopword>is</stopword>
+ <stopword>it</stopword>
+ <stopword>its</stopword>
+ <stopword>last</stopword>
+ <stopword>more</stopword>
+ <stopword>most</stopword>
+ <stopword>mr</stopword>
+ <stopword>mrs</stopword>
+ <stopword>ms</stopword>
+ <stopword>mz</stopword>
+ <stopword>no</stopword>
+ <stopword>not</stopword>
+ <stopword>of</stopword>
+ <stopword>on</stopword>
+ <stopword>one</stopword>
+ <stopword>only</stopword>
+ <stopword>or</stopword>
+ <stopword>other</stopword>
+ <stopword>out</stopword>
+ <stopword>over</stopword>
+ <stopword>s</stopword>
+ <stopword>says</stopword>
+ <stopword>she</stopword>
+ <stopword>so</stopword>
+ <stopword>some</stopword>
+ <stopword>such</stopword>
+ <stopword>than</stopword>
+ <stopword>that</stopword>
+ <stopword>the</stopword>
+ <stopword>their</stopword>
+ <stopword>there</stopword>
+ <stopword>they</stopword>
+ <stopword>this</stopword>
+ <stopword>to</stopword>
+ <stopword>up</stopword>
+ <stopword>was</stopword>
+ <stopword>we</stopword>
+ <stopword>were</stopword>
+ <stopword>when</stopword>
+ <stopword>which</stopword>
+ <stopword>who</stopword>
+ <stopword>will</stopword>
+ <stopword>with</stopword>
+ <stopword>would</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Finnish_fi.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Finnish_fi.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Finnish_fi.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Finnish_fi.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,72 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>alla</stopword>
+ <stopword>ansiosta</stopword>
+ <stopword>ehkä</stopword>
+ <stopword>ei</stopword>
+ <stopword>enemmän</stopword>
+ <stopword>ennen</stopword>
+ <stopword>edessä</stopword>
+ <stopword>f</stopword>
+ <stopword>kaikki</stopword>
+ <stopword>he</stopword>
+ <stopword>hitaasti</stopword>
+ <stopword>hoikein</stopword>
+ <stopword>hyvin</stopword>
+ <stopword>hän</stopword>
+ <stopword>ilman</stopword>
+ <stopword>ja</stopword>
+ <stopword>jos</stopword>
+ <stopword>jälkeen</stopword>
+ <stopword>kanssa</stopword>
+ <stopword>kaukana</stopword>
+ <stopword>kenties</stopword>
+ <stopword>keskellä</stopword>
+ <stopword>kesken</stopword>
+ <stopword>koskaan</stopword>
+ <stopword>kuinkan</stopword>
+ <stopword>kuka</stopword>
+ <stopword>kylliksi</stopword>
+ <stopword>kyllä</stopword>
+ <stopword>liian</stopword>
+ <stopword>lla</stopword>
+ <stopword>lla</stopword>
+ <stopword>luona</stopword>
+ <stopword>lähellä</stopword>
+ <stopword>läpi</stopword>
+ <stopword>me</stopword>
+ <stopword>miksi</stopword>
+ <stopword>mikä</stopword>
+ <stopword>milloin</stopword>
+ <stopword>milloinkaan</stopword>
+ <stopword>minä</stopword>
+ <stopword>missä</stopword>
+ <stopword>miten</stopword>
+ <stopword>nopeasti</stopword>
+ <stopword>nyt</stopword>
+ <stopword>oikea</stopword>
+ <stopword>oikealla</stopword>
+ <stopword>paljon</stopword>
+ <stopword>siellä</stopword>
+ <stopword>sinä</stopword>
+ <stopword>ssa</stopword>
+ <stopword>sta</stopword>
+ <stopword>suoraan</stopword>
+ <stopword>tai</stopword>
+ <stopword>takana</stopword>
+ <stopword>takia</stopword>
+ <stopword>tarpeeksi</stopword>
+ <stopword>te</stopword>
+ <stopword>tässä</stopword>
+ <stopword>ulkopuolella</stopword>
+ <stopword>vähemmän</stopword>
+ <stopword>vasen</stopword>
+ <stopword>vasemmalla</stopword>
+ <stopword>vastan</stopword>
+ <stopword>vielä</stopword>
+ <stopword>vieressä</stopword>
+ <stopword>vähän</stopword>
+ <stopword>yhdessä</stopword>
+ <stopword>ylös</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/French_fr.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/French_fr.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/French_fr.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/French_fr.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,430 @@
+<?xml version="1.0" encoding="ISO-8859-1"?>
+
+<!--
+Contribution de Nico Maisonneuve, nicoo_@hotmail.com,
+construit à partir de la liste que l'on trouve sur le site:
+http://www.unine.ch/Info/clef/
+ -->
+
+<french useStopWords="true" keepAccents="false">
+
+<stopWords>
+ <stopWord>a</stopWord>
+ <stopWord>à</stopWord>
+ <stopWord>â</stopWord>
+ <stopWord>abord</stopWord>
+ <stopWord>afin</stopWord>
+ <stopWord>ah</stopWord>
+ <stopWord>ai</stopWord>
+ <stopWord>aie</stopWord>
+ <stopWord>ainsi</stopWord>
+ <stopWord>allaient</stopWord>
+ <stopWord>allo</stopWord>
+ <stopWord>allô</stopWord>
+ <stopWord>allons</stopWord>
+ <stopWord>après</stopWord>
+ <stopWord>assez</stopWord>
+ <stopWord>attendu</stopWord>
+ <stopWord>au</stopWord>
+ <stopWord>aucun</stopWord>
+ <stopWord>aucune</stopWord>
+ <stopWord>aujourd</stopWord>
+ <stopWord>aujourd'hui</stopWord>
+ <stopWord>auquel</stopWord>
+ <stopWord>aura</stopWord>
+ <stopWord>auront</stopWord>
+ <stopWord>aussi</stopWord>
+ <stopWord>autre</stopWord>
+ <stopWord>autres</stopWord>
+ <stopWord>aux</stopWord>
+ <stopWord>auxquelles</stopWord>
+ <stopWord>auxquels</stopWord>
+ <stopWord>avaient</stopWord>
+ <stopWord>avais</stopWord>
+ <stopWord>avait</stopWord>
+ <stopWord>avant</stopWord>
+ <stopWord>avec</stopWord>
+ <stopWord>avoir</stopWord>
+ <stopWord>ayant</stopWord>
+ <stopWord>b</stopWord>
+ <stopWord>bah</stopWord>
+ <stopWord>beaucoup</stopWord>
+ <stopWord>bien</stopWord>
+ <stopWord>bigre</stopWord>
+ <stopWord>boum</stopWord>
+ <stopWord>bravo</stopWord>
+ <stopWord>brrr</stopWord>
+ <stopWord>c</stopWord>
+ <stopWord>ça</stopWord>
+ <stopWord>car</stopWord>
+ <stopWord>ce</stopWord>
+ <stopWord>ceci</stopWord>
+ <stopWord>cela</stopWord>
+ <stopWord>celle</stopWord>
+ <stopWord>celle-ci</stopWord>
+ <stopWord>celle-là</stopWord>
+ <stopWord>celles</stopWord>
+ <stopWord>celles-ci</stopWord>
+ <stopWord>celles-là</stopWord>
+ <stopWord>celui</stopWord>
+ <stopWord>celui-ci</stopWord>
+ <stopWord>celui-là</stopWord>
+ <stopWord>cependant</stopWord>
+ <stopWord>certain</stopWord>
+ <stopWord>certaine</stopWord>
+ <stopWord>certaines</stopWord>
+ <stopWord>certains</stopWord>
+ <stopWord>certes</stopWord>
+ <stopWord>ces</stopWord>
+ <stopWord>cet</stopWord>
+ <stopWord>cette</stopWord>
+ <stopWord>ceux</stopWord>
+ <stopWord>ceux-ci</stopWord>
+ <stopWord>ceux-là</stopWord>
+ <stopWord>chacun</stopWord>
+ <stopWord>chaque</stopWord>
+ <stopWord>cher</stopWord>
+ <stopWord>chère</stopWord>
+ <stopWord>chères</stopWord>
+ <stopWord>chers</stopWord>
+ <stopWord>chez</stopWord>
+ <stopWord>chiche</stopWord>
+ <stopWord>chut</stopWord>
+ <stopWord>ci</stopWord>
+ <stopWord>clac</stopWord>
+ <stopWord>clic</stopWord>
+ <stopWord>comme</stopWord>
+ <stopWord>comment</stopWord>
+ <stopWord>compris</stopWord>
+ <stopWord>concernant</stopWord>
+ <stopWord>contre</stopWord>
+ <stopWord>couic</stopWord>
+ <stopWord>crac</stopWord>
+ <stopWord>d</stopWord>
+ <stopWord>da</stopWord>
+ <stopWord>dans</stopWord>
+ <stopWord>de</stopWord>
+ <stopWord>debout</stopWord>
+ <stopWord>dedans</stopWord>
+ <stopWord>dehors</stopWord>
+ <stopWord>delà</stopWord>
+ <stopWord>depuis</stopWord>
+ <stopWord>derrière</stopWord>
+ <stopWord>des</stopWord>
+ <stopWord>dès</stopWord>
+ <stopWord>désormais</stopWord>
+ <stopWord>desquelles</stopWord>
+ <stopWord>desquels</stopWord>
+ <stopWord>dessous</stopWord>
+ <stopWord>dessus</stopWord>
+ <stopWord>devant</stopWord>
+ <stopWord>devers</stopWord>
+ <stopWord>devra</stopWord>
+ <stopWord>dire</stopWord>
+ <stopWord>divers</stopWord>
+ <stopWord>diverse</stopWord>
+ <stopWord>diverses</stopWord>
+ <stopWord>doit</stopWord>
+ <stopWord>doivent</stopWord>
+ <stopWord>donc</stopWord>
+ <stopWord>dont</stopWord>
+ <stopWord>dring</stopWord>
+ <stopWord>du</stopWord>
+ <stopWord>duquel</stopWord>
+ <stopWord>durant</stopWord>
+ <stopWord>e</stopWord>
+ <stopWord>effet</stopWord>
+ <stopWord>eh</stopWord>
+ <stopWord>elle</stopWord>
+ <stopWord>elle-même</stopWord>
+ <stopWord>elles</stopWord>
+ <stopWord>elles-mêmes</stopWord>
+ <stopWord>en</stopWord>
+ <stopWord>entre</stopWord>
+ <stopWord>envers</stopWord>
+ <stopWord>environ</stopWord>
+ <stopWord>es</stopWord>
+ <stopWord>ès</stopWord>
+ <stopWord>est</stopWord>
+ <stopWord>et</stopWord>
+ <stopWord>etant</stopWord>
+ <stopWord>étaient</stopWord>
+ <stopWord>étais</stopWord>
+ <stopWord>était</stopWord>
+ <stopWord>étant</stopWord>
+ <stopWord>etc</stopWord>
+ <stopWord>été</stopWord>
+ <stopWord>etre</stopWord>
+ <stopWord>être</stopWord>
+ <stopWord>eu</stopWord>
+ <stopWord>euh</stopWord>
+ <stopWord>eux</stopWord>
+ <stopWord>eux-mêmes</stopWord>
+ <stopWord>excepté</stopWord>
+ <stopWord>f</stopWord>
+ <stopWord>façon</stopWord>
+ <stopWord>fais</stopWord>
+ <stopWord>faisaient</stopWord>
+ <stopWord>faisant</stopWord>
+ <stopWord>fait</stopWord>
+ <stopWord>feront</stopWord>
+ <stopWord>fi</stopWord>
+ <stopWord>flac</stopWord>
+ <stopWord>floc</stopWord>
+ <stopWord>font</stopWord>
+ <stopWord>g</stopWord>
+ <stopWord>gens</stopWord>
+ <stopWord>h</stopWord>
+ <stopWord>ha</stopWord>
+ <stopWord>hé</stopWord>
+ <stopWord>hein</stopWord>
+ <stopWord>hélas</stopWord>
+ <stopWord>hem</stopWord>
+ <stopWord>hep</stopWord>
+ <stopWord>hi</stopWord>
+ <stopWord>ho</stopWord>
+ <stopWord>holà</stopWord>
+ <stopWord>hop</stopWord>
+ <stopWord>hormis</stopWord>
+ <stopWord>hors</stopWord>
+ <stopWord>hou</stopWord>
+ <stopWord>houp</stopWord>
+ <stopWord>hue</stopWord>
+ <stopWord>hui</stopWord>
+ <stopWord>hum</stopWord>
+ <stopWord>hurrah</stopWord>
+ <stopWord>i</stopWord>
+ <stopWord>il</stopWord>
+ <stopWord>ils</stopWord>
+ <stopWord>importe</stopWord>
+ <stopWord>j</stopWord>
+ <stopWord>je</stopWord>
+ <stopWord>jusqu</stopWord>
+ <stopWord>jusque</stopWord>
+ <stopWord>k</stopWord>
+ <stopWord>l</stopWord>
+ <stopWord>la</stopWord>
+ <stopWord>là</stopWord>
+ <stopWord>laquelle</stopWord>
+ <stopWord>las</stopWord>
+ <stopWord>le</stopWord>
+ <stopWord>lequel</stopWord>
+ <stopWord>les</stopWord>
+ <stopWord>lès</stopWord>
+ <stopWord>lesquelles</stopWord>
+ <stopWord>lesquels</stopWord>
+ <stopWord>leur</stopWord>
+ <stopWord>leurs</stopWord>
+ <stopWord>longtemps</stopWord>
+ <stopWord>lorsque</stopWord>
+ <stopWord>lui</stopWord>
+ <stopWord>lui-même</stopWord>
+ <stopWord>m</stopWord>
+ <stopWord>ma</stopWord>
+ <stopWord>maint</stopWord>
+ <stopWord>mais</stopWord>
+ <stopWord>malgré</stopWord>
+ <stopWord>me</stopWord>
+ <stopWord>même</stopWord>
+ <stopWord>mêmes</stopWord>
+ <stopWord>merci</stopWord>
+ <stopWord>mes</stopWord>
+ <stopWord>mien</stopWord>
+ <stopWord>mienne</stopWord>
+ <stopWord>miennes</stopWord>
+ <stopWord>miens</stopWord>
+ <stopWord>mille</stopWord>
+ <stopWord>mince</stopWord>
+ <stopWord>moi</stopWord>
+ <stopWord>moi-même</stopWord>
+ <stopWord>moins</stopWord>
+ <stopWord>mon</stopWord>
+ <stopWord>moyennant</stopWord>
+ <stopWord>n</stopWord>
+ <stopWord>na</stopWord>
+ <stopWord>ne</stopWord>
+ <stopWord>néanmoins</stopWord>
+ <stopWord>ni</stopWord>
+ <stopWord>nombreuses</stopWord>
+ <stopWord>nombreux</stopWord>
+ <stopWord>non</stopWord>
+ <stopWord>nos</stopWord>
+ <stopWord>notre</stopWord>
+ <stopWord>nôtre</stopWord>
+ <stopWord>nôtres</stopWord>
+ <stopWord>nous</stopWord>
+ <stopWord>nous-mêmes</stopWord>
+ <stopWord>nul</stopWord>
+ <stopWord>o</stopWord>
+ <stopWord>o</stopWord>
+ <stopWord>ô</stopWord>
+ <stopWord>oh</stopWord>
+ <stopWord>ohé</stopWord>
+ <stopWord>olé</stopWord>
+ <stopWord>ollé</stopWord>
+ <stopWord>on</stopWord>
+ <stopWord>ont</stopWord>
+ <stopWord>ore</stopWord>
+ <stopWord>or</stopWord>
+ <stopWord>ou</stopWord>
+ <stopWord>où</stopWord>
+ <stopWord>ouf</stopWord>
+ <stopWord>ouais</stopWord>
+ <stopWord>oust</stopWord>
+ <stopWord>ouste</stopWord>
+ <stopWord>outre</stopWord>
+ <stopWord>p</stopWord>
+ <stopWord>paf</stopWord>
+ <stopWord>pan</stopWord>
+ <stopWord>par</stopWord>
+ <stopWord>parmi</stopWord>
+ <stopWord>partant</stopWord>
+ <stopWord>particulier</stopWord>
+ <stopWord>particulière</stopWord>
+ <stopWord>particulièrement</stopWord>
+ <stopWord>pas</stopWord>
+ <stopWord>passé</stopWord>
+ <stopWord>pendant</stopWord>
+ <stopWord>personne</stopWord>
+ <stopWord>peu</stopWord>
+ <stopWord>peut</stopWord>
+ <stopWord>peuvent</stopWord>
+ <stopWord>peux</stopWord>
+ <stopWord>pff</stopWord>
+ <stopWord>pfft</stopWord>
+ <stopWord>pfut</stopWord>
+ <stopWord>pif</stopWord>
+ <stopWord>plein</stopWord>
+ <stopWord>plouf</stopWord>
+ <stopWord>plus</stopWord>
+ <stopWord>plusieurs</stopWord>
+ <stopWord>plutôt</stopWord>
+ <stopWord>pouah</stopWord>
+ <stopWord>pour</stopWord>
+ <stopWord>pourquoi</stopWord>
+ <stopWord>près</stopWord>
+ <stopWord>proche</stopWord>
+ <stopWord>psitt</stopWord>
+ <stopWord>puisque</stopWord>
+ <stopWord>q</stopWord>
+ <stopWord>qu</stopWord>
+ <stopWord>quand</stopWord>
+ <stopWord>quant</stopWord>
+ <stopWord>quanta</stopWord>
+ <stopWord>quant-à-soi</stopWord>
+ <stopWord>que</stopWord>
+ <stopWord>quel</stopWord>
+ <stopWord>quelconque</stopWord>
+ <stopWord>quelle</stopWord>
+ <stopWord>quelles</stopWord>
+ <stopWord>quelque</stopWord>
+ <stopWord>quelques</stopWord>
+ <stopWord>quelqu'un</stopWord>
+ <stopWord>quels</stopWord>
+ <stopWord>qui</stopWord>
+ <stopWord>quiconque</stopWord>
+ <stopWord>quoi</stopWord>
+ <stopWord>quoique</stopWord>
+ <stopWord>r</stopWord>
+ <stopWord>revoici</stopWord>
+ <stopWord>revoilà</stopWord>
+ <stopWord>rien</stopWord>
+ <stopWord>s</stopWord>
+ <stopWord>sa</stopWord>
+ <stopWord>sacrebleu</stopWord>
+ <stopWord>sans</stopWord>
+ <stopWord>sapristi</stopWord>
+ <stopWord>sauf</stopWord>
+ <stopWord>se</stopWord>
+ <stopWord>selon</stopWord>
+ <stopWord>sept</stopWord>
+ <stopWord>sera</stopWord>
+ <stopWord>seront</stopWord>
+ <stopWord>ses</stopWord>
+ <stopWord>si</stopWord>
+ <stopWord>sien</stopWord>
+ <stopWord>sienne</stopWord>
+ <stopWord>siennes</stopWord>
+ <stopWord>siens</stopWord>
+ <stopWord>sinon</stopWord>
+ <stopWord>soi</stopWord>
+ <stopWord>soi-même</stopWord>
+ <stopWord>soit</stopWord>
+ <stopWord>sont</stopWord>
+ <stopWord>sous</stopWord>
+ <stopWord>stop</stopWord>
+ <stopWord>suis</stopWord>
+ <stopWord>suivant</stopWord>
+ <stopWord>sur</stopWord>
+ <stopWord>surtout</stopWord>
+ <stopWord>t</stopWord>
+ <stopWord>ta</stopWord>
+ <stopWord>tac</stopWord>
+ <stopWord>tant</stopWord>
+ <stopWord>te</stopWord>
+ <stopWord>té</stopWord>
+ <stopWord>tel</stopWord>
+ <stopWord>telle</stopWord>
+ <stopWord>tellement</stopWord>
+ <stopWord>telles</stopWord>
+ <stopWord>tels</stopWord>
+ <stopWord>tenant</stopWord>
+ <stopWord>tes</stopWord>
+ <stopWord>tic</stopWord>
+ <stopWord>tien</stopWord>
+ <stopWord>tienne</stopWord>
+ <stopWord>tiennes</stopWord>
+ <stopWord>tiens</stopWord>
+ <stopWord>toc</stopWord>
+ <stopWord>toi</stopWord>
+ <stopWord>toi-même</stopWord>
+ <stopWord>ton</stopWord>
+ <stopWord>touchant</stopWord>
+ <stopWord>toujours</stopWord>
+ <stopWord>tous</stopWord>
+ <stopWord>tout</stopWord>
+ <stopWord>toute</stopWord>
+ <stopWord>toutes</stopWord>
+ <stopWord>très</stopWord>
+ <stopWord>trois</stopWord>
+ <stopWord>trop</stopWord>
+ <stopWord>tsoin</stopWord>
+ <stopWord>tsouin</stopWord>
+ <stopWord>tu</stopWord>
+ <stopWord>u</stopWord>
+ <stopWord>un</stopWord>
+ <stopWord>une</stopWord>
+ <stopWord>unes</stopWord>
+ <stopWord>uns</stopWord>
+ <stopWord>v</stopWord>
+ <stopWord>va</stopWord>
+ <stopWord>vais</stopWord>
+ <stopWord>vas</stopWord>
+ <stopWord>vé</stopWord>
+ <stopWord>vers</stopWord>
+ <stopWord>via</stopWord>
+ <stopWord>vif</stopWord>
+ <stopWord>vifs</stopWord>
+ <stopWord>vivat</stopWord>
+ <stopWord>vive</stopWord>
+ <stopWord>vives</stopWord>
+ <stopWord>vlan</stopWord>
+ <stopWord>voici</stopWord>
+ <stopWord>voilà</stopWord>
+ <stopWord>vont</stopWord>
+ <stopWord>vos</stopWord>
+ <stopWord>votre</stopWord>
+ <stopWord>vôtre</stopWord>
+ <stopWord>vôtres</stopWord>
+ <stopWord>vous</stopWord>
+ <stopWord>vous-mêmes</stopWord>
+ <stopWord>vu</stopWord>
+ <stopWord>w</stopWord>
+ <stopWord>x</stopWord>
+ <stopWord>y</stopWord>
+ <stopWord>z</stopWord>
+ <stopWord>zut</stopWord>
+</stopWords>
+
+</french>
+
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/German_de.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/German_de.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/German_de.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/German_de.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,233 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>ab</stopword>
+ <stopword>aber</stopword>
+ <stopword>allein</stopword>
+ <stopword>als</stopword>
+ <stopword>also</stopword>
+ <stopword>am</stopword>
+ <stopword>an</stopword>
+ <stopword>auch</stopword>
+ <stopword>auf</stopword>
+ <stopword>aus</stopword>
+ <stopword>außer</stopword>
+ <stopword>bald</stopword>
+ <stopword>bei</stopword>
+ <stopword>beim</stopword>
+ <stopword>bin</stopword>
+ <stopword>bis</stopword>
+ <stopword>bist</stopword>
+ <stopword>bißchen</stopword>
+ <stopword>da</stopword>
+ <stopword>dabei</stopword>
+ <stopword>dadurch</stopword>
+ <stopword>dafür</stopword>
+ <stopword>dagegen</stopword>
+ <stopword>dahinter</stopword>
+ <stopword>damit</stopword>
+ <stopword>danach</stopword>
+ <stopword>daneben</stopword>
+ <stopword>dann</stopword>
+ <stopword>daran</stopword>
+ <stopword>darauf</stopword>
+ <stopword>daraus</stopword>
+ <stopword>darin</stopword>
+ <stopword>darum</stopword>
+ <stopword>darunter</stopword>
+ <stopword>darüber</stopword>
+ <stopword>das</stopword>
+ <stopword>dasselbe</stopword>
+ <stopword>davon</stopword>
+ <stopword>davor</stopword>
+ <stopword>dazu</stopword>
+ <stopword>dazwischen</stopword>
+ <stopword>daß</stopword>
+ <stopword>dein</stopword>
+ <stopword>deine</stopword>
+ <stopword>deinem</stopword>
+ <stopword>deinen</stopword>
+ <stopword>deiner</stopword>
+ <stopword>deines</stopword>
+ <stopword>dem</stopword>
+ <stopword>demselben</stopword>
+ <stopword>den</stopword>
+ <stopword>denn</stopword>
+ <stopword>der</stopword>
+ <stopword>derselben</stopword>
+ <stopword>des</stopword>
+ <stopword>desselben</stopword>
+ <stopword>dessen</stopword>
+ <stopword>dich</stopword>
+ <stopword>die</stopword>
+ <stopword>dies</stopword>
+ <stopword>diese</stopword>
+ <stopword>dieselbe</stopword>
+ <stopword>dieselben</stopword>
+ <stopword>diesem</stopword>
+ <stopword>diesen</stopword>
+ <stopword>dieser</stopword>
+ <stopword>dieses</stopword>
+ <stopword>dir</stopword>
+ <stopword>doch</stopword>
+ <stopword>dort</stopword>
+ <stopword>du</stopword>
+ <stopword>ebenso</stopword>
+ <stopword>ehe</stopword>
+ <stopword>ein</stopword>
+ <stopword>eine</stopword>
+ <stopword>einem</stopword>
+ <stopword>einen</stopword>
+ <stopword>einer</stopword>
+ <stopword>eines</stopword>
+ <stopword>entlang</stopword>
+ <stopword>er</stopword>
+ <stopword>es</stopword>
+ <stopword>etwa</stopword>
+ <stopword>etwas</stopword>
+ <stopword>euch</stopword>
+ <stopword>euer</stopword>
+ <stopword>eure</stopword>
+ <stopword>eurem</stopword>
+ <stopword>euren</stopword>
+ <stopword>eurer</stopword>
+ <stopword>eures</stopword>
+ <stopword>für</stopword>
+ <stopword>fürs</stopword>
+ <stopword>ganz</stopword>
+ <stopword>gar</stopword>
+ <stopword>gegen</stopword>
+ <stopword>genau</stopword>
+ <stopword>gewesen</stopword>
+ <stopword>her</stopword>
+ <stopword>herein</stopword>
+ <stopword>herum</stopword>
+ <stopword>hin</stopword>
+ <stopword>hinter</stopword>
+ <stopword>hintern</stopword>
+ <stopword>ich</stopword>
+ <stopword>ihm</stopword>
+ <stopword>ihn</stopword>
+ <stopword>ihnen</stopword>
+ <stopword>ihr</stopword>
+ <stopword>ihre</stopword>
+ <stopword>ihrem</stopword>
+ <stopword>ihren</stopword>
+ <stopword>ihrer</stopword>
+ <stopword>ihres</stopword>
+ <stopword>im</stopword>
+ <stopword>in</stopword>
+ <stopword>ist</stopword>
+ <stopword>ja</stopword>
+ <stopword>je</stopword>
+ <stopword>jedesmal</stopword>
+ <stopword>jedoch</stopword>
+ <stopword>jene</stopword>
+ <stopword>jenem</stopword>
+ <stopword>jenen</stopword>
+ <stopword>jener</stopword>
+ <stopword>jenes</stopword>
+ <stopword>kaum</stopword>
+ <stopword>kein</stopword>
+ <stopword>keine</stopword>
+ <stopword>keinem</stopword>
+ <stopword>keinen</stopword>
+ <stopword>keiner</stopword>
+ <stopword>keines</stopword>
+ <stopword>man</stopword>
+ <stopword>mehr</stopword>
+ <stopword>mein</stopword>
+ <stopword>meine</stopword>
+ <stopword>meinem</stopword>
+ <stopword>meinen</stopword>
+ <stopword>meiner</stopword>
+ <stopword>meines</stopword>
+ <stopword>mich</stopword>
+ <stopword>mir</stopword>
+ <stopword>mit</stopword>
+ <stopword>nach</stopword>
+ <stopword>nachdem</stopword>
+ <stopword>neben</stopword>
+ <stopword>nein</stopword>
+ <stopword>nicht</stopword>
+ <stopword>nichts</stopword>
+ <stopword>noch</stopword>
+ <stopword>nun</stopword>
+ <stopword>nur</stopword>
+ <stopword>nämlich</stopword>
+ <stopword>ob</stopword>
+ <stopword>ober</stopword>
+ <stopword>obgleich</stopword>
+ <stopword>oder</stopword>
+ <stopword>ohne</stopword>
+ <stopword>paar</stopword>
+ <stopword>sehr</stopword>
+ <stopword>sei</stopword>
+ <stopword>sein</stopword>
+ <stopword>seine</stopword>
+ <stopword>seinem</stopword>
+ <stopword>seinen</stopword>
+ <stopword>seiner</stopword>
+ <stopword>seines</stopword>
+ <stopword>seit</stopword>
+ <stopword>seitdem</stopword>
+ <stopword>selbst</stopword>
+ <stopword>sich</stopword>
+ <stopword>sie</stopword>
+ <stopword>sind</stopword>
+ <stopword>so</stopword>
+ <stopword>sogar</stopword>
+ <stopword>solch</stopword>
+ <stopword>solche</stopword>
+ <stopword>solchem</stopword>
+ <stopword>solchen</stopword>
+ <stopword>solcher</stopword>
+ <stopword>solches</stopword>
+ <stopword>sondern</stopword>
+ <stopword>sonst</stopword>
+ <stopword>soviel</stopword>
+ <stopword>soweit</stopword>
+ <stopword>um</stopword>
+ <stopword>und</stopword>
+ <stopword>uns</stopword>
+ <stopword>unser</stopword>
+ <stopword>unsre</stopword>
+ <stopword>unsrem</stopword>
+ <stopword>unsren</stopword>
+ <stopword>unsrer</stopword>
+ <stopword>unsres</stopword>
+ <stopword>vom</stopword>
+ <stopword>von</stopword>
+ <stopword>vor</stopword>
+ <stopword>war</stopword>
+ <stopword>warum</stopword>
+ <stopword>was</stopword>
+ <stopword>wegen</stopword>
+ <stopword>weil</stopword>
+ <stopword>weit</stopword>
+ <stopword>welche</stopword>
+ <stopword>welchem</stopword>
+ <stopword>welchen</stopword>
+ <stopword>welcher</stopword>
+ <stopword>welches</stopword>
+ <stopword>wem</stopword>
+ <stopword>wen</stopword>
+ <stopword>wenn</stopword>
+ <stopword>wer</stopword>
+ <stopword>weshalb</stopword>
+ <stopword>wessen</stopword>
+ <stopword>wie</stopword>
+ <stopword>wir</stopword>
+ <stopword>wo</stopword>
+ <stopword>womit</stopword>
+ <stopword>während</stopword>
+ <stopword>wäre</stopword>
+ <stopword>wären</stopword>
+ <stopword>zu</stopword>
+ <stopword>zum</stopword>
+ <stopword>zur</stopword>
+ <stopword>zwar</stopword>
+ <stopword>zwischen</stopword>
+ <stopword>zwischens</stopword>
+ <stopword>über</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Italian_it.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Italian_it.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Italian_it.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Italian_it.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,136 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>a</stopword>
+ <stopword>affinchè</stopword>
+ <stopword>agl'</stopword>
+ <stopword>agli</stopword>
+ <stopword>ai</stopword>
+ <stopword>al</stopword>
+ <stopword>all'</stopword>
+ <stopword>alla</stopword>
+ <stopword>alle</stopword>
+ <stopword>allo</stopword>
+ <stopword>anche</stopword>
+ <stopword>anzichè</stopword>
+ <stopword>avere</stopword>
+ <stopword>bensì</stopword>
+ <stopword>che</stopword>
+ <stopword>chi</stopword>
+ <stopword>cioè</stopword>
+ <stopword>come</stopword>
+ <stopword>comunque</stopword>
+ <stopword>con</stopword>
+ <stopword>contro</stopword>
+ <stopword>cosa</stopword>
+ <stopword>da</stopword>
+ <stopword>dachè</stopword>
+ <stopword>dagl'</stopword>
+ <stopword>dagli</stopword>
+ <stopword>dai</stopword>
+ <stopword>dal</stopword>
+ <stopword>dall'</stopword>
+ <stopword>dalla</stopword>
+ <stopword>dalle</stopword>
+ <stopword>dallo</stopword>
+ <stopword>degl'</stopword>
+ <stopword>degli</stopword>
+ <stopword>dei</stopword>
+ <stopword>del</stopword>
+ <stopword>dell'</stopword>
+ <stopword>delle</stopword>
+ <stopword>dello</stopword>
+ <stopword>di</stopword>
+ <stopword>dopo</stopword>
+ <stopword>dove</stopword>
+ <stopword>dunque</stopword>
+ <stopword>durante</stopword>
+ <stopword>e</stopword>
+ <stopword>egli</stopword>
+ <stopword>eppure</stopword>
+ <stopword>essere</stopword>
+ <stopword>essi</stopword>
+ <stopword>finché</stopword>
+ <stopword>fino</stopword>
+ <stopword>fra</stopword>
+ <stopword>giacchè</stopword>
+ <stopword>gl'</stopword>
+ <stopword>gli</stopword>
+ <stopword>grazie</stopword>
+ <stopword>i</stopword>
+ <stopword>il</stopword>
+ <stopword>in</stopword>
+ <stopword>inoltre</stopword>
+ <stopword>io</stopword>
+ <stopword>l'</stopword>
+ <stopword>la</stopword>
+ <stopword>le</stopword>
+ <stopword>lo</stopword>
+ <stopword>loro</stopword>
+ <stopword>ma</stopword>
+ <stopword>mentre</stopword>
+ <stopword>mio</stopword>
+ <stopword>ne</stopword>
+ <stopword>neanche</stopword>
+ <stopword>negl'</stopword>
+ <stopword>negli</stopword>
+ <stopword>nei</stopword>
+ <stopword>nel</stopword>
+ <stopword>nell'</stopword>
+ <stopword>nella</stopword>
+ <stopword>nelle</stopword>
+ <stopword>nello</stopword>
+ <stopword>nemmeno</stopword>
+ <stopword>neppure</stopword>
+ <stopword>noi</stopword>
+ <stopword>nonchè</stopword>
+ <stopword>nondimeno</stopword>
+ <stopword>nostro</stopword>
+ <stopword>o</stopword>
+ <stopword>onde</stopword>
+ <stopword>oppure</stopword>
+ <stopword>ossia</stopword>
+ <stopword>ovvero</stopword>
+ <stopword>per</stopword>
+ <stopword>perchè</stopword>
+ <stopword>perciò</stopword>
+ <stopword>però</stopword>
+ <stopword>poichè</stopword>
+ <stopword>prima</stopword>
+ <stopword>purchè</stopword>
+ <stopword>quand'</stopword>
+ <stopword>quando</stopword>
+ <stopword>quantunque</stopword>
+ <stopword>quasi</stopword>
+ <stopword>quindi</stopword>
+ <stopword>se</stopword>
+ <stopword>sebbene</stopword>
+ <stopword>sennonchè</stopword>
+ <stopword>senza</stopword>
+ <stopword>seppure</stopword>
+ <stopword>si</stopword>
+ <stopword>siccome</stopword>
+ <stopword>sopra</stopword>
+ <stopword>sotto</stopword>
+ <stopword>su</stopword>
+ <stopword>subito</stopword>
+ <stopword>sugl'</stopword>
+ <stopword>sugli</stopword>
+ <stopword>sui</stopword>
+ <stopword>sul</stopword>
+ <stopword>sull'</stopword>
+ <stopword>sulla</stopword>
+ <stopword>sulle</stopword>
+ <stopword>sullo</stopword>
+ <stopword>suo</stopword>
+ <stopword>talchè</stopword>
+ <stopword>tu</stopword>
+ <stopword>tuo</stopword>
+ <stopword>tuttavia</stopword>
+ <stopword>tutti</stopword>
+ <stopword>un</stopword>
+ <stopword>una</stopword>
+ <stopword>uno</stopword>
+ <stopword>voi</stopword>
+ <stopword>vostro</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Norwegian_no.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Norwegian_no.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Norwegian_no.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Norwegian_no.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,123 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>alle</stopword>
+ <stopword>andre</stopword>
+ <stopword>arbeid</stopword>
+ <stopword>av</stopword>
+ <stopword>begge</stopword>
+ <stopword>bort</stopword>
+ <stopword>bra</stopword>
+ <stopword>bruke</stopword>
+ <stopword>da</stopword>
+ <stopword>denne</stopword>
+ <stopword>der</stopword>
+ <stopword>deres</stopword>
+ <stopword>det</stopword>
+ <stopword>din</stopword>
+ <stopword>disse</stopword>
+ <stopword>du</stopword>
+ <stopword>eller</stopword>
+ <stopword>en</stopword>
+ <stopword>ene</stopword>
+ <stopword>eneste</stopword>
+ <stopword>enhver</stopword>
+ <stopword>enn</stopword>
+ <stopword>er</stopword>
+ <stopword>et</stopword>
+ <stopword>folk</stopword>
+ <stopword>for</stopword>
+ <stopword>fordi</stopword>
+ <stopword>forsøke</stopword>
+ <stopword>fra</stopword>
+ <stopword>få</stopword>
+ <stopword>før</stopword>
+ <stopword>først</stopword>
+ <stopword>gjorde</stopword>
+ <stopword>gjøre</stopword>
+ <stopword>god</stopword>
+ <stopword>gå</stopword>
+ <stopword>ha</stopword>
+ <stopword>hadde</stopword>
+ <stopword>han</stopword>
+ <stopword>hans</stopword>
+ <stopword>hennes</stopword>
+ <stopword>her</stopword>
+ <stopword>hva</stopword>
+ <stopword>hvem</stopword>
+ <stopword>hver</stopword>
+ <stopword>hvilken</stopword>
+ <stopword>hvis</stopword>
+ <stopword>hvor</stopword>
+ <stopword>hvordan</stopword>
+ <stopword>hvorfor</stopword>
+ <stopword>i</stopword>
+ <stopword>ikke</stopword>
+ <stopword>inn</stopword>
+ <stopword>innen</stopword>
+ <stopword>kan</stopword>
+ <stopword>kunne</stopword>
+ <stopword>lage</stopword>
+ <stopword>lang</stopword>
+ <stopword>lik</stopword>
+ <stopword>like</stopword>
+ <stopword>makt</stopword>
+ <stopword>mange</stopword>
+ <stopword>med</stopword>
+ <stopword>meg</stopword>
+ <stopword>meget</stopword>
+ <stopword>men</stopword>
+ <stopword>mens</stopword>
+ <stopword>mer</stopword>
+ <stopword>mest</stopword>
+ <stopword>min</stopword>
+ <stopword>mye</stopword>
+ <stopword>må</stopword>
+ <stopword>måte</stopword>
+ <stopword>navn</stopword>
+ <stopword>nei</stopword>
+ <stopword>ny</stopword>
+ <stopword>nå</stopword>
+ <stopword>når</stopword>
+ <stopword>og</stopword>
+ <stopword>også</stopword>
+ <stopword>om</stopword>
+ <stopword>opp</stopword>
+ <stopword>oss</stopword>
+ <stopword>over</stopword>
+ <stopword>part</stopword>
+ <stopword>punkt</stopword>
+ <stopword>på</stopword>
+ <stopword>rett</stopword>
+ <stopword>riktig</stopword>
+ <stopword>samme</stopword>
+ <stopword>sant</stopword>
+ <stopword>si</stopword>
+ <stopword>siden</stopword>
+ <stopword>sist</stopword>
+ <stopword>skulle</stopword>
+ <stopword>slik</stopword>
+ <stopword>slutt</stopword>
+ <stopword>som</stopword>
+ <stopword>start</stopword>
+ <stopword>stille</stopword>
+ <stopword>så</stopword>
+ <stopword>tid</stopword>
+ <stopword>til</stopword>
+ <stopword>tilbake</stopword>
+ <stopword>tilstand</stopword>
+ <stopword>under</stopword>
+ <stopword>ut</stopword>
+ <stopword>uten</stopword>
+ <stopword>var</stopword>
+ <stopword>ved</stopword>
+ <stopword>verdi</stopword>
+ <stopword>vi</stopword>
+ <stopword>vil</stopword>
+ <stopword>ville</stopword>
+ <stopword>vite</stopword>
+ <stopword>vår</stopword>
+ <stopword>være</stopword>
+ <stopword>vært</stopword>
+ <stopword>å</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Polish_pl.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Polish_pl.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Polish_pl.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Polish_pl.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,114 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+<stopword>i</stopword>
+<stopword>w</stopword>
+<stopword>z</stopword>
+<stopword>o</stopword>
+<stopword>na</stopword>
+<stopword>do</stopword>
+<stopword>a</stopword>
+<stopword>jest</stopword>
+<stopword>od</stopword>
+<stopword>przez</stopword>
+<stopword>to</stopword>
+<stopword>po</stopword>
+<stopword>się</stopword>
+<stopword>dla</stopword>
+<stopword>nie</stopword>
+<stopword>oraz</stopword>
+<stopword>jak</stopword>
+<stopword>za</stopword>
+<stopword>ze</stopword>
+<stopword>tym</stopword>
+<stopword>co</stopword>
+<stopword>przy</stopword>
+<stopword>tego</stopword>
+<stopword>ich</stopword>
+<stopword>ale</stopword>
+<stopword>tylko</stopword>
+<stopword>pod</stopword>
+<stopword>są</stopword>
+<stopword>jego</stopword>
+<stopword>jako</stopword>
+<stopword>czy</stopword>
+<stopword>że</stopword>
+<stopword>tak</stopword>
+<stopword>ma</stopword>
+<stopword>tej</stopword>
+<stopword>lub</stopword>
+<stopword>także</stopword>
+<stopword>jednak</stopword>
+<stopword>ten</stopword>
+<stopword>jej</stopword>
+<stopword>u</stopword>
+<stopword>już</stopword>
+<stopword>nad</stopword>
+<stopword>tych</stopword>
+<stopword>które</stopword>
+<stopword>te</stopword>
+<stopword>jeszcze</stopword>
+<stopword>bardzo</stopword>
+<stopword>może</stopword>
+<stopword>bez</stopword>
+<stopword>innych</stopword>
+<stopword>im</stopword>
+<stopword>przed</stopword>
+<stopword>wszystkich</stopword>
+<stopword>we</stopword>
+<stopword>można</stopword>
+<stopword>których</stopword>
+<stopword>wszystkim</stopword>
+<stopword>również</stopword>
+<stopword>który</stopword>
+<stopword>nawet</stopword>
+<stopword>też</stopword>
+<stopword>sobie</stopword>
+<stopword>tu</stopword>
+<stopword>nich</stopword>
+<stopword>było</stopword>
+<stopword>był</stopword>
+<stopword>będzie</stopword>
+<stopword>wielu</stopword>
+<stopword>go</stopword>
+<stopword>gdy</stopword>
+<stopword>wiele</stopword>
+<stopword>ta</stopword>
+<stopword>nas</stopword>
+<stopword>aby</stopword>
+<stopword>gdzie</stopword>
+<stopword>bo</stopword>
+<stopword>więc</stopword>
+<stopword>tam</stopword>
+<stopword>którzy</stopword>
+<stopword>która</stopword>
+<stopword>kilka</stopword>
+<stopword>między</stopword>
+<stopword>naszego</stopword>
+<stopword>była</stopword>
+<stopword>bardziej</stopword>
+<stopword>przede</stopword>
+<stopword>nam</stopword>
+<stopword>wszystko</stopword>
+<stopword>swoje</stopword>
+<stopword>której</stopword>
+<stopword>niż</stopword>
+<stopword>czyli</stopword>
+<stopword>zawsze</stopword>
+<stopword>którym</stopword>
+<stopword>takie</stopword>
+<stopword>bowiem</stopword>
+<stopword>nim</stopword>
+<stopword>poza</stopword>
+<stopword>właśnie</stopword>
+<stopword>iż</stopword>
+<stopword>były</stopword>
+<stopword>kiedy</stopword>
+<stopword>mogą</stopword>
+<stopword>mi</stopword>
+<stopword>którego</stopword>
+<stopword>mnie</stopword>
+<stopword>dlatego</stopword>
+<stopword>naszych</stopword>
+<stopword>jeśli</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Portuguese_pt.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Portuguese_pt.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Portuguese_pt.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Portuguese_pt.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,66 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>a</stopword>
+ <stopword>abaixo</stopword>
+ <stopword>adiante</stopword>
+ <stopword>agora</stopword>
+ <stopword>ali</stopword>
+ <stopword>antes</stopword>
+ <stopword>aqui</stopword>
+ <stopword>atras</stopword>
+ <stopword>até</stopword>
+ <stopword>bastante</stopword>
+ <stopword>bem</stopword>
+ <stopword>com</stopword>
+ <stopword>como</stopword>
+ <stopword>contra</stopword>
+ <stopword>debaixo</stopword>
+ <stopword>demais</stopword>
+ <stopword>depois</stopword>
+ <stopword>depressa</stopword>
+ <stopword>devagar</stopword>
+ <stopword>direito</stopword>
+ <stopword>e</stopword>
+ <stopword>ela</stopword>
+ <stopword>elas</stopword>
+ <stopword>eles</stopword>
+ <stopword>em</stopword>
+ <stopword>entre</stopword>
+ <stopword>eu</stopword>
+ <stopword>fora</stopword>
+ <stopword>junto</stopword>
+ <stopword>longe</stopword>
+ <stopword>mais</stopword>
+ <stopword>menos</stopword>
+ <stopword>muito</stopword>
+ <stopword>ninguem</stopword>
+ <stopword>nunca</stopword>
+ <stopword>não</stopword>
+ <stopword>nós</stopword>
+ <stopword>onde</stopword>
+ <stopword>ou</stopword>
+ <stopword>para</stopword>
+ <stopword>por</stopword>
+ <stopword>porque</stopword>
+ <stopword>pouco</stopword>
+ <stopword>próximo</stopword>
+ <stopword>qual</stopword>
+ <stopword>quando</stopword>
+ <stopword>quanto</stopword>
+ <stopword>que</stopword>
+ <stopword>quem</stopword>
+ <stopword>se</stopword>
+ <stopword>sem</stopword>
+ <stopword>sempre</stopword>
+ <stopword>sim</stopword>
+ <stopword>sob</stopword>
+ <stopword>sobre</stopword>
+ <stopword>talvez</stopword>
+ <stopword>todas</stopword>
+ <stopword>todos</stopword>
+ <stopword>vagarosamente</stopword>
+ <stopword>você</stopword>
+ <stopword>vocês</stopword>
+ <stopword>êle</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,101 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<stopwords>
+<stopword>а</stopword>
+<stopword>без</stopword>
+<stopword>более</stopword>
+<stopword>бы</stopword>
+<stopword>был</stopword>
+<stopword>была</stopword>
+<stopword>были</stopword>
+<stopword>было</stopword>
+<stopword>быть</stopword>
+<stopword>в</stopword>
+<stopword>вам</stopword>
+<stopword>вас</stopword>
+<stopword>весь</stopword>
+<stopword>во</stopword>
+<stopword>вот</stopword>
+<stopword>все</stopword>
+<stopword>всего</stopword>
+<stopword>всех</stopword>
+<stopword>вы</stopword>
+<stopword>где</stopword>
+<stopword>да</stopword>
+<stopword>даже</stopword>
+<stopword>для</stopword>
+<stopword>до</stopword>
+<stopword>его</stopword>
+<stopword>ее</stopword>
+<stopword>если</stopword>
+<stopword>есть</stopword>
+<stopword>еще</stopword>
+<stopword>же</stopword>
+<stopword>за</stopword>
+<stopword>здесь</stopword>
+<stopword>и</stopword>
+<stopword>из</stopword>
+<stopword>или</stopword>
+<stopword>им</stopword>
+<stopword>их</stopword>
+<stopword>к</stopword>
+<stopword>как</stopword>
+<stopword>ко</stopword>
+<stopword>когда</stopword>
+<stopword>кто</stopword>
+<stopword>ли</stopword>
+<stopword>либо</stopword>
+<stopword>мне</stopword>
+<stopword>может</stopword>
+<stopword>мы</stopword>
+<stopword>на</stopword>
+<stopword>надо</stopword>
+<stopword>наш</stopword>
+<stopword>не</stopword>
+<stopword>него</stopword>
+<stopword>нее</stopword>
+<stopword>нет</stopword>
+<stopword>ни</stopword>
+<stopword>них</stopword>
+<stopword>но</stopword>
+<stopword>ну</stopword>
+<stopword>о</stopword>
+<stopword>об</stopword>
+<stopword>однако</stopword>
+<stopword>он</stopword>
+<stopword>она</stopword>
+<stopword>они</stopword>
+<stopword>оно</stopword>
+<stopword>от</stopword>
+<stopword>очень</stopword>
+<stopword>по</stopword>
+<stopword>под</stopword>
+<stopword>при</stopword>
+<stopword>с</stopword>
+<stopword>со</stopword>
+<stopword>так</stopword>
+<stopword>также</stopword>
+<stopword>такой</stopword>
+<stopword>там</stopword>
+<stopword>те</stopword>
+<stopword>тем</stopword>
+<stopword>то</stopword>
+<stopword>того</stopword>
+<stopword>тоже</stopword>
+<stopword>той</stopword>
+<stopword>только</stopword>
+<stopword>том</stopword>
+<stopword>ты</stopword>
+<stopword>у</stopword>
+<stopword>уже</stopword>
+<stopword>хотя</stopword>
+<stopword>чего</stopword>
+<stopword>чей</stopword>
+<stopword>чем</stopword>
+<stopword>что</stopword>
+<stopword>чтобы</stopword>
+<stopword>чье</stopword>
+<stopword>чья</stopword>
+<stopword>эта</stopword>
+<stopword>эти</stopword>
+<stopword>это</stopword>
+<stopword>я</stopword></stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Spanish_es.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Spanish_es.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Spanish_es.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Spanish_es.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,184 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>a</stopword>
+ <stopword>acá</stopword>
+ <stopword>ahí</stopword>
+ <stopword>ajena</stopword>
+ <stopword>ajenas</stopword>
+ <stopword>ajeno</stopword>
+ <stopword>ajenos</stopword>
+ <stopword>al</stopword>
+ <stopword>algo</stopword>
+ <stopword>alguna</stopword>
+ <stopword>algunas</stopword>
+ <stopword>alguno</stopword>
+ <stopword>algunos</stopword>
+ <stopword>algún</stopword>
+ <stopword>allá</stopword>
+ <stopword>allí</stopword>
+ <stopword>aquel</stopword>
+ <stopword>aquella</stopword>
+ <stopword>aquellas</stopword>
+ <stopword>aquello</stopword>
+ <stopword>aquellos</stopword>
+ <stopword>aquí</stopword>
+ <stopword>cada</stopword>
+ <stopword>cierta</stopword>
+ <stopword>ciertas</stopword>
+ <stopword>cierto</stopword>
+ <stopword>ciertos</stopword>
+ <stopword>como</stopword>
+ <stopword>con</stopword>
+ <stopword>conmigo</stopword>
+ <stopword>consigo</stopword>
+ <stopword>contigo</stopword>
+ <stopword>cualquier</stopword>
+ <stopword>cualquiera</stopword>
+ <stopword>cualquieras</stopword>
+ <stopword>cuan</stopword>
+ <stopword>cuanta</stopword>
+ <stopword>cuantas</stopword>
+ <stopword>cuanto</stopword>
+ <stopword>cuantos</stopword>
+ <stopword>cuán</stopword>
+ <stopword>cuánta</stopword>
+ <stopword>cuántas</stopword>
+ <stopword>cuánto</stopword>
+ <stopword>cuántos</stopword>
+ <stopword>cómo</stopword>
+ <stopword>de</stopword>
+ <stopword>dejar</stopword>
+ <stopword>del</stopword>
+ <stopword>demasiada</stopword>
+ <stopword>demasiadas</stopword>
+ <stopword>demasiado</stopword>
+ <stopword>demasiados</stopword>
+ <stopword>demás</stopword>
+ <stopword>el</stopword>
+ <stopword>ella</stopword>
+ <stopword>ellas</stopword>
+ <stopword>ellos</stopword>
+ <stopword>esa</stopword>
+ <stopword>esas</stopword>
+ <stopword>ese</stopword>
+ <stopword>esos</stopword>
+ <stopword>esta</stopword>
+ <stopword>estar</stopword>
+ <stopword>estas</stopword>
+ <stopword>este</stopword>
+ <stopword>estos</stopword>
+ <stopword>hacer</stopword>
+ <stopword>hasta</stopword>
+ <stopword>jamás</stopword>
+ <stopword>junto</stopword>
+ <stopword>juntos</stopword>
+ <stopword>la</stopword>
+ <stopword>las</stopword>
+ <stopword>lo</stopword>
+ <stopword>los</stopword>
+ <stopword>mas</stopword>
+ <stopword>me</stopword>
+ <stopword>menos</stopword>
+ <stopword>mientras</stopword>
+ <stopword>misma</stopword>
+ <stopword>mismas</stopword>
+ <stopword>mismo</stopword>
+ <stopword>mismos</stopword>
+ <stopword>mucha</stopword>
+ <stopword>muchas</stopword>
+ <stopword>mucho</stopword>
+ <stopword>muchos</stopword>
+ <stopword>muchísima</stopword>
+ <stopword>muchísimas</stopword>
+ <stopword>muchísimo</stopword>
+ <stopword>muchísimos</stopword>
+ <stopword>muy</stopword>
+ <stopword>más</stopword>
+ <stopword>mía</stopword>
+ <stopword>mío</stopword>
+ <stopword>nada</stopword>
+ <stopword>ni</stopword>
+ <stopword>ninguna</stopword>
+ <stopword>ningunas</stopword>
+ <stopword>ninguno</stopword>
+ <stopword>ningunos</stopword>
+ <stopword>no</stopword>
+ <stopword>nos</stopword>
+ <stopword>nosotras</stopword>
+ <stopword>nosotros</stopword>
+ <stopword>nuestra</stopword>
+ <stopword>nuestras</stopword>
+ <stopword>nuestro</stopword>
+ <stopword>nuestros</stopword>
+ <stopword>nunca</stopword>
+ <stopword>os</stopword>
+ <stopword>otra</stopword>
+ <stopword>otras</stopword>
+ <stopword>otro</stopword>
+ <stopword>otros</stopword>
+ <stopword>para</stopword>
+ <stopword>parecer</stopword>
+ <stopword>poca</stopword>
+ <stopword>pocas</stopword>
+ <stopword>poco</stopword>
+ <stopword>pocos</stopword>
+ <stopword>por</stopword>
+ <stopword>porque</stopword>
+ <stopword>que</stopword>
+ <stopword>querer</stopword>
+ <stopword>quien</stopword>
+ <stopword>quienes</stopword>
+ <stopword>quienesquiera</stopword>
+ <stopword>quienquiera</stopword>
+ <stopword>quién</stopword>
+ <stopword>qué</stopword>
+ <stopword>ser</stopword>
+ <stopword>si</stopword>
+ <stopword>siempre</stopword>
+ <stopword>sr</stopword>
+ <stopword>sra</stopword>
+ <stopword>sres</stopword>
+ <stopword>sta</stopword>
+ <stopword>suya</stopword>
+ <stopword>suyas</stopword>
+ <stopword>suyo</stopword>
+ <stopword>suyos</stopword>
+ <stopword>sí</stopword>
+ <stopword>sín</stopword>
+ <stopword>tal</stopword>
+ <stopword>tales</stopword>
+ <stopword>tan</stopword>
+ <stopword>tanta</stopword>
+ <stopword>tantas</stopword>
+ <stopword>tanto</stopword>
+ <stopword>tantos</stopword>
+ <stopword>te</stopword>
+ <stopword>tener</stopword>
+ <stopword>ti</stopword>
+ <stopword>toda</stopword>
+ <stopword>todas</stopword>
+ <stopword>todo</stopword>
+ <stopword>todos</stopword>
+ <stopword>tomar</stopword>
+ <stopword>tuya</stopword>
+ <stopword>tuyo</stopword>
+ <stopword>tú</stopword>
+ <stopword>un</stopword>
+ <stopword>una</stopword>
+ <stopword>unas</stopword>
+ <stopword>unos</stopword>
+ <stopword>usted</stopword>
+ <stopword>ustedes</stopword>
+ <stopword>varias</stopword>
+ <stopword>varios</stopword>
+ <stopword>vosotras</stopword>
+ <stopword>vosotros</stopword>
+ <stopword>vuestra</stopword>
+ <stopword>vuestras</stopword>
+ <stopword>vuestro</stopword>
+ <stopword>vuestros</stopword>
+ <stopword>y</stopword>
+ <stopword>yo</stopword>
+ <stopword>él</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Swedish_sv.xml
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Swedish_sv.xml?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Swedish_sv.xml (added)
+++ lenya/trunk/src/webapp/WEB-INF/analyzer/stopword/Swedish_sv.xml Wed Nov 16 07:24:44 2005
@@ -0,0 +1,108 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>ab</stopword>
+ <stopword>aldrig</stopword>
+ <stopword>all</stopword>
+ <stopword>alla</stopword>
+ <stopword>alltid</stopword>
+ <stopword>att</stopword>
+ <stopword>av</stopword>
+ <stopword>avser</stopword>
+ <stopword>avses</stopword>
+ <stopword>bakom</stopword>
+ <stopword>bra</stopword>
+ <stopword>bredvid</stopword>
+ <stopword>de</stopword>
+ <stopword>dem</stopword>
+ <stopword>den</stopword>
+ <stopword>denna</stopword>
+ <stopword>deras</stopword>
+ <stopword>dess</stopword>
+ <stopword>det</stopword>
+ <stopword>detta</stopword>
+ <stopword>du</stopword>
+ <stopword>dä</stopword>
+ <stopword>där</stopword>
+ <stopword>efter</stopword>
+ <stopword>eftersom</stopword>
+ <stopword>efterät</stopword>
+ <stopword>ej</stopword>
+ <stopword>eller</stopword>
+ <stopword>emot</stopword>
+ <stopword>en</stopword>
+ <stopword>ett</stopword>
+ <stopword>fastän</stopword>
+ <stopword>fort</stopword>
+ <stopword>framför</stopword>
+ <stopword>från</stopword>
+ <stopword>för</stopword>
+ <stopword>genom</stopword>
+ <stopword>gott</stopword>
+ <stopword>hamske</stopword>
+ <stopword>han</stopword>
+ <stopword>hellre</stopword>
+ <stopword>hon</stopword>
+ <stopword>hos</stopword>
+ <stopword>hur</stopword>
+ <stopword>här</stopword>
+ <stopword>i</stopword>
+ <stopword>in</stopword>
+ <stopword>ingen</stopword>
+ <stopword>innan</stopword>
+ <stopword>inte</stopword>
+ <stopword>ja</stopword>
+ <stopword>jag</stopword>
+ <stopword>lite</stopword>
+ <stopword>långsamt</stopword>
+ <stopword>långt</stopword>
+ <stopword>man</stopword>
+ <stopword>med</stopword>
+ <stopword>medan</stopword>
+ <stopword>mellan</stopword>
+ <stopword>mer</stopword>
+ <stopword>mera</stopword>
+ <stopword>mindre</stopword>
+ <stopword>mot</stopword>
+ <stopword>myckett</stopword>
+ <stopword>nej</stopword>
+ <stopword>nere</stopword>
+ <stopword>ni</stopword>
+ <stopword>nu</stopword>
+ <stopword>när</stopword>
+ <stopword>nära</stopword>
+ <stopword>och</stopword>
+ <stopword>oksa</stopword>
+ <stopword>om</stopword>
+ <stopword>på</stopword>
+ <stopword>sin</stopword>
+ <stopword>skall</stopword>
+ <stopword>som</stopword>
+ <stopword>så</stopword>
+ <stopword>sådan</stopword>
+ <stopword>till</stopword>
+ <stopword>tillräckligt</stopword>
+ <stopword>tillsammans</stopword>
+ <stopword>trots</stopword>
+ <stopword>under</stopword>
+ <stopword>uppe</stopword>
+ <stopword>ut</stopword>
+ <stopword>utan</stopword>
+ <stopword>utom</stopword>
+ <stopword>vad</stopword>
+ <stopword>var</stopword>
+ <stopword>varför</stopword>
+ <stopword>vart</stopword>
+ <stopword>varthän</stopword>
+ <stopword>vem</stopword>
+ <stopword>vems</stopword>
+ <stopword>vi</stopword>
+ <stopword>vid</stopword>
+ <stopword>vilken</stopword>
+ <stopword>väl</stopword>
+ <stopword>än</stopword>
+ <stopword>ännu</stopword>
+ <stopword>är</stopword>
+ <stopword>ånyo</stopword>
+ <stopword>över</stopword>
+</stopwords>
Added: lenya/trunk/src/webapp/WEB-INF/xconf/lucene2.xconf
URL: http://svn.apache.org/viewcvs/lenya/trunk/src/webapp/WEB-INF/xconf/lucene2.xconf?rev=345035&view=auto
==============================================================================
--- lenya/trunk/src/webapp/WEB-INF/xconf/lucene2.xconf (added)
+++ lenya/trunk/src/webapp/WEB-INF/xconf/lucene2.xconf Wed Nov 16 07:24:44 2005
@@ -0,0 +1,92 @@
+<?xml version="1.0"?>
+<!--
+ Copyright 1999-2005 The Apache Software Foundation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+<components>
+ <!-- Include dependencies -->
+ <include src="context://WEB-INF/xconf/cocoon-xsp.xconf"/>
+
+ <!-- Include roles -->
+ <include src="resource://org/apache/cocoon/components/search/lucene2.roles"/>
+
+ <!-- Search:
+ These are the components that handle the search.
+ analyzer_manager registers the analyzers; each id below is what an index "analyzer" attribute refers to.
+ -->
+ <analyzer_manager logger="core.search.analyzer_manager">
+ <analyzer id="standard" class="org.apache.lucene.analysis.standard.StandardAnalyzer"/>
+ <analyzer id="stopword_en" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/English_en.xml" checkupdate="true"/>
+ <analyzer id="stopword_fr" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/French_fr.xml" checkupdate="true"/>
+ <analyzer id="analyzer_research" class="org.apache.cocoon.components.search.analyzer.ConfigurablePerFieldAnalyzer" configfile="context://WEB-INF/analyzer/perfieldconf.xml" checkupdate="false"/>
+ </analyzer_manager>
+
+ <index_manager logger="core.search.index_manager">
+
+ <indexer role="org.apache.cocoon.components.search.components.Indexer/default" />
+
+ <!-- ALL indexes (BE CAREFUL: change each directory attribute; the d:\\ values below are hard-coded drive-letter paths) -->
+ <indexes>
+
+ <!--
+ id attribute: the index id
+ analyzer attribute: the id of the default analyzer (one of the ids registered in analyzer_manager)
+ directory attribute: the location of the physical index
+ -->
+ <index id="research" analyzer="analyzer_research" directory="d:\\index">
+ <structure>
+ <!--
+ type text: tokenized, indexed (the additional attribute, written "storetext" below, selects stored/unstored)
+ type keyword: not tokenized, indexed, stored
+ type date: same as type keyword, but for date values (presumably parsed with the "dateformat" pattern; TODO confirm)
+ -->
+ <field id="title" type="text" storetext="true"/>
+ <field id="author" type="text"/>
+ <field id="description_fr" type="text" storetext="true"/>
+ <field id="description_en" type="text" storetext="true"/>
+ <field id="date" type="date" dateformat="yyyy-MM-dd"/>
+ <field id="subject" type="keyword"/>
+ <field id="level" type="keyword"/>
+ <field id="type" type="keyword" />
+ <field id="format" type="keyword" />
+ <field id="topic" type="keyword" />
+ </structure>
+ </index>
+
+ <!-- Standard HTML index: url keyword plus title (stored) and body (not stored) text fields -->
+ <index id="HTML" analyzer="stopword_en" directory="d:\\index2" >
+ <structure>
+ <field id="url" type="keyword" />
+ <field id="title" type="text" storetext="true"/>
+ <field id="body" type="text" storetext="false"/>
+ </structure>
+ </index>
+ </indexes>
+ </index_manager>
+
+<!-- Default indexer component (presumably the implementation behind the "Indexer/default" role used by index_manager; TODO confirm) -->
+ <default_indexer logger="core.search.default_indexer">
+ <!-- number of Lucene documents held in the buffer -->
+ <buffersize>200</buffersize>
+ </default_indexer>
+
+<!-- Parallel indexer component -->
+ <parallel_indexer logger="core.search.parallel_indexer">
+ <!-- number of threads (normally = number of CPUs) -->
+ <numthread>2</numthread>
+ </parallel_indexer>
+
+
+</components>
---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscribe@lenya.apache.org
For additional commands, e-mail: commits-help@lenya.apache.org