You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@lenya.apache.org by ru...@apache.org on 2011/02/02 19:45:30 UTC
svn commit: r1066576 - in /lenya/branches/BRANCH_2_1_X/src:
modules/lucene/config/cocoon-xconf/analyzer_manager.xconf
webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml
webapp/WEB-INF/analyzer/stopword/Russian_ru.xml
Author: rudolf
Date: Wed Feb 2 18:45:29 2011
New Revision: 1066576
URL: http://svn.apache.org/viewvc?rev=1066576&view=rev
Log:
add russian and arabic stopword files
Added:
lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml
Modified:
lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf
lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml
Modified: lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf
URL: http://svn.apache.org/viewvc/lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf?rev=1066576&r1=1066575&r2=1066576&view=diff
==============================================================================
--- lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf (original)
+++ lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf Wed Feb 2 18:45:29 2011
@@ -21,6 +21,7 @@
<analyzer_manager logger="core.search.analyzer_manager">
<analyzer id="standard" class="org.apache.lucene.analysis.standard.StandardAnalyzer"/>
+ <analyzer id="stopword_ar" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Arabic_ar.xml" checkupdate="true"/>
<analyzer id="stopword_da" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Danish_da.xml" checkupdate="true"/>
<analyzer id="stopword_nl" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Dutch_nl.xml" checkupdate="true"/>
<analyzer id="stopword_en" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/English_en.xml" checkupdate="true"/>
@@ -31,9 +32,7 @@
<analyzer id="stopword_no" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Norwegian_no.xml" checkupdate="true"/>
<analyzer id="stopword_pl" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Polish_pl.xml" checkupdate="true"/>
<analyzer id="stopword_pt" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Portuguese_pt.xml" checkupdate="true"/>
- <!--
<analyzer id="stopword_ru" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Russian_ru.xml" checkupdate="true"/>
- -->
<analyzer id="stopword_es" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Spanish_es.xml" checkupdate="true"/>
<analyzer id="stopword_sv" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Swedish_sv.xml" checkupdate="true"/>
<analyzer id="analyzer_research" class="org.apache.cocoon.components.search.analyzer.ConfigurablePerFieldAnalyzer" configfile="context://WEB-INF/analyzer/perfieldconf.xml" checkupdate="false"/>
Added: lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml
URL: http://svn.apache.org/viewvc/lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml?rev=1066576&view=auto
==============================================================================
--- lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml (added)
+++ lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml Wed Feb 2 18:45:29 2011
@@ -0,0 +1,124 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<stopwords>
+ <stopword>من</stopword>
+ <stopword>ومن</stopword>
+ <stopword>منها</stopword>
+ <stopword>منه</stopword>
+ <stopword>في</stopword>
+ <stopword>وفي</stopword>
+ <stopword>فيها</stopword>
+ <stopword>فيه</stopword>
+ <stopword>و</stopword>
+ <stopword>ف</stopword>
+ <stopword>ثم</stopword>
+ <stopword>او</stopword>
+ <stopword>أو</stopword>
+ <stopword>ب</stopword>
+ <stopword>بها</stopword>
+ <stopword>به</stopword>
+ <stopword>ا</stopword>
+ <stopword>أ</stopword>
+ <stopword>اى</stopword>
+ <stopword>اي</stopword>
+ <stopword>أي</stopword>
+ <stopword>أى</stopword>
+ <stopword>لا</stopword>
+ <stopword>ولا</stopword>
+ <stopword>الا</stopword>
+ <stopword>ألا</stopword>
+ <stopword>إلا</stopword>
+ <stopword>لكن</stopword>
+ <stopword>ما</stopword>
+ <stopword>وما</stopword>
+ <stopword>كما</stopword>
+ <stopword>فما</stopword>
+ <stopword>عن</stopword>
+ <stopword>مع</stopword>
+ <stopword>اذا</stopword>
+ <stopword>إذا</stopword>
+ <stopword>ان</stopword>
+ <stopword>أن</stopword>
+ <stopword>إن</stopword>
+ <stopword>انها</stopword>
+ <stopword>أنها</stopword>
+ <stopword>إنها</stopword>
+ <stopword>انه</stopword>
+ <stopword>أنه</stopword>
+ <stopword>إنه</stopword>
+ <stopword>بان</stopword>
+ <stopword>بأن</stopword>
+ <stopword>فان</stopword>
+ <stopword>فأن</stopword>
+ <stopword>وان</stopword>
+ <stopword>وأن</stopword>
+ <stopword>وإن</stopword>
+ <stopword>التى</stopword>
+ <stopword>التي</stopword>
+ <stopword>الذى</stopword>
+ <stopword>الذي</stopword>
+ <stopword>الذين</stopword>
+ <stopword>الى</stopword>
+ <stopword>الي</stopword>
+ <stopword>إلى</stopword>
+ <stopword>إلي</stopword>
+ <stopword>على</stopword>
+ <stopword>عليها</stopword>
+ <stopword>عليه</stopword>
+ <stopword>اما</stopword>
+ <stopword>أما</stopword>
+ <stopword>إما</stopword>
+ <stopword>ايضا</stopword>
+ <stopword>أيضا</stopword>
+ <stopword>كل</stopword>
+ <stopword>وكل</stopword>
+ <stopword>لم</stopword>
+ <stopword>ولم</stopword>
+ <stopword>لن</stopword>
+ <stopword>ولن</stopword>
+ <stopword>هى</stopword>
+ <stopword>هي</stopword>
+ <stopword>هو</stopword>
+ <stopword>وهى</stopword>
+ <stopword>وهي</stopword>
+ <stopword>وهو</stopword>
+ <stopword>فهى</stopword>
+ <stopword>فهي</stopword>
+ <stopword>فهو</stopword>
+ <stopword>انت</stopword>
+ <stopword>أنت</stopword>
+ <stopword>لك</stopword>
+ <stopword>لها</stopword>
+ <stopword>له</stopword>
+ <stopword>هذه</stopword>
+ <stopword>هذا</stopword>
+ <stopword>تلك</stopword>
+ <stopword>ذلك</stopword>
+ <stopword>هناك</stopword>
+ <stopword>كانت</stopword>
+ <stopword>كان</stopword>
+ <stopword>يكون</stopword>
+ <stopword>تكون</stopword>
+ <stopword>وكانت</stopword>
+ <stopword>وكان</stopword>
+ <stopword>غير</stopword>
+ <stopword>بعض</stopword>
+ <stopword>قد</stopword>
+ <stopword>نحو</stopword>
+ <stopword>بين</stopword>
+ <stopword>بينما</stopword>
+ <stopword>منذ</stopword>
+ <stopword>ضمن</stopword>
+ <stopword>حيث</stopword>
+ <stopword>الان</stopword>
+ <stopword>الآن</stopword>
+ <stopword>خلال</stopword>
+ <stopword>بعد</stopword>
+ <stopword>قبل</stopword>
+ <stopword>حتى</stopword>
+ <stopword>عند</stopword>
+ <stopword>عندما</stopword>
+ <stopword>لدى</stopword>
+ <stopword>جميع</stopword>
+</stopwords>
+
Modified: lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml
URL: http://svn.apache.org/viewvc/lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml?rev=1066576&r1=1066575&r2=1066576&view=diff
==============================================================================
--- lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml (original)
+++ lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml Wed Feb 2 18:45:29 2011
@@ -1,101 +1,164 @@
<?xml version="1.0" encoding="UTF-8"?>
+
<stopwords>
-<stopword>а</stopword>
-<stopword>без</stopword>
-<stopword>более</stopword>
-<stopword>бÑ</stopword>
-<stopword>бÑл</stopword>
-<stopword>бÑла</stopword>
-<stopword>бÑли</stopword>
-<stopword>бÑло</stopword>
-<stopword>бÑÑÑ</stopword>
-<stopword>в</stopword>
-<stopword>вам</stopword>
-<stopword>ваÑ?</stopword>
-<stopword>веÑ?Ñ</stopword>
-<stopword>во</stopword>
-<stopword>воÑ</stopword>
-<stopword>вÑ?е</stopword>
-<stopword>вÑ?его</stopword>
-<stopword>вÑ?еÑ
</stopword>
-<stopword>вÑ</stopword>
-<stopword>где</stopword>
-<stopword>да</stopword>
-<stopword>даже</stopword>
-<stopword>длÑ?</stopword>
-<stopword>до</stopword>
-<stopword>его</stopword>
-<stopword>ее</stopword>
-<stopword>еÑ?ли</stopword>
-<stopword>еÑ?ÑÑ</stopword>
-<stopword>еÑе</stopword>
-<stopword>же</stopword>
-<stopword>за</stopword>
-<stopword>здеÑ?Ñ</stopword>
-<stopword>и</stopword>
-<stopword>из</stopword>
-<stopword>или</stopword>
-<stopword>им</stopword>
-<stopword>иÑ
</stopword>
-<stopword>к</stopword>
-<stopword>как</stopword>
-<stopword>ко</stopword>
-<stopword>когда</stopword>
-<stopword>кÑо</stopword>
-<stopword>ли</stopword>
-<stopword>либо</stopword>
-<stopword>мне</stopword>
-<stopword>можеÑ</stopword>
-<stopword>мÑ</stopword>
-<stopword>на</stopword>
-<stopword>надо</stopword>
-<stopword>наÑ</stopword>
-<stopword>не</stopword>
-<stopword>него</stopword>
-<stopword>нее</stopword>
-<stopword>неÑ</stopword>
-<stopword>ни</stopword>
-<stopword>ниÑ
</stopword>
-<stopword>но</stopword>
-<stopword>нÑ</stopword>
-<stopword>о</stopword>
-<stopword>об</stopword>
-<stopword>однако</stopword>
-<stopword>он</stopword>
-<stopword>она</stopword>
-<stopword>они</stopword>
-<stopword>оно</stopword>
-<stopword>оÑ</stopword>
-<stopword>оÑенÑ</stopword>
-<stopword>по</stopword>
-<stopword>под</stopword>
-<stopword>пÑи</stopword>
-<stopword>Ñ?</stopword>
-<stopword>Ñ?о</stopword>
-<stopword>Ñак</stopword>
-<stopword>Ñакже</stopword>
-<stopword>Ñакой</stopword>
-<stopword>Ñам</stopword>
-<stopword>Ñе</stopword>
-<stopword>Ñем</stopword>
-<stopword>Ñо</stopword>
-<stopword>Ñого</stopword>
-<stopword>Ñоже</stopword>
-<stopword>Ñой</stopword>
-<stopword>ÑолÑко</stopword>
-<stopword>Ñом</stopword>
-<stopword>ÑÑ</stopword>
-<stopword>Ñ</stopword>
-<stopword>Ñже</stopword>
-<stopword>Ñ
оÑÑ?</stopword>
-<stopword>Ñего</stopword>
-<stopword>Ñей</stopword>
-<stopword>Ñем</stopword>
-<stopword>ÑÑо</stopword>
-<stopword>ÑÑобÑ</stopword>
-<stopword>ÑÑе</stopword>
-<stopword>ÑÑÑ?</stopword>
-<stopword>Ñ?Ñа</stopword>
-<stopword>Ñ?Ñи</stopword>
-<stopword>Ñ?Ñо</stopword>
-<stopword>Ñ?</stopword></stopwords>
+ <stopword>и</stopword>
+ <stopword>в</stopword>
+ <stopword>во</stopword>
+ <stopword>не</stopword>
+ <stopword>что</stopword>
+ <stopword>он</stopword>
+ <stopword>на</stopword>
+ <stopword>я</stopword>
+ <stopword>с</stopword>
+ <stopword>со</stopword>
+ <stopword>как</stopword>
+ <stopword>а</stopword>
+ <stopword>то</stopword>
+ <stopword>все</stopword>
+ <stopword>она</stopword>
+ <stopword>так</stopword>
+ <stopword>его</stopword>
+ <stopword>но</stopword>
+ <stopword>да</stopword>
+ <stopword>ты</stopword>
+ <stopword>к</stopword>
+ <stopword>у</stopword>
+ <stopword>же</stopword>
+ <stopword>вы</stopword>
+ <stopword>за</stopword>
+ <stopword>бы</stopword>
+ <stopword>по</stopword>
+ <stopword>только</stopword>
+ <stopword>ее</stopword>
+ <stopword>мне</stopword>
+ <stopword>было</stopword>
+ <stopword>вот</stopword>
+ <stopword>от</stopword>
+ <stopword>меня</stopword>
+ <stopword>еще</stopword>
+ <stopword>нет</stopword>
+ <stopword>о</stopword>
+ <stopword>из</stopword>
+ <stopword>ему</stopword>
+ <stopword>теперь</stopword>
+ <stopword>когда</stopword>
+ <stopword>даже</stopword>
+ <stopword>ну</stopword>
+ <stopword>вдруг</stopword>
+ <stopword>ли</stopword>
+ <stopword>если</stopword>
+ <stopword>уже</stopword>
+ <stopword>или</stopword>
+ <stopword>ни</stopword>
+ <stopword>быть</stopword>
+ <stopword>был</stopword>
+ <stopword>него</stopword>
+ <stopword>до</stopword>
+ <stopword>вас</stopword>
+ <stopword>нибудь</stopword>
+ <stopword>опять</stopword>
+ <stopword>уж</stopword>
+ <stopword>вам</stopword>
+ <stopword>сказал</stopword>
+ <stopword>ведь</stopword>
+ <stopword>там</stopword>
+ <stopword>потом</stopword>
+ <stopword>себя</stopword>
+ <stopword>ничего</stopword>
+ <stopword>ей</stopword>
+ <stopword>может</stopword>
+ <stopword>они</stopword>
+ <stopword>тут</stopword>
+ <stopword>где</stopword>
+ <stopword>есть</stopword>
+ <stopword>надо</stopword>
+ <stopword>ней</stopword>
+ <stopword>для</stopword>
+ <stopword>мы</stopword>
+ <stopword>тебя</stopword>
+ <stopword>их</stopword>
+ <stopword>чем</stopword>
+ <stopword>была</stopword>
+ <stopword>сам</stopword>
+ <stopword>чтоб</stopword>
+ <stopword>без</stopword>
+ <stopword>будто</stopword>
+ <stopword>человек</stopword>
+ <stopword>чего</stopword>
+ <stopword>раз</stopword>
+ <stopword>тоже</stopword>
+ <stopword>себе</stopword>
+ <stopword>под</stopword>
+ <stopword>жизнь</stopword>
+ <stopword>будет</stopword>
+ <stopword>ж</stopword>
+ <stopword>тогда</stopword>
+ <stopword>кто</stopword>
+ <stopword>этот</stopword>
+ <stopword>говорил</stopword>
+ <stopword>того</stopword>
+ <stopword>потому</stopword>
+ <stopword>этого</stopword>
+ <stopword>какой</stopword>
+ <stopword>совсем</stopword>
+ <stopword>ним</stopword>
+ <stopword>здесь</stopword>
+ <stopword>этом</stopword>
+ <stopword>один</stopword>
+ <stopword>почти</stopword>
+ <stopword>мой</stopword>
+ <stopword>тем</stopword>
+ <stopword>чтобы</stopword>
+ <stopword>нее</stopword>
+ <stopword>кажется</stopword>
+ <stopword>сейчас</stopword>
+ <stopword>были</stopword>
+ <stopword>куда</stopword>
+ <stopword>зачем</stopword>
+ <stopword>сказать</stopword>
+ <stopword>всех</stopword>
+ <stopword>никогда</stopword>
+ <stopword>сегодня</stopword>
+ <stopword>можно</stopword>
+ <stopword>при</stopword>
+ <stopword>наконец</stopword>
+ <stopword>два</stopword>
+ <stopword>об</stopword>
+ <stopword>другой</stopword>
+ <stopword>хоть</stopword>
+ <stopword>после</stopword>
+ <stopword>над</stopword>
+ <stopword>больше</stopword>
+ <stopword>тот</stopword>
+ <stopword>через</stopword>
+ <stopword>эти</stopword>
+ <stopword>нас</stopword>
+ <stopword>про</stopword>
+ <stopword>всего</stopword>
+ <stopword>них</stopword>
+ <stopword>какая</stopword>
+ <stopword>много</stopword>
+ <stopword>разве</stopword>
+ <stopword>сказала</stopword>
+ <stopword>три</stopword>
+ <stopword>эту</stopword>
+ <stopword>моя</stopword>
+ <stopword>впрочем</stopword>
+ <stopword>хорошо</stopword>
+ <stopword>свою</stopword>
+ <stopword>этой</stopword>
+ <stopword>перед</stopword>
+ <stopword>иногда</stopword>
+ <stopword>лучше</stopword>
+ <stopword>чуть</stopword>
+ <stopword>том</stopword>
+ <stopword>нельзя</stopword>
+ <stopword>такой</stopword>
+ <stopword>им</stopword>
+ <stopword>более</stopword>
+ <stopword>всегда</stopword>
+ <stopword>конечно</stopword>
+ <stopword>всю</stopword>
+ <stopword>между</stopword>
+</stopwords>
+
---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscribe@lenya.apache.org
For additional commands, e-mail: commits-help@lenya.apache.org
Re: svn commit: r1066576 - in /lenya/branches/BRANCH_2_1_X/src: modules/lucene/config/cocoon-xconf/analyzer_manager.xconf
webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml webapp/WEB-INF/analyzer/stopword/Russian_ru.xml
Posted by ru...@uniklinik-freiburg.de.
Hi Florent,
florent andré <fl...@4sengines.com> schrieb am 03.02.2011
01:14:24:
> Von: florent andré <fl...@4sengines.com>
> An: dev@lenya.apache.org
> Datum: 03.02.2011 01:15
> Betreff: Re: svn commit: r1066576 - in /lenya/branches/BRANCH_2_1_X/
> src: modules/lucene/config/cocoon-xconf/analyzer_manager.xconf
> webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml webapp/WEB-INF/
> analyzer/stopword/Russian_ru.xml
>
> Hi,
> What is a stopword? What is it used for?
>
Stopwords are simple words that are not indexed by Lucene.
We are building a site in Russian and Arabic, but stopword support
had not been implemented for these languages.
Does anyone know how to do it for Chinese?
(Maybe we will have to provide this in the near future.)
Rudolf
---------------------------------------------------------------------
To unsubscribe, e-mail: dev-unsubscribe@lenya.apache.org
For additional commands, e-mail: dev-help@lenya.apache.org
Re: svn commit: r1066576 - in /lenya/branches/BRANCH_2_1_X/src: modules/lucene/config/cocoon-xconf/analyzer_manager.xconf
webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml webapp/WEB-INF/analyzer/stopword/Russian_ru.xml
Posted by florent andré <fl...@4sengines.com>.
Hi,
What is a stopword? What is it used for?
Seems cool, linked to Lucene...
Thanks.
On 02/02/2011 07:45 PM, rudolf@apache.org wrote:
> Author: rudolf
> Date: Wed Feb 2 18:45:29 2011
> New Revision: 1066576
>
> URL: http://svn.apache.org/viewvc?rev=1066576&view=rev
> Log:
> add russian and arabic stopword files
>
> Added:
> lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml
> Modified:
> lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf
> lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml
>
> Modified: lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf
> URL: http://svn.apache.org/viewvc/lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf?rev=1066576&r1=1066575&r2=1066576&view=diff
> ==============================================================================
> --- lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf (original)
> +++ lenya/branches/BRANCH_2_1_X/src/modules/lucene/config/cocoon-xconf/analyzer_manager.xconf Wed Feb 2 18:45:29 2011
> @@ -21,6 +21,7 @@
>
> <analyzer_manager logger="core.search.analyzer_manager">
> <analyzer id="standard" class="org.apache.lucene.analysis.standard.StandardAnalyzer"/>
> + <analyzer id="stopword_ar" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Arabic_ar.xml" checkupdate="true"/>
> <analyzer id="stopword_da" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Danish_da.xml" checkupdate="true"/>
> <analyzer id="stopword_nl" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Dutch_nl.xml" checkupdate="true"/>
> <analyzer id="stopword_en" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/English_en.xml" checkupdate="true"/>
> @@ -31,9 +32,7 @@
> <analyzer id="stopword_no" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Norwegian_no.xml" checkupdate="true"/>
> <analyzer id="stopword_pl" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Polish_pl.xml" checkupdate="true"/>
> <analyzer id="stopword_pt" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Portuguese_pt.xml" checkupdate="true"/>
> - <!--
> <analyzer id="stopword_ru" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Russian_ru.xml" checkupdate="true"/>
> - -->
> <analyzer id="stopword_es" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Spanish_es.xml" checkupdate="true"/>
> <analyzer id="stopword_sv" class="org.apache.cocoon.components.search.analyzer.ConfigurableStopwordAnalyzer" configfile="context://WEB-INF/analyzer/stopword/Swedish_sv.xml" checkupdate="true"/>
> <analyzer id="analyzer_research" class="org.apache.cocoon.components.search.analyzer.ConfigurablePerFieldAnalyzer" configfile="context://WEB-INF/analyzer/perfieldconf.xml" checkupdate="false"/>
>
> Added: lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml
> URL: http://svn.apache.org/viewvc/lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml?rev=1066576&view=auto
> ==============================================================================
> --- lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml (added)
> +++ lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Arabic_ar.xml Wed Feb 2 18:45:29 2011
> @@ -0,0 +1,124 @@
> +<?xml version="1.0" encoding="UTF-8"?>
> +
> +<stopwords>
> + <stopword>Ù
Ù</stopword>
> + <stopword>ÙÙ
Ù</stopword>
> + <stopword>Ù
ÙÙا</stopword>
> + <stopword>Ù
ÙÙ</stopword>
> + <stopword>ÙÙ</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>ÙÙÙا</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>Ù</stopword>
> + <stopword>Ù</stopword>
> + <stopword>Ø«Ù
</stopword>
> + <stopword>اÙ</stopword>
> + <stopword>Ø£Ù</stopword>
> + <stopword>ب</stopword>
> + <stopword>بÙا</stopword>
> + <stopword>بÙ</stopword>
> + <stopword>ا</stopword>
> + <stopword>Ø£</stopword>
> + <stopword>اÙ</stopword>
> + <stopword>اÙ</stopword>
> + <stopword>Ø£Ù</stopword>
> + <stopword>Ø£Ù</stopword>
> + <stopword>Ùا</stopword>
> + <stopword>ÙÙا</stopword>
> + <stopword>اÙا</stopword>
> + <stopword>Ø£Ùا</stopword>
> + <stopword>Ø¥Ùا</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>Ù
ا</stopword>
> + <stopword>ÙÙ
ا</stopword>
> + <stopword>ÙÙ
ا</stopword>
> + <stopword>ÙÙ
ا</stopword>
> + <stopword>عÙ</stopword>
> + <stopword>Ù
ع</stopword>
> + <stopword>اذا</stopword>
> + <stopword>إذا</stopword>
> + <stopword>اÙ</stopword>
> + <stopword>Ø£Ù</stopword>
> + <stopword>Ø¥Ù</stopword>
> + <stopword>اÙÙا</stopword>
> + <stopword>Ø£ÙÙا</stopword>
> + <stopword>Ø¥ÙÙا</stopword>
> + <stopword>اÙÙ</stopword>
> + <stopword>Ø£ÙÙ</stopword>
> + <stopword>Ø¥ÙÙ</stopword>
> + <stopword>باÙ</stopword>
> + <stopword>بأÙ</stopword>
> + <stopword>ÙاÙ</stopword>
> + <stopword>ÙØ£Ù</stopword>
> + <stopword>ÙاÙ</stopword>
> + <stopword>ÙØ£Ù</stopword>
> + <stopword>ÙØ¥Ù</stopword>
> + <stopword>اÙتÙ</stopword>
> + <stopword>اÙتÙ</stopword>
> + <stopword>اÙØ°Ù</stopword>
> + <stopword>اÙØ°Ù</stopword>
> + <stopword>اÙØ°ÙÙ</stopword>
> + <stopword>اÙÙ</stopword>
> + <stopword>اÙÙ</stopword>
> + <stopword>Ø¥ÙÙ</stopword>
> + <stopword>Ø¥ÙÙ</stopword>
> + <stopword>عÙÙ</stopword>
> + <stopword>عÙÙÙا</stopword>
> + <stopword>عÙÙÙ</stopword>
> + <stopword>اÙ
ا</stopword>
> + <stopword>Ø£Ù
ا</stopword>
> + <stopword>Ø¥Ù
ا</stopword>
> + <stopword>اÙضا</stopword>
> + <stopword>Ø£Ùضا</stopword>
> + <stopword>ÙÙ</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>ÙÙ
</stopword>
> + <stopword>ÙÙÙ
</stopword>
> + <stopword>ÙÙ</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>ÙÙ</stopword>
> + <stopword>ÙÙ</stopword>
> + <stopword>ÙÙ</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>ÙÙÙ</stopword>
> + <stopword>اÙت</stopword>
> + <stopword>Ø£Ùت</stopword>
> + <stopword>ÙÙ</stopword>
> + <stopword>ÙÙا</stopword>
> + <stopword>ÙÙ</stopword>
> + <stopword>ÙØ°Ù</stopword>
> + <stopword>Ùذا</stopword>
> + <stopword>تÙÙ</stopword>
> + <stopword>Ø°ÙÙ</stopword>
> + <stopword>ÙÙاÙ</stopword>
> + <stopword>ÙاÙت</stopword>
> + <stopword>ÙاÙ</stopword>
> + <stopword>ÙÙÙÙ</stopword>
> + <stopword>تÙÙÙ</stopword>
> + <stopword>ÙÙاÙت</stopword>
> + <stopword>ÙÙاÙ</stopword>
> + <stopword>غÙر</stopword>
> + <stopword>بعض</stopword>
> + <stopword>Ùد</stopword>
> + <stopword>ÙØÙ</stopword>
> + <stopword>بÙÙ</stopword>
> + <stopword>بÙÙÙ
ا</stopword>
> + <stopword>Ù
ÙØ°</stopword>
> + <stopword>ضÙ
Ù</stopword>
> + <stopword>ØÙØ«</stopword>
> + <stopword>اÙاÙ</stopword>
> + <stopword>اÙØ¢Ù</stopword>
> + <stopword>Ø®ÙاÙ</stopword>
> + <stopword>بعد</stopword>
> + <stopword>ÙبÙ</stopword>
> + <stopword>ØتÙ</stopword>
> + <stopword>عÙد</stopword>
> + <stopword>عÙدÙ
ا</stopword>
> + <stopword>ÙدÙ</stopword>
> + <stopword>جÙ
Ùع</stopword>
> +</stopwords>
> +
>
> Modified: lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml
> URL: http://svn.apache.org/viewvc/lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml?rev=1066576&r1=1066575&r2=1066576&view=diff
> ==============================================================================
> --- lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml (original)
> +++ lenya/branches/BRANCH_2_1_X/src/webapp/WEB-INF/analyzer/stopword/Russian_ru.xml Wed Feb 2 18:45:29 2011
> @@ -1,101 +1,164 @@
> <?xml version="1.0" encoding="UTF-8"?>
> +
> <stopwords>
> -<stopword>а</stopword>
> -<stopword>без</stopword>
> -<stopword>более</stopword>
> -<stopword>бÑ</stopword>
> -<stopword>бÑл</stopword>
> -<stopword>бÑла</stopword>
> -<stopword>бÑли</stopword>
> -<stopword>бÑло</stopword>
> -<stopword>бÑÑÑ</stopword>
> -<stopword>в</stopword>
> -<stopword>вам</stopword>
> -<stopword>ваÑ?</stopword>
> -<stopword>веÑ?Ñ</stopword>
> -<stopword>во</stopword>
> -<stopword>воÑ</stopword>
> -<stopword>вÑ?е</stopword>
> -<stopword>вÑ?его</stopword>
> -<stopword>вÑ?еÑ
</stopword>
> -<stopword>вÑ</stopword>
> -<stopword>где</stopword>
> -<stopword>да</stopword>
> -<stopword>даже</stopword>
> -<stopword>длÑ?</stopword>
> -<stopword>до</stopword>
> -<stopword>его</stopword>
> -<stopword>ее</stopword>
> -<stopword>еÑ?ли</stopword>
> -<stopword>еÑ?ÑÑ</stopword>
> -<stopword>еÑе</stopword>
> -<stopword>же</stopword>
> -<stopword>за</stopword>
> -<stopword>здеÑ?Ñ</stopword>
> -<stopword>и</stopword>
> -<stopword>из</stopword>
> -<stopword>или</stopword>
> -<stopword>им</stopword>
> -<stopword>иÑ
</stopword>
> -<stopword>к</stopword>
> -<stopword>как</stopword>
> -<stopword>ко</stopword>
> -<stopword>когда</stopword>
> -<stopword>кÑо</stopword>
> -<stopword>ли</stopword>
> -<stopword>либо</stopword>
> -<stopword>мне</stopword>
> -<stopword>можеÑ</stopword>
> -<stopword>мÑ</stopword>
> -<stopword>на</stopword>
> -<stopword>надо</stopword>
> -<stopword>наÑ</stopword>
> -<stopword>не</stopword>
> -<stopword>него</stopword>
> -<stopword>нее</stopword>
> -<stopword>неÑ</stopword>
> -<stopword>ни</stopword>
> -<stopword>ниÑ
</stopword>
> -<stopword>но</stopword>
> -<stopword>нÑ</stopword>
> -<stopword>о</stopword>
> -<stopword>об</stopword>
> -<stopword>однако</stopword>
> -<stopword>он</stopword>
> -<stopword>она</stopword>
> -<stopword>они</stopword>
> -<stopword>оно</stopword>
> -<stopword>оÑ</stopword>
> -<stopword>оÑенÑ</stopword>
> -<stopword>по</stopword>
> -<stopword>под</stopword>
> -<stopword>пÑи</stopword>
> -<stopword>Ñ?</stopword>
> -<stopword>Ñ?о</stopword>
> -<stopword>Ñак</stopword>
> -<stopword>Ñакже</stopword>
> -<stopword>Ñакой</stopword>
> -<stopword>Ñам</stopword>
> -<stopword>Ñе</stopword>
> -<stopword>Ñем</stopword>
> -<stopword>Ñо</stopword>
> -<stopword>Ñого</stopword>
> -<stopword>Ñоже</stopword>
> -<stopword>Ñой</stopword>
> -<stopword>ÑолÑко</stopword>
> -<stopword>Ñом</stopword>
> -<stopword>ÑÑ</stopword>
> -<stopword>Ñ</stopword>
> -<stopword>Ñже</stopword>
> -<stopword>Ñ
оÑÑ?</stopword>
> -<stopword>Ñего</stopword>
> -<stopword>Ñей</stopword>
> -<stopword>Ñем</stopword>
> -<stopword>ÑÑо</stopword>
> -<stopword>ÑÑобÑ</stopword>
> -<stopword>ÑÑе</stopword>
> -<stopword>ÑÑÑ?</stopword>
> -<stopword>Ñ?Ñа</stopword>
> -<stopword>Ñ?Ñи</stopword>
> -<stopword>Ñ?Ñо</stopword>
> -<stopword>Ñ?</stopword></stopwords>
> + <stopword>и</stopword>
> + <stopword>в</stopword>
> + <stopword>во</stopword>
> + <stopword>не</stopword>
> + <stopword>ÑÑо</stopword>
> + <stopword>он</stopword>
> + <stopword>на</stopword>
> + <stopword>Ñ</stopword>
> + <stopword>Ñ</stopword>
> + <stopword>Ñо</stopword>
> + <stopword>как</stopword>
> + <stopword>а</stopword>
> + <stopword>Ñо</stopword>
> + <stopword>вÑе</stopword>
> + <stopword>она</stopword>
> + <stopword>Ñак</stopword>
> + <stopword>его</stopword>
> + <stopword>но</stopword>
> + <stopword>да</stopword>
> + <stopword>ÑÑ</stopword>
> + <stopword>к</stopword>
> + <stopword>Ñ</stopword>
> + <stopword>же</stopword>
> + <stopword>вÑ</stopword>
> + <stopword>за</stopword>
> + <stopword>бÑ</stopword>
> + <stopword>по</stopword>
> + <stopword>ÑолÑко</stopword>
> + <stopword>ее</stopword>
> + <stopword>мне</stopword>
> + <stopword>бÑло</stopword>
> + <stopword>воÑ</stopword>
> + <stopword>оÑ</stopword>
> + <stopword>менÑ</stopword>
> + <stopword>еÑе</stopword>
> + <stopword>неÑ</stopword>
> + <stopword>о</stopword>
> + <stopword>из</stopword>
> + <stopword>емÑ</stopword>
> + <stopword>ÑепеÑÑ</stopword>
> + <stopword>когда</stopword>
> + <stopword>даже</stopword>
> + <stopword>нÑ</stopword>
> + <stopword>вдÑÑг</stopword>
> + <stopword>ли</stopword>
> + <stopword>еÑли</stopword>
> + <stopword>Ñже</stopword>
> + <stopword>или</stopword>
> + <stopword>ни</stopword>
> + <stopword>бÑÑÑ</stopword>
> + <stopword>бÑл</stopword>
> + <stopword>него</stopword>
> + <stopword>до</stopword>
> + <stopword>ваÑ</stopword>
> + <stopword>нибÑдÑ</stopword>
> + <stopword>опÑÑÑ</stopword>
> + <stopword>Ñж</stopword>
> + <stopword>вам</stopword>
> + <stopword>Ñказал</stopword>
> + <stopword>ведÑ</stopword>
> + <stopword>Ñам</stopword>
> + <stopword>поÑом</stopword>
> + <stopword>ÑебÑ</stopword>
> + <stopword>ниÑего</stopword>
> + <stopword>ей</stopword>
> + <stopword>можеÑ</stopword>
> + <stopword>они</stopword>
> + <stopword>ÑÑÑ</stopword>
> + <stopword>где</stopword>
> + <stopword>еÑÑÑ</stopword>
> + <stopword>надо</stopword>
> + <stopword>ней</stopword>
> + <stopword>длÑ</stopword>
> + <stopword>мÑ</stopword>
> + <stopword>ÑебÑ</stopword>
> + <stopword>иÑ
</stopword>
> + <stopword>Ñем</stopword>
> + <stopword>бÑла</stopword>
> + <stopword>Ñам</stopword>
> + <stopword>ÑÑоб</stopword>
> + <stopword>без</stopword>
> + <stopword>бÑдÑо</stopword>
> + <stopword>Ñеловек</stopword>
> + <stopword>Ñего</stopword>
> + <stopword>Ñаз</stopword>
> + <stopword>Ñоже</stopword>
> + <stopword>Ñебе</stopword>
> + <stopword>под</stopword>
> + <stopword>жизнÑ</stopword>
> + <stopword>бÑдеÑ</stopword>
> + <stopword>ж</stopword>
> + <stopword>Ñогда</stopword>
> + <stopword>кÑо</stopword>
> + <stopword>ÑÑоÑ</stopword>
> + <stopword>говоÑил</stopword>
> + <stopword>Ñого</stopword>
> + <stopword>поÑомÑ</stopword>
> + <stopword>ÑÑого</stopword>
> + <stopword>какой</stopword>
> + <stopword>ÑовÑем</stopword>
> + <stopword>ним</stopword>
> + <stopword>здеÑÑ</stopword>
> + <stopword>ÑÑом</stopword>
> + <stopword>один</stopword>
> + <stopword>поÑÑи</stopword>
> + <stopword>мой</stopword>
> + <stopword>Ñем</stopword>
> + <stopword>ÑÑобÑ</stopword>
> + <stopword>нее</stopword>
> + <stopword>кажеÑÑÑ</stopword>
> + <stopword>ÑейÑаÑ</stopword>
> + <stopword>бÑли</stopword>
> + <stopword>кÑда</stopword>
> + <stopword>заÑем</stopword>
> + <stopword>ÑказаÑÑ</stopword>
> + <stopword>вÑеÑ
</stopword>
> + <stopword>никогда</stopword>
> + <stopword>ÑегоднÑ</stopword>
> + <stopword>можно</stopword>
> + <stopword>пÑи</stopword>
> + <stopword>наконеÑ</stopword>
> + <stopword>два</stopword>
> + <stopword>об</stopword>
> + <stopword>дÑÑгой</stopword>
> + <stopword>Ñ
оÑÑ</stopword>
> + <stopword>поÑле</stopword>
> + <stopword>над</stopword>
> + <stopword>болÑÑе</stopword>
> + <stopword>ÑоÑ</stopword>
> + <stopword>ÑеÑез</stopword>
> + <stopword>ÑÑи</stopword>
> + <stopword>наÑ</stopword>
> + <stopword>пÑо</stopword>
> + <stopword>вÑего</stopword>
> + <stopword>ниÑ
</stopword>
> + <stopword>какаÑ</stopword>
> + <stopword>много</stopword>
> + <stopword>Ñазве</stopword>
> + <stopword>Ñказала</stopword>
> + <stopword>ÑÑи</stopword>
> + <stopword>ÑÑÑ</stopword>
> + <stopword>моÑ</stopword>
> + <stopword>впÑоÑем</stopword>
> + <stopword>Ñ
оÑоÑо</stopword>
> + <stopword>ÑвоÑ</stopword>
> + <stopword>ÑÑой</stopword>
> + <stopword>пеÑед</stopword>
> + <stopword>иногда</stopword>
> + <stopword>лÑÑÑе</stopword>
> + <stopword>ÑÑÑÑ</stopword>
> + <stopword>Ñом</stopword>
> + <stopword>нелÑзÑ</stopword>
> + <stopword>Ñакой</stopword>
> + <stopword>им</stopword>
> + <stopword>более</stopword>
> + <stopword>вÑегда</stopword>
> + <stopword>конеÑно</stopword>
> + <stopword>вÑÑ</stopword>
> + <stopword>междÑ</stopword>
> +</stopwords>
> +
>
>
>
> ---------------------------------------------------------------------
> To unsubscribe, e-mail: commits-unsubscribe@lenya.apache.org
> For additional commands, e-mail: commits-help@lenya.apache.org
>
---------------------------------------------------------------------
To unsubscribe, e-mail: dev-unsubscribe@lenya.apache.org
For additional commands, e-mail: dev-help@lenya.apache.org