You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@lucy.apache.org by nw...@apache.org on 2012/02/11 18:05:39 UTC
[lucy-commits] svn commit: r1243100 - in /incubator/lucy/trunk:
core/Lucy/Analysis/PolyAnalyzer.cfh
perl/buildlib/Lucy/Build/Binding/Analysis.pm
Author: nwellnhof
Date: Sat Feb 11 17:05:39 2012
New Revision: 1243100
URL: http://svn.apache.org/viewvc?rev=1243100&view=rev
Log:
Update Analyzer documentation
Modified:
incubator/lucy/trunk/core/Lucy/Analysis/PolyAnalyzer.cfh
incubator/lucy/trunk/perl/buildlib/Lucy/Build/Binding/Analysis.pm
Modified: incubator/lucy/trunk/core/Lucy/Analysis/PolyAnalyzer.cfh
URL: http://svn.apache.org/viewvc/incubator/lucy/trunk/core/Lucy/Analysis/PolyAnalyzer.cfh?rev=1243100&r1=1243099&r2=1243100&view=diff
==============================================================================
--- incubator/lucy/trunk/core/Lucy/Analysis/PolyAnalyzer.cfh (original)
+++ incubator/lucy/trunk/core/Lucy/Analysis/PolyAnalyzer.cfh Sat Feb 11 17:05:39 2012
@@ -26,6 +26,9 @@ parcel Lucy;
* L<RegexTokenizer|Lucy::Analysis::RegexTokenizer>, and a
* L<SnowballStemmer|Lucy::Analysis::SnowballStemmer> will be generated for you.
*
+ * The language parameter is DEPRECATED. Use
+ * L<EasyAnalyzer|Lucy::Analysis::EasyAnalyzer> instead.
+ *
* Supported languages:
*
* en => English,
@@ -54,11 +57,12 @@ class Lucy::Analysis::PolyAnalyzer
/**
* @param language An ISO code from the list of supported languages.
+ * DEPRECATED, use L<EasyAnalyzer|Lucy::Analysis::EasyAnalyzer> instead.
* @param analyzers An array of Analyzers. The order of the analyzers
* matters. Don't put a SnowballStemmer before a RegexTokenizer (can't stem whole
* documents or paragraphs -- just individual words), or a SnowballStopFilter
* after a SnowballStemmer (stemmed words, e.g. "themselv", will not appear in a
- * stoplist). In general, the sequence should be: normalize, tokenize,
+ * stoplist). In general, the sequence should be: tokenize, normalize,
* stopalize, stem.
*/
public inert PolyAnalyzer*
Modified: incubator/lucy/trunk/perl/buildlib/Lucy/Build/Binding/Analysis.pm
URL: http://svn.apache.org/viewvc/incubator/lucy/trunk/perl/buildlib/Lucy/Build/Binding/Analysis.pm?rev=1243100&r1=1243099&r2=1243100&view=diff
==============================================================================
--- incubator/lucy/trunk/perl/buildlib/Lucy/Build/Binding/Analysis.pm (original)
+++ incubator/lucy/trunk/perl/buildlib/Lucy/Build/Binding/Analysis.pm Sat Feb 11 17:05:39 2012
@@ -54,7 +54,7 @@ sub bind_casefolder {
my $case_folder = Lucy::Analysis::CaseFolder->new;
my $polyanalyzer = Lucy::Analysis::PolyAnalyzer->new(
- analyzers => [ $case_folder, $tokenizer, $stemmer ],
+ analyzers => [ $tokenizer, $case_folder, $stemmer ],
);
END_SYNOPSIS
my $constructor = <<'END_CONSTRUCTOR';
@@ -155,7 +155,7 @@ sub bind_normalizer {
my $normalizer = Lucy::Analysis::Normalizer->new;
my $polyanalyzer = Lucy::Analysis::PolyAnalyzer->new(
- analyzers => [ $normalizer, $tokenizer, $stemmer ],
+ analyzers => [ $tokenizer, $normalizer, $stemmer ],
);
END_SYNOPSIS
my $constructor = <<'END_CONSTRUCTOR';
@@ -231,7 +231,7 @@ sub bind_regextokenizer {
# Then... once you have a tokenizer, put it into a PolyAnalyzer:
my $polyanalyzer = Lucy::Analysis::PolyAnalyzer->new(
- analyzers => [ $case_folder, $word_char_tokenizer, $stemmer ], );
+ analyzers => [ $word_char_tokenizer, $normalizer, $stemmer ], );
END_SYNOPSIS
my $constructor = <<'END_CONSTRUCTOR';
my $word_char_tokenizer = Lucy::Analysis::RegexTokenizer->new(
@@ -257,7 +257,7 @@ sub bind_snowballstemmer {
my $stemmer = Lucy::Analysis::SnowballStemmer->new( language => 'es' );
my $polyanalyzer = Lucy::Analysis::PolyAnalyzer->new(
- analyzers => [ $case_folder, $tokenizer, $stemmer ],
+ analyzers => [ $tokenizer, $normalizer, $stemmer ],
);
This class is a wrapper around the Snowball stemming library, so it supports
@@ -286,7 +286,7 @@ sub bind_snowballstopfilter {
language => 'fr',
);
my $polyanalyzer = Lucy::Analysis::PolyAnalyzer->new(
- analyzers => [ $case_folder, $tokenizer, $stopfilter, $stemmer ],
+ analyzers => [ $tokenizer, $normalizer, $stopfilter, $stemmer ],
);
END_SYNOPSIS
my $constructor = <<'END_CONSTRUCTOR';
@@ -319,7 +319,7 @@ sub bind_standardtokenizer {
# Then... once you have a tokenizer, put it into a PolyAnalyzer:
my $polyanalyzer = Lucy::Analysis::PolyAnalyzer->new(
- analyzers => [ $case_folder, $tokenizer, $stemmer ], );
+ analyzers => [ $tokenizer, $normalizer, $stemmer ], );
END_SYNOPSIS
my $constructor = <<'END_CONSTRUCTOR';
my $tokenizer = Lucy::Analysis::StandardTokenizer->new;