You are viewing a plain text version of this content. The canonical link for it is here.
Posted to solr-user@lucene.apache.org by Giovanni Gherdovich <g....@gmail.com> on 2012/06/30 15:51:51 UTC

documentation on the pragmatics behind the example schema.xml

Hi all,

in the example schema.xml I can find a wide variety
of fieldType and field definitions, ready to be used.

I believe each of them has been designed for a specific
use case, with some pragmatics in mind.

Where can I find documentation on what those fields / fieldTypes
were designed for? Is the best place to get that info
the schema.xml file and its comments?

cheers,
GGhh

here I cut and paste fields and fieldTypes I have:

-- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8
   <field name="id" type="string" indexed="true" stored="true"
required="true" />
   <field name="sku" type="textTight" indexed="true" stored="true"
omitNorms="true"/>
   <field name="name" type="textgen" indexed="true" stored="true"/>
   <field name="alphaNameSort" type="alphaOnlySort" indexed="true"
stored="false"/>
   <field name="manu" type="textgen" indexed="true" stored="true"
omitNorms="true"/>
   <field name="cat" type="text_ws" indexed="true" stored="true"
multiValued="true" omitNorms="true" />
   <field name="features" type="text" indexed="true" stored="true"
multiValued="true"/>
   <field name="includes" type="text" indexed="true" stored="true"
termVectors="true" termPositions="true" termOffsets="true" />
   <field name="weight" type="float" indexed="true" stored="true"/>
   <field name="price"  type="float" indexed="true" stored="true"/>
   <field name="popularity" type="int" indexed="true" stored="true" />
   <field name="inStock" type="boolean" indexed="true" stored="true" />
   <field name="title" type="text" indexed="true" stored="true"
multiValued="true"/>
   <field name="subject" type="text" indexed="true" stored="true"/>
   <field name="description" type="text" indexed="true" stored="true"/>
   <field name="comments" type="text" indexed="true" stored="true"/>
   <field name="author" type="textgen" indexed="true" stored="true"/>
   <field name="keywords" type="textgen" indexed="true" stored="true"/>
   <field name="category" type="textgen" indexed="true" stored="true"/>
   <field name="content_type" type="string" indexed="true"
stored="true" multiValued="true"/>
   <field name="last_modified" type="date" indexed="true" stored="true"/>
   <field name="links" type="string" indexed="true" stored="true"
multiValued="true"/>
   <field name="text" type="text" indexed="true" stored="false"
multiValued="true"/>
   <field name="text_rev" type="text_rev" indexed="true"
stored="false" multiValued="true"/>
   <field name="manu_exact" type="string" indexed="true" stored="false"/>
   <field name="payloads" type="payloads" indexed="true" stored="true"/>
   <field name="timestamp" type="date" indexed="true" stored="true"
default="NOW" multiValued="false"/>
-- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8

-- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8
    <fieldType name="string" class="solr.StrField"
sortMissingLast="true" omitNorms="true"/>
    <fieldType name="boolean" class="solr.BoolField"
sortMissingLast="true" omitNorms="true"/>
    <fieldType name="int" class="solr.TrieIntField" precisionStep="0"
omitNorms="true" positionIncrementGap="0"/>
    <fieldType name="float" class="solr.TrieFloatField"
precisionStep="0" omitNorms="true" positionIncrementGap="0"/>
    <fieldType name="long" class="solr.TrieLongField"
precisionStep="0" omitNorms="true" positionIncrementGap="0"/>
    <fieldType name="double" class="solr.TrieDoubleField"
precisionStep="0" omitNorms="true" positionIncrementGap="0"/>
    <fieldType name="tint" class="solr.TrieIntField" precisionStep="8"
omitNorms="true" positionIncrementGap="0"/>
    <fieldType name="tfloat" class="solr.TrieFloatField"
precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
    <fieldType name="tlong" class="solr.TrieLongField"
precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
    <fieldType name="tdouble" class="solr.TrieDoubleField"
precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
    <fieldType name="date" class="solr.TrieDateField" omitNorms="true"
precisionStep="0" positionIncrementGap="0"/>
    <fieldType name="tdate" class="solr.TrieDateField"
omitNorms="true" precisionStep="6" positionIncrementGap="0"/>
    <fieldType name="pint" class="solr.IntField" omitNorms="true"/>
    <fieldType name="plong" class="solr.LongField" omitNorms="true"/>
    <fieldType name="pfloat" class="solr.FloatField" omitNorms="true"/>
    <fieldType name="pdouble" class="solr.DoubleField" omitNorms="true"/>
    <fieldType name="pdate" class="solr.DateField"
sortMissingLast="true" omitNorms="true"/>
    <fieldType name="sint" class="solr.SortableIntField"
sortMissingLast="true" omitNorms="true"/>
    <fieldType name="slong" class="solr.SortableLongField"
sortMissingLast="true" omitNorms="true"/>
    <fieldType name="sfloat" class="solr.SortableFloatField"
sortMissingLast="true" omitNorms="true"/>
    <fieldType name="sdouble" class="solr.SortableDoubleField"
sortMissingLast="true" omitNorms="true"/>
    <fieldType name="random" class="solr.RandomSortField" indexed="true" />
    <fieldType name="text_greek" class="solr.TextField">
    <fieldType name="text_ws" class="solr.TextField" positionIncrementGap="100">
    <fieldType name="text" class="solr.TextField" positionIncrementGap="100">
    <fieldType name="textTight" class="solr.TextField"
positionIncrementGap="100" >
    <fieldType name="textgen" class="solr.TextField" positionIncrementGap="100">
    <fieldType name="text_rev" class="solr.TextField"
positionIncrementGap="100">
    <fieldType name="textCharNorm" class="solr.TextField"
positionIncrementGap="100" >
    <fieldType name="alphaOnlySort" class="solr.TextField"
sortMissingLast="true" omitNorms="true">
    <fieldType name="lowercase" class="solr.TextField"
positionIncrementGap="100">
-- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8

Re: documentation on the pragmatics behind the example schema.xml

Posted by Giovanni Gherdovich <g....@gmail.com>.
Hello Erick,

2012/7/1 Erick Erickson <er...@gmail.com>:
> Your very best way of figuring this out is to use the admin/analysis
> page. [...]

thank you for this advice. I'll make myself comfortable
with the admin/analysis page.

cheers,
GGhh

Re: documentation on the pragmatics behind the example schema.xml

Posted by Erick Erickson <er...@gmail.com>.
Your very best way of figuring this out is to use the admin/analysis
page. It will show you the exact effects of each element of the analysis
chains for the field type you specify. From there it's just a matter of
getting your head around the fact that the various filters and tokenizers
can be combined in many different ways to suit your particular purpose.
Be sure to check the "verbose" checkbox!

But other than the comments in the schema file, there's no source of
documentation for the purposes of the field types that I know of.

Best
Erick

On Sat, Jun 30, 2012 at 9:51 AM, Giovanni Gherdovich
<g....@gmail.com> wrote:
> Hi all,
>
> in the example schema.xml I can find a wide variety
> of fieldType and field, already there to be used.
>
> I believe each of them has been designed for a specific
> usage case, with some pragmatics in mind.
>
> Where can I find documentation on what those field / fieldTypes
> were designed for? Is the best place to get those info
> the schema.xml file and its comments?
>
> cheers,
> GGhh
>
> here I cut and paste fields and fieldTypes I have:
>
> -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8
>    <field name="id" type="string" indexed="true" stored="true"
> required="true" />
>    <field name="sku" type="textTight" indexed="true" stored="true"
> omitNorms="true"/>
>    <field name="name" type="textgen" indexed="true" stored="true"/>
>    <field name="alphaNameSort" type="alphaOnlySort" indexed="true"
> stored="false"/>
>    <field name="manu" type="textgen" indexed="true" stored="true"
> omitNorms="true"/>
>    <field name="cat" type="text_ws" indexed="true" stored="true"
> multiValued="true" omitNorms="true" />
>    <field name="features" type="text" indexed="true" stored="true"
> multiValued="true"/>
>    <field name="includes" type="text" indexed="true" stored="true"
> termVectors="true" termPositions="true" termOffsets="true" />
>    <field name="weight" type="float" indexed="true" stored="true"/>
>    <field name="price"  type="float" indexed="true" stored="true"/>
>    <field name="popularity" type="int" indexed="true" stored="true" />
>    <field name="inStock" type="boolean" indexed="true" stored="true" />
>    <field name="title" type="text" indexed="true" stored="true"
> multiValued="true"/>
>    <field name="subject" type="text" indexed="true" stored="true"/>
>    <field name="description" type="text" indexed="true" stored="true"/>
>    <field name="comments" type="text" indexed="true" stored="true"/>
>    <field name="author" type="textgen" indexed="true" stored="true"/>
>    <field name="keywords" type="textgen" indexed="true" stored="true"/>
>    <field name="category" type="textgen" indexed="true" stored="true"/>
>    <field name="content_type" type="string" indexed="true"
> stored="true" multiValued="true"/>
>    <field name="last_modified" type="date" indexed="true" stored="true"/>
>    <field name="links" type="string" indexed="true" stored="true"
> multiValued="true"/>
>    <field name="text" type="text" indexed="true" stored="false"
> multiValued="true"/>
>    <field name="text_rev" type="text_rev" indexed="true"
> stored="false" multiValued="true"/>
>    <field name="manu_exact" type="string" indexed="true" stored="false"/>
>    <field name="payloads" type="payloads" indexed="true" stored="true"/>
>    <field name="timestamp" type="date" indexed="true" stored="true"
> default="NOW" multiValued="false"/>
> -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8
>
> -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8
>     <fieldType name="string" class="solr.StrField"
> sortMissingLast="true" omitNorms="true"/>
>     <fieldType name="boolean" class="solr.BoolField"
> sortMissingLast="true" omitNorms="true"/>
>     <fieldType name="int" class="solr.TrieIntField" precisionStep="0"
> omitNorms="true" positionIncrementGap="0"/>
>     <fieldType name="float" class="solr.TrieFloatField"
> precisionStep="0" omitNorms="true" positionIncrementGap="0"/>
>     <fieldType name="long" class="solr.TrieLongField"
> precisionStep="0" omitNorms="true" positionIncrementGap="0"/>
>     <fieldType name="double" class="solr.TrieDoubleField"
> precisionStep="0" omitNorms="true" positionIncrementGap="0"/>
>     <fieldType name="tint" class="solr.TrieIntField" precisionStep="8"
> omitNorms="true" positionIncrementGap="0"/>
>     <fieldType name="tfloat" class="solr.TrieFloatField"
> precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
>     <fieldType name="tlong" class="solr.TrieLongField"
> precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
>     <fieldType name="tdouble" class="solr.TrieDoubleField"
> precisionStep="8" omitNorms="true" positionIncrementGap="0"/>
>     <fieldType name="date" class="solr.TrieDateField" omitNorms="true"
> precisionStep="0" positionIncrementGap="0"/>
>     <fieldType name="tdate" class="solr.TrieDateField"
> omitNorms="true" precisionStep="6" positionIncrementGap="0"/>
>     <fieldType name="pint" class="solr.IntField" omitNorms="true"/>
>     <fieldType name="plong" class="solr.LongField" omitNorms="true"/>
>     <fieldType name="pfloat" class="solr.FloatField" omitNorms="true"/>
>     <fieldType name="pdouble" class="solr.DoubleField" omitNorms="true"/>
>     <fieldType name="pdate" class="solr.DateField"
> sortMissingLast="true" omitNorms="true"/>
>     <fieldType name="sint" class="solr.SortableIntField"
> sortMissingLast="true" omitNorms="true"/>
>     <fieldType name="slong" class="solr.SortableLongField"
> sortMissingLast="true" omitNorms="true"/>
>     <fieldType name="sfloat" class="solr.SortableFloatField"
> sortMissingLast="true" omitNorms="true"/>
>     <fieldType name="sdouble" class="solr.SortableDoubleField"
> sortMissingLast="true" omitNorms="true"/>
>     <fieldType name="random" class="solr.RandomSortField" indexed="true" />
>     <fieldType name="text_greek" class="solr.TextField">
>     <fieldType name="text_ws" class="solr.TextField" positionIncrementGap="100">
>     <fieldType name="text" class="solr.TextField" positionIncrementGap="100">
>     <fieldType name="textTight" class="solr.TextField"
> positionIncrementGap="100" >
>     <fieldType name="textgen" class="solr.TextField" positionIncrementGap="100">
>     <fieldType name="text_rev" class="solr.TextField"
> positionIncrementGap="100">
>     <fieldType name="textCharNorm" class="solr.TextField"
> positionIncrementGap="100" >
>     <fieldType name="alphaOnlySort" class="solr.TextField"
> sortMissingLast="true" omitNorms="true">
>     <fieldType name="lowercase" class="solr.TextField"
> positionIncrementGap="100">
> -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8  -- -- >8