Hi - You should stick to Nutch's schema.xml and not manually add text or body 
fields that aren't going to be populated anyway. Nutch sends data, by default, 
to the content field.
  
-----Original message-----
> From:Rafał Kuć <r....@solr.pl>
> Sent: Tue 09-Oct-2012 14:32
> To: solr-user@lucene.apache.org
> Subject: Re: Search in body
> 
> Hello!
> 
> I assume you've added the body field, but you don't populate it. As
> far as I remember, Nutch doesn't fill the body field by default. What
> are you expecting to have in the body field?
> 
> -- 
> Regards,
>  Rafał Kuć
>  Sematext :: http://sematext.com/ :: Solr - Lucene - Nutch - ElasticSearch
> 
> > I've just indexed again, and no luck.
> 
> > Below is my schema
> 
> > <schema name="nutch" version="1.4">
> >      <types>
> >          <fieldType name="string" class="solr.StrField" 
> > sortMissingLast="true"
> >              omitNorms="true"/>
> >          <fieldType name="long" class="solr.TrieLongField" precisionStep="0"
> >              omitNorms="true" positionIncrementGap="0"/>
> >          <fieldType name="float" class="solr.TrieFloatField" 
> > precisionStep="0"
> >              omitNorms="true" positionIncrementGap="0"/>
> >          <fieldType name="date" class="solr.TrieDateField" precisionStep="0"
> >              omitNorms="true" positionIncrementGap="0"/>
> 
> >          <fieldType name="text" class="solr.TextField"
> >              positionIncrementGap="100">
> >              <analyzer>
> >                  <tokenizer class="solr.WhitespaceTokenizerFactory"/>
> >                  <filter class="solr.StopFilterFactory"
> >                      ignoreCase="true" words="stopwords.txt"/>
> >                  <filter class="solr.WordDelimiterFilterFactory"
> >                      generateWordParts="1" generateNumberParts="1"
> >                      catenateWords="1" catenateNumbers="1" catenateAll="0"
> >                      splitOnCaseChange="1"/>
> >                  <filter class="solr.LowerCaseFilterFactory"/>
> >                  <filter class="solr.EnglishPorterFilterFactory"
> >                      protected="protwords.txt"/>
> >                  <filter
> > class="solr.RemoveDuplicatesTokenFilterFactory"/>
> >              </analyzer>
> >          </fieldType>
> >          <fieldType name="url" class="solr.TextField"
> >              positionIncrementGap="100">
> >              <analyzer>
> >                  <tokenizer class="solr.StandardTokenizerFactory"/>
> >                  <filter class="solr.LowerCaseFilterFactory"/>
> >                  <filter class="solr.WordDelimiterFilterFactory"
> >                      generateWordParts="1" generateNumberParts="1"/>
> >              </analyzer>
> >          </fieldType>
> >      </types>
> >      <fields>
> >          <field name="id" type="string" stored="true" indexed="true"/>
> 
> >          <!-- core fields -->
> >          <field name="segment" type="string" stored="true" indexed="false"/>
> >          <field name="digest" type="string" stored="true" indexed="false"/>
> >          <field name="boost" type="float" stored="true" indexed="false"/>
> 
> >          <!-- fields for index-basic plugin -->
> >          <field name="host" type="string" stored="false" indexed="true"/>
> >          <field name="url" type="url" stored="true" indexed="true"
> >              required="true"/>
> >          <field name="content" type="text" stored="false" indexed="true"/>
> >          <field name="title" type="text" stored="true" indexed="true"/>
> >          <field name="text" type="text" stored="true" indexed="true"/>
> >          <field name="body" type="text" stored="true" indexed="true"/>
> >          <field name="cache" type="string" stored="true" indexed="false"/>
> >          <field name="tstamp" type="date" stored="true" indexed="false"/>
> 
> >          <!-- fields for index-anchor plugin -->
> >          <field name="anchor" type="string" stored="true" indexed="true"
> >              multiValued="true"/>
> 
> >          <!-- fields for index-more plugin -->
> >          <field name="type" type="string" stored="true" indexed="true"
> >              multiValued="true"/>
> >          <field name="contentLength" type="long" stored="true"
> >              indexed="false"/>
> >          <field name="lastModified" type="date" stored="true"
> >              indexed="false"/>
> >          <field name="date" type="date" stored="true" indexed="true"/>
> 
> >          <!-- fields for languageidentifier plugin -->
> >          <field name="lang" type="string" stored="true" indexed="true"/>
> 
> >          <!-- fields for subcollection plugin -->
> >          <field name="subcollection" type="string" stored="true"
> >              indexed="true" multiValued="true"/>
> 
> >          <!-- fields for feed plugin (tag is also used by 
> > microformats-reltag)-->
> >          <field name="author" type="string" stored="true" indexed="true"/>
> >          <field name="tag" type="string" stored="true" indexed="true" 
> > multiValued="true"/>
> >          <field name="feed" type="string" stored="true" indexed="true"/>
> >          <field name="publishedDate" type="date" stored="true"
> >              indexed="true"/>
> >          <field name="updatedDate" type="date" stored="true"
> >              indexed="true"/>
> 
> >          <!-- fields for creativecommons plugin -->
> >          <field name="cc" type="string" stored="true" indexed="true"
> >              multiValued="true"/>
> >      </fields>
> >      <uniqueKey>id</uniqueKey>
> >      <defaultSearchField>content</defaultSearchField>
> >      <solrQueryParser defaultOperator="OR"/>
> > </schema>
> 
> > I don't know how to show you example data, my URL is 
> > http://www.sabanciuniv.edu
> 
> > Regards,
> 
> > On 10/09/2012 02:58 PM, Rafał Kuć wrote:
> >> Hello!
> >>
> >> After altering your schema.xml, have you indexed your documents again?
> >>
> >> It would be nice to see what your schema.xml looks like and an example of
> >> the data, because otherwise we can only guess.
> >>
> 
> 

Reply via email to