Hello!

I assume you've added the body field, but you don't populate it. As
far as I remember, Nutch doesn't fill the body field by default. What
are you expecting to have in the body field?

-- 
Regards,
 Rafał Kuć
 Sematext :: http://sematext.com/ :: Solr - Lucene - Nutch - ElasticSearch

> I've just indexed again, and no luck.

> Below is my schema

> <schema name="nutch" version="1.4">
>      <types>
>          <fieldType name="string" class="solr.StrField" 
> sortMissingLast="true"
>              omitNorms="true"/>
>          <fieldType name="long" class="solr.TrieLongField" precisionStep="0"
>              omitNorms="true" positionIncrementGap="0"/>
>          <fieldType name="float" class="solr.TrieFloatField" 
> precisionStep="0"
>              omitNorms="true" positionIncrementGap="0"/>
>          <fieldType name="date" class="solr.TrieDateField" precisionStep="0"
>              omitNorms="true" positionIncrementGap="0"/>

>          <fieldType name="text" class="solr.TextField"
>              positionIncrementGap="100">
>              <analyzer>
>                  <tokenizer class="solr.WhitespaceTokenizerFactory"/>
>                  <filter class="solr.StopFilterFactory"
>                      ignoreCase="true" words="stopwords.txt"/>
>                  <filter class="solr.WordDelimiterFilterFactory"
>                      generateWordParts="1" generateNumberParts="1"
>                      catenateWords="1" catenateNumbers="1" catenateAll="0"
>                      splitOnCaseChange="1"/>
>                  <filter class="solr.LowerCaseFilterFactory"/>
>                  <filter class="solr.EnglishPorterFilterFactory"
>                      protected="protwords.txt"/>
>                  <filter
> class="solr.RemoveDuplicatesTokenFilterFactory"/>
>              </analyzer>
>          </fieldType>
>          <fieldType name="url" class="solr.TextField"
>              positionIncrementGap="100">
>              <analyzer>
>                  <tokenizer class="solr.StandardTokenizerFactory"/>
>                  <filter class="solr.LowerCaseFilterFactory"/>
>                  <filter class="solr.WordDelimiterFilterFactory"
>                      generateWordParts="1" generateNumberParts="1"/>
>              </analyzer>
>          </fieldType>
>      </types>
>      <fields>
>          <field name="id" type="string" stored="true" indexed="true"/>

>          <!-- core fields -->
>          <field name="segment" type="string" stored="true" indexed="false"/>
>          <field name="digest" type="string" stored="true" indexed="false"/>
>          <field name="boost" type="float" stored="true" indexed="false"/>

>          <!-- fields for index-basic plugin -->
>          <field name="host" type="string" stored="false" indexed="true"/>
>          <field name="url" type="url" stored="true" indexed="true"
>              required="true"/>
>          <field name="content" type="text" stored="false" indexed="true"/>
>          <field name="title" type="text" stored="true" indexed="true"/>
>          <field name="text" type="text" stored="true" indexed="true"/>
>          <field name="body" type="text" stored="true" indexed="true"/>
>          <field name="cache" type="string" stored="true" indexed="false"/>
>          <field name="tstamp" type="date" stored="true" indexed="false"/>

>          <!-- fields for index-anchor plugin -->
>          <field name="anchor" type="string" stored="true" indexed="true"
>              multiValued="true"/>

>          <!-- fields for index-more plugin -->
>          <field name="type" type="string" stored="true" indexed="true"
>              multiValued="true"/>
>          <field name="contentLength" type="long" stored="true"
>              indexed="false"/>
>          <field name="lastModified" type="date" stored="true"
>              indexed="false"/>
>          <field name="date" type="date" stored="true" indexed="true"/>

>          <!-- fields for languageidentifier plugin -->
>          <field name="lang" type="string" stored="true" indexed="true"/>

>          <!-- fields for subcollection plugin -->
>          <field name="subcollection" type="string" stored="true"
>              indexed="true" multiValued="true"/>

>          <!-- fields for feed plugin (tag is also used by 
> microformats-reltag)-->
>          <field name="author" type="string" stored="true" indexed="true"/>
>          <field name="tag" type="string" stored="true" indexed="true" 
> multiValued="true"/>
>          <field name="feed" type="string" stored="true" indexed="true"/>
>          <field name="publishedDate" type="date" stored="true"
>              indexed="true"/>
>          <field name="updatedDate" type="date" stored="true"
>              indexed="true"/>

>          <!-- fields for creativecommons plugin -->
>          <field name="cc" type="string" stored="true" indexed="true"
>              multiValued="true"/>
>      </fields>
>      <uniqueKey>id</uniqueKey>
>      <defaultSearchField>content</defaultSearchField>
>      <solrQueryParser defaultOperator="OR"/>
> </schema>

> I don't know how to show you example data, my URL is 
> http://www.sabanciuniv.edu

> Regards,

> On 10/09/2012 02:58 PM, Rafał Kuć wrote:
>> Hello!
>>
>> After altering your schema.xml, have you indexed your documents again?
>>
>> It would be nice to see what your schema.xml looks like and an example of
>> the data, because otherwise we can only guess.
>>

Reply via email to