Ok, so i've been working on updating the ref guide to account for the new way to run the "examples" in 5.0.

The spell checking page...

        https://cwiki.apache.org/confluence/display/solr/Spell+Checking

...has some examples that loosely correlate to the "techproducts" example, but even if you ignore the specifics of those examples, i need help understanding the basic behavior of the spellchecker as configured in the techproducts example.

Assuming you run this...

        bin/solr -e techproducts

....with that example running & those docs indexed, this URL gives me results i can't explain...

http://localhost:8983/solr/techproducts/spell?spellcheck.q=hell+ultrashar&df=text&spellcheck=true&spellcheck.build=true

(see below)

1) "dell" is not listed as a possible suggestion for "hell" (even if the dictionary thinks "hold" is a better suggestion, why isn't "dell" even included in the list of possibilities?)

2) in the "collation" section, i can't make any sense of what these results mean -- how is "hello ultrasharp" a suggested collationQuery when *none* of the example docs contain both "hello" and "ultrasharp" ?

http://localhost:8983/solr/techproducts/select?df=text&q=%2Bhello+%2Bultrasharp


So WTF is up with these spell check results?


<?xml version="1.0" encoding="UTF-8"?>
<response>

<lst name="responseHeader">
  <int name="status">0</int>
  <int name="QTime">15</int>
</lst>
<str name="command">build</str>
<result name="response" numFound="0" start="0">
</result>
<lst name="spellcheck">
  <lst name="suggestions">
    <lst name="hell">
      <int name="numFound">6</int>
      <int name="startOffset">0</int>
      <int name="endOffset">4</int>
      <int name="origFreq">0</int>
      <arr name="suggestion">
        <lst>
          <str name="word">hello</str>
          <int name="freq">1</int>
        </lst>
        <lst>
          <str name="word">here</str>
          <int name="freq">2</int>
        </lst>
        <lst>
          <str name="word">heat</str>
          <int name="freq">1</int>
        </lst>
        <lst>
          <str name="word">hold</str>
          <int name="freq">1</int>
        </lst>
        <lst>
          <str name="word">html</str>
          <int name="freq">1</int>
        </lst>
        <lst>
          <str name="word">héllo</str>
          <int name="freq">1</int>
        </lst>
      </arr>
    </lst>
    <lst name="ultrashar">
      <int name="numFound">1</int>
      <int name="startOffset">5</int>
      <int name="endOffset">14</int>
      <int name="origFreq">0</int>
      <arr name="suggestion">
        <lst>
          <str name="word">ultrasharp</str>
          <int name="freq">1</int>
        </lst>
      </arr>
    </lst>
  </lst>
  <bool name="correctlySpelled">false</bool>
  <lst name="collations">
    <lst name="collation">
      <str name="collationQuery">hello ultrasharp</str>
      <int name="hits">2</int>
      <lst name="misspellingsAndCorrections">
        <str name="hell">hello</str>
        <str name="ultrashar">ultrasharp</str>
      </lst>
    </lst>
    <lst name="collation">
      <str name="collationQuery">here ultrasharp</str>
      <int name="hits">3</int>
      <lst name="misspellingsAndCorrections">
        <str name="hell">here</str>
        <str name="ultrashar">ultrasharp</str>
      </lst>
    </lst>
    <lst name="collation">
      <str name="collationQuery">heat ultrasharp</str>
      <int name="hits">2</int>
      <lst name="misspellingsAndCorrections">
        <str name="hell">heat</str>
        <str name="ultrashar">ultrasharp</str>
      </lst>
    </lst>
    <lst name="collation">
      <str name="collationQuery">hold ultrasharp</str>
      <int name="hits">2</int>
      <lst name="misspellingsAndCorrections">
        <str name="hell">hold</str>
        <str name="ultrashar">ultrasharp</str>
      </lst>
    </lst>
    <lst name="collation">
      <str name="collationQuery">html ultrasharp</str>
      <int name="hits">2</int>
      <lst name="misspellingsAndCorrections">
        <str name="hell">html</str>
        <str name="ultrashar">ultrasharp</str>
      </lst>
    </lst>
  </lst>
</lst>
</response>






-Hoss
http://www.lucidworks.com/

Reply via email to