On 10/23/2011 09:34 PM, Erick Erickson wrote:
Hmmm, dismax is, indeed, different. Note that dismax doesn't respect
the default operator at all, so don't be misled there.
Could you paste the debug output for both the queries? Perhaps something
will jump out at us.
Best
Erick
Thank you Erick. I've tried to paste the query results here.
The first one is the query with quotation marks ("") around the terms; it returns 6888 results.
I've hidden the explain parts of most of the results (and the timing) just to
keep the email reasonably short.
If you need to see them, let me know.
A leading "+" marks a hidden (collapsed) subtree.
Best regards,
Lauri
<lst name="responseHeader">
<int name="status">0</int>
<int name="QTime">91</int>
<lst name="params">
<str name="explainOther"/>
<str name="indent">on</str>
<str name="hl.fl"/>
<str name="wt">standard</str>
<str name="version">2.2</str>
<str name="rows">10</str>
<str name="fl">*,score</str>
<str name="debugQuery">on</str>
<str name="start">0</str>
<str name="q">"asuntojen hinnat"</str>
<str name="qt">dismax</str>
<str name="fq"/>
</lst>
</lst>
+<result name="response" numFound="6888" start="0" maxScore="3.0879765"></result>
<lst name="debug">
<lst name="queryBoosting">
<str name="q">asuntojenhinnat</str>
<null name="match"/>
</lst><str name="rawquerystring">"asuntojen hinnat"</str>
<str name="querystring">"asuntojen hinnat"</str>
<str name="parsedquery">+DisjunctionMaxQuery((table.title_t:"asuntojen
hinnat"^2.0 | title_t:"asuntojen hinnat"^2.0 | ingress_t:"asuntojen
hinnat" | (text_fi:asunto text_fi:hinta) | (table.description_fi:asunto
table.description_fi:hinta) | table.description_t:"asuntojen hinnat" |
graphic.title_t:"asuntojen hinnat"^2.0 | ((graphic.title_fi:asunto
graphic.title_fi:hinta)^2.0) | ((table.title_fi:asunto
table.title_fi:hinta)^2.0) | table.contents_t:"asuntojen hinnat" |
text_t:"asuntojen hinnat" | (ingress_fi:asunto ingress_fi:hinta) |
(table.contents_fi:asunto table.contents_fi:hinta) | ((title_fi:asunto
title_fi:hinta)^2.0))~0.01) () type:tie^6.0 type:kuv^2.0 type:tau^2.0
FunctionQuery((1.0/(3.16E-11*float(ms(const(1319437912691),date(date.modified_dt)))+1.0))^100.0)</str>
<str name="parsedquery_toString">+(table.title_t:"asuntojen hinnat"^2.0
| title_t:"asuntojen hinnat"^2.0 | ingress_t:"asuntojen hinnat" |
(text_fi:asunto text_fi:hinta) | (table.description_fi:asunto
table.description_fi:hinta) | table.description_t:"asuntojen hinnat" |
graphic.title_t:"asuntojen hinnat"^2.0 | ((graphic.title_fi:asunto
graphic.title_fi:hinta)^2.0) | ((table.title_fi:asunto
table.title_fi:hinta)^2.0) | table.contents_t:"asuntojen hinnat" |
text_t:"asuntojen hinnat" | (ingress_fi:asunto ingress_fi:hinta) |
(table.contents_fi:asunto table.contents_fi:hinta) | ((title_fi:asunto
title_fi:hinta)^2.0))~0.01 () type:tie^6.0 type:kuv^2.0 type:tau^2.0
(1.0/(3.16E-11*float(ms(const(1319437912691),date(date.modified_dt)))+1.0))^100.0</str>
<lst name="explain">
<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/07/ashi_2011_07_2011-08-26_tie_001_fi.html">
3.1653805 = (MATCH) sum of:
1.9299976 = (MATCH) max plus 0.01 times others of:
1.9211313 = weight(title_t:"asuntojen hinnat"^2.0 in 5891), product of:
0.26658234 = queryWeight(title_t:"asuntojen hinnat"^2.0), product of:
2.0 = boost
14.413042 = idf(title_t: asuntojen=250 hinnat=329)
0.009247955 = queryNorm
7.206521 = fieldWeight(title_t:"asuntojen hinnat" in 5891),
product of:
1.0 = tf(phraseFreq=1.0)
14.413042 = idf(title_t: asuntojen=250 hinnat=329)
0.5 = fieldNorm(field=title_t, doc=5891)
0.03292808 = (MATCH) sum of:
0.016520109 = (MATCH) weight(text_fi:asunto in 5891), product of:
0.044221584 = queryWeight(text_fi:asunto), product of:
4.781769 = idf(docFreq=3251, maxDocs=142742)
0.009247955 = queryNorm
0.3735757 = (MATCH) fieldWeight(text_fi:asunto in 5891),
product of:
1.0 = tf(termFreq(text_fi:asunto)=1)
4.781769 = idf(docFreq=3251, maxDocs=142742)
0.078125 = fieldNorm(field=text_fi, doc=5891)
0.016407972 = (MATCH) weight(text_fi:hinta in 5891), product of:
0.03705935 = queryWeight(text_fi:hinta), product of:
4.0073023 = idf(docFreq=7054, maxDocs=142742)
0.009247955 = queryNorm
0.44274852 = (MATCH) fieldWeight(text_fi:hinta in 5891),
product of:
1.4142135 = tf(termFreq(text_fi:hinta)=2)
4.0073023 = idf(docFreq=7054, maxDocs=142742)
0.078125 = fieldNorm(field=text_fi, doc=5891)
0.34379265 = (MATCH) sum of:
0.19207533 = (MATCH) weight(graphic.title_fi:asunto in 5891),
product of:
0.10662244 = queryWeight(graphic.title_fi:asunto), product of:
5.76465 = idf(docFreq=1216, maxDocs=142742)
0.01849591 = queryNorm
1.8014531 = (MATCH) fieldWeight(graphic.title_fi:asunto in
5891), product of:
1.0 = tf(termFreq(graphic.title_fi:asunto)=1)
5.76465 = idf(docFreq=1216, maxDocs=142742)
0.3125 = fieldNorm(field=graphic.title_fi, doc=5891)
0.15171732 = (MATCH) weight(graphic.title_fi:hinta in 5891),
product of:
0.09476117 = queryWeight(graphic.title_fi:hinta), product of:
5.1233582 = idf(docFreq=2310, maxDocs=142742)
0.01849591 = queryNorm
1.6010494 = (MATCH) fieldWeight(graphic.title_fi:hinta in
5891), product of:
1.0 = tf(termFreq(graphic.title_fi:hinta)=1)
5.1233582 = idf(docFreq=2310, maxDocs=142742)
0.3125 = fieldNorm(field=graphic.title_fi, doc=5891)
0.5099132 = (MATCH) sum of:
0.302103 = (MATCH) weight(title_fi:asunto in 5891), product of:
0.122067414 = queryWeight(title_fi:asunto), product of:
6.5996976 = idf(docFreq=527, maxDocs=142742)
0.01849591 = queryNorm
2.4748867 = (MATCH) fieldWeight(title_fi:asunto in 5891),
product of:
1.0 = tf(termFreq(title_fi:asunto)=1)
6.5996976 = idf(docFreq=527, maxDocs=142742)
0.375 = fieldNorm(field=title_fi, doc=5891)
0.2078102 = (MATCH) weight(title_fi:hinta in 5891), product of:
0.101240814 = queryWeight(title_fi:hinta), product of:
5.4736867 = idf(docFreq=1627, maxDocs=142742)
0.01849591 = queryNorm
2.0526326 = (MATCH) fieldWeight(title_fi:hinta in 5891),
product of:
1.0 = tf(termFreq(title_fi:hinta)=1)
5.4736867 = idf(docFreq=1627, maxDocs=142742)
0.375 = fieldNorm(field=title_fi, doc=5891)
0.43939918 = (MATCH) weight(type:tie^6.0 in 5891), product of:
0.156145 = queryWeight(type:tie^6.0), product of:
6.0 = boost
2.8140457 = idf(docFreq=23265, maxDocs=142742)
0.009247955 = queryNorm
2.8140457 = (MATCH) fieldWeight(type:tie in 5891), product of:
1.0 = tf(termFreq(type:tie)=1)
2.8140457 = idf(docFreq=23265, maxDocs=142742)
1.0 = fieldNorm(field=type, doc=5891)
0.7959837 = (MATCH)
FunctionQuery(1.0/(3.16E-11*float(ms(const(1319437912691),date(date.modified_dt)))+1.0)),
product of:
0.8607132 =
1.0/(3.16E-11*float(ms(const(1319437912691),date(date.modified_dt)=1314316800000))+1.0)
100.0 = boost
0.009247955 = queryNorm
</str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/08/ashi_2011_08_2011-09-30_tie_001_fi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/08/ashi_2011_08_2011-09-30_laa_001_fi.html"></str>
+<str
name="http://pxweb2.stat.fi/database/StatFin/asu/ashi/005_ashi_tau_102_fi.px"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/07/ashi_2011_07_2011-08-26_laa_001_fi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/02/ashi_2011_02_2011-07-29_laa_001_fi.html"></str>
+<str name="/media/nss/DATA2/data/wwwprod/meta/til/ashi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/02/ashi_2011_02_2011-07-29_tie_001_fi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2008/03/ashi_2008_03_2008-10-30_tie_001.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/01/ashi_2011_01_2011-04-28_laa_001_fi.html"></str>
</lst>
<str name="QParser">DisMaxQParser</str>
<null name="altquerystring"/>
<arr name="boost_queries"><str>type:tie^6 type:kuv^2 type:tau^2</str></arr>
<arr name="parsed_boost_queries"><str>type:tie^6.0 type:kuv^2.0
type:tau^2.0</str></arr>
<arr
name="boostfuncs"><str>recip(ms(NOW,date.modified_dt),3.16e-11,1,1)^100</str></arr>
<arr name="filter_queries"><str/></arr>
<arr name="parsed_filter_queries"/>
+<lst name="timing"></lst>
</lst>
******************************
This is the same query without the quotation marks; it returns 1065 results.
<lst name="responseHeader">
<int name="status">0</int>
<int name="QTime">158</int>
<lst name="params">
<str name="explainOther"/>
<str name="indent">on</str>
<str name="hl.fl"/>
<str name="wt">standard</str>
<str name="version">2.2</str>
<str name="rows">10</str>
<str name="fl">*,score</str>
<str name="debugQuery">on</str>
<str name="start">0</str>
<str name="q">asuntojen hinnat</str>
<str name="qt">dismax</str>
<str name="fq"/>
</lst>
</lst>
+<result name="response" numFound="1065" start="0"
maxScore="2.230382"></result>
<lst name="debug">
<lst name="queryBoosting"><str name="q">asuntojenhinnat</str><null
name="match"/></lst>
<str name="rawquerystring">asuntojen hinnat</str>
<str name="querystring">asuntojen hinnat</str>
<str
name="parsedquery">+((DisjunctionMaxQuery((table.title_t:asuntojen^2.0 |
title_t:asuntojen^2.0 | ingress_t:asuntojen | text_fi:asunto |
table.description_fi:asunto | table.description_t:asuntojen |
graphic.title_t:asuntojen^2.0 | graphic.title_fi:asunto^2.0 |
table.title_fi:asunto^2.0 | table.contents_t:asuntojen |
text_t:asuntojen | ingress_fi:asunto | table.contents_fi:asunto |
title_fi:asunto^2.0)~0.01) DisjunctionMaxQuery((table.title_t:hinnat^2.0
| title_t:hinnat^2.0 | ingress_t:hinnat | text_fi:hinta |
table.description_fi:hinta | table.description_t:hinnat |
graphic.title_t:hinnat^2.0 | graphic.title_fi:hinta^2.0 |
table.title_fi:hinta^2.0 | table.contents_t:hinnat | text_t:hinnat |
ingress_fi:hinta | table.contents_fi:hinta |
title_fi:hinta^2.0)~0.01))~2) () type:tie^6.0 type:kuv^2.0 type:tau^2.0
FunctionQuery((1.0/(3.16E-11*float(ms(const(1319438484878),date(date.modified_dt)))+1.0))^100.0)</str>
<str name="parsedquery_toString">+(((table.title_t:asuntojen^2.0 |
title_t:asuntojen^2.0 | ingress_t:asuntojen | text_fi:asunto |
table.description_fi:asunto | table.description_t:asuntojen |
graphic.title_t:asuntojen^2.0 | graphic.title_fi:asunto^2.0 |
table.title_fi:asunto^2.0 | table.contents_t:asuntojen |
text_t:asuntojen | ingress_fi:asunto | table.contents_fi:asunto |
title_fi:asunto^2.0)~0.01 (table.title_t:hinnat^2.0 | title_t:hinnat^2.0
| ingress_t:hinnat | text_fi:hinta | table.description_fi:hinta |
table.description_t:hinnat | graphic.title_t:hinnat^2.0 |
graphic.title_fi:hinta^2.0 | table.title_fi:hinta^2.0 |
table.contents_t:hinnat | text_t:hinnat | ingress_fi:hinta |
table.contents_fi:hinta | title_fi:hinta^2.0)~0.01)~2) () type:tie^6.0
type:kuv^2.0 type:tau^2.0
(1.0/(3.16E-11*float(ms(const(1319438484878),date(date.modified_dt)))+1.0))^100.0</str>
<lst name="explain">
<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/07/ashi_2011_07_2011-08-26_tie_001_fi.html">
2.230382 = (MATCH) sum of:
0.9582871 = (MATCH) sum of:
0.4943457 = (MATCH) max plus 0.01 times others of:
0.485919 = (MATCH) weight(title_t:asuntojen^2.0 in 2499), product of:
0.13619305 = queryWeight(title_t:asuntojen^2.0), product of:
2.0 = boost
7.1357384 = idf(docFreq=311, maxDocs=144169)
0.009543024 = queryNorm
3.5678692 = (MATCH) fieldWeight(title_t:asuntojen in 2499),
product of:
1.0 = tf(termFreq(title_t:asuntojen)=1)
7.1357384 = idf(docFreq=311, maxDocs=144169)
0.5 = fieldNorm(field=title_t, doc=2499)
0.016945006 = (MATCH) weight(text_fi:asunto in 2499), product of:
0.045495544 = queryWeight(text_fi:asunto), product of:
4.7674136 = idf(docFreq=3331, maxDocs=144169)
0.009543024 = queryNorm
0.3724542 = (MATCH) fieldWeight(text_fi:asunto in 2499),
product of:
1.0 = tf(termFreq(text_fi:asunto)=1)
4.7674136 = idf(docFreq=3331, maxDocs=144169)
0.078125 = fieldNorm(field=text_fi, doc=2499)
0.30261597 = (MATCH) weight(graphic.title_t:asuntojen^2.0 in
2499), product of:
0.13594991 = queryWeight(graphic.title_t:asuntojen^2.0),
product of:
2.0 = boost
7.122999 = idf(docFreq=315, maxDocs=144169)
0.009543024 = queryNorm
2.2259374 = (MATCH) fieldWeight(graphic.title_t:asuntojen in
2499), product of:
1.0 = tf(termFreq(graphic.title_t:asuntojen)=1)
7.122999 = idf(docFreq=315, maxDocs=144169)
0.3125 = fieldNorm(field=graphic.title_t, doc=2499)
0.1929724 = (MATCH) weight(graphic.title_fi:asunto^2.0 in 2499),
product of:
0.10856269 = queryWeight(graphic.title_fi:asunto^2.0), product of:
2.0 = boost
5.6880655 = idf(docFreq=1326, maxDocs=144169)
0.009543024 = queryNorm
1.7775204 = (MATCH) fieldWeight(graphic.title_fi:asunto in
2499), product of:
1.0 = tf(termFreq(graphic.title_fi:asunto)=1)
5.6880655 = idf(docFreq=1326, maxDocs=144169)
0.3125 = fieldNorm(field=graphic.title_fi, doc=2499)
0.030048115 = (MATCH) weight(text_t:asuntojen in 2499), product of:
0.0553052 = queryWeight(text_t:asuntojen), product of:
5.795354 = idf(docFreq=1191, maxDocs=144169)
0.009543024 = queryNorm
0.54331446 = (MATCH) fieldWeight(text_t:asuntojen in 2499),
product of:
1.0 = tf(termFreq(text_t:asuntojen)=1)
5.795354 = idf(docFreq=1191, maxDocs=144169)
0.09375 = fieldNorm(field=text_t, doc=2499)
0.30008844 = (MATCH) weight(title_fi:asunto^2.0 in 2499), product of:
0.12358535 = queryWeight(title_fi:asunto^2.0), product of:
2.0 = boost
6.4751673 = idf(docFreq=603, maxDocs=144169)
0.009543024 = queryNorm
2.4281878 = (MATCH) fieldWeight(title_fi:asunto in 2499),
product of:
1.0 = tf(termFreq(title_fi:asunto)=1)
6.4751673 = idf(docFreq=603, maxDocs=144169)
0.375 = fieldNorm(field=title_fi, doc=2499)
0.46394145 = (MATCH) max plus 0.01 times others of:
0.45908907 = (MATCH) weight(title_t:hinnat^2.0 in 2499), product of:
0.13237973 = queryWeight(title_t:hinnat^2.0), product of:
2.0 = boost
6.935942 = idf(docFreq=380, maxDocs=144169)
0.009543024 = queryNorm
3.467971 = (MATCH) fieldWeight(title_t:hinnat in 2499), product of:
1.0 = tf(termFreq(title_t:hinnat)=1)
6.935942 = idf(docFreq=380, maxDocs=144169)
0.5 = fieldNorm(field=title_t, doc=2499)
0.10328812 = (MATCH) weight(ingress_t:hinnat in 2499), product of:
0.06279112 = queryWeight(ingress_t:hinnat), product of:
6.579792 = idf(docFreq=543, maxDocs=144169)
0.009543024 = queryNorm
1.644948 = (MATCH) fieldWeight(ingress_t:hinnat in 2499),
product of:
2.0 = tf(termFreq(ingress_t:hinnat)=4)
6.579792 = idf(docFreq=543, maxDocs=144169)
0.125 = fieldNorm(field=ingress_t, doc=2499)
0.01690726 = (MATCH) weight(text_fi:hinta in 2499), product of:
0.038214408 = queryWeight(text_fi:hinta), product of:
4.0044336 = idf(docFreq=7145, maxDocs=144169)
0.009543024 = queryNorm
0.44243157 = (MATCH) fieldWeight(text_fi:hinta in 2499),
product of:
1.4142135 = tf(termFreq(text_fi:hinta)=2)
4.0044336 = idf(docFreq=7145, maxDocs=144169)
0.078125 = fieldNorm(field=text_fi, doc=2499)
0.15190975 = (MATCH) weight(graphic.title_fi:hinta^2.0 in 2499),
product of:
0.096322075 = queryWeight(graphic.title_fi:hinta^2.0), product of:
2.0 = boost
5.046727 = idf(docFreq=2519, maxDocs=144169)
0.009543024 = queryNorm
1.5771022 = (MATCH) fieldWeight(graphic.title_fi:hinta in
2499), product of:
1.0 = tf(termFreq(graphic.title_fi:hinta)=1)
5.046727 = idf(docFreq=2519, maxDocs=144169)
0.3125 = fieldNorm(field=graphic.title_fi, doc=2499)
0.21313253 = (MATCH) weight(title_fi:hinta^2.0 in 2499), product of:
0.10415191 = queryWeight(title_fi:hinta^2.0), product of:
2.0 = boost
5.456966 = idf(docFreq=1671, maxDocs=144169)
0.009543024 = queryNorm
2.0463622 = (MATCH) fieldWeight(title_fi:hinta in 2499),
product of:
1.0 = tf(termFreq(title_fi:hinta)=1)
5.456966 = idf(docFreq=1671, maxDocs=144169)
0.375 = fieldNorm(field=title_fi, doc=2499)
0.450727 = (MATCH) weight(type:tie^6.0 in 2499), product of:
0.16064803 = queryWeight(type:tie^6.0), product of:
6.0 = boost
2.80568 = idf(docFreq=23695, maxDocs=144169)
0.009543024 = queryNorm
2.80568 = (MATCH) fieldWeight(type:tie in 2499), product of:
1.0 = tf(termFreq(type:tie)=1)
2.80568 = idf(docFreq=23695, maxDocs=144169)
1.0 = fieldNorm(field=type, doc=2499)
0.8213679 = (MATCH)
FunctionQuery(1.0/(3.16E-11*float(ms(const(1319438484878),date(date.modified_dt)))+1.0)),
product of:
0.86069983 =
1.0/(3.16E-11*float(ms(const(1319438484878),date(date.modified_dt)=1314316800000))+1.0)
100.0 = boost
0.009543024 = queryNorm
</str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/08/ashi_2011_08_2011-09-30_tie_001_fi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/02/ashi_2011_02_2011-07-29_tie_001_fi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/08/ashi_2011_08_2011-09-30_laa_001_fi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/01/ashi_2011_01_2011-04-28_tie_001_fi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/07/ashi_2011_07_2011-08-26_laa_001_fi.html"></str>
+<str
name="http://pxweb2.stat.fi/database/StatFin/asu/ashi/005_ashi_tau_102_fi.px"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2011/02/ashi_2011_02_2011-07-29_laa_001_fi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/asvu/2010/05/asvu_2010_05_2011-06-23_tie_001_fi.html"></str>
+<str
name="/media/nss/DATA2/data/wwwprod/til/ashi/2010/04/ashi_2010_04_2011-01-28_tie_001_fi.html"></str>
</lst>
<str name="QParser">DisMaxQParser</str>
<null name="altquerystring"/>
<arr name="boost_queries"><str>type:tie^6 type:kuv^2 type:tau^2</str></arr>
<arr name="parsed_boost_queries"><str>type:tie^6.0 type:kuv^2.0
type:tau^2.0</str></arr>
<arr
name="boostfuncs"><str>recip(ms(NOW,date.modified_dt),3.16e-11,1,1)^100</str></arr>
<arr name="filter_queries"><str/></arr>
<arr name="parsed_filter_queries"/>
+<lst name="timing"></lst>
</lst>