This is an automated email from the ASF dual-hosted git repository. kxiao pushed a commit to branch master in repository https://gitbox.apache.org/repos/asf/doris-website.git
The following commit(s) were added to refs/heads/master by this push: new b350d2b0a9b Update the description of the usage of match_phrase_prefix. (#1726) b350d2b0a9b is described below commit b350d2b0a9bccc8534b77b3338a12c4efb0317d6 Author: zzzxl <yangs...@selectdb.com> AuthorDate: Thu Jan 9 10:26:36 2025 +0800 Update the description of the usage of match_phrase_prefix. (#1726) --- docs/table-design/index/inverted-index.md | 1 + .../current/table-design/index/inverted-index.md | 1 + .../version-2.0/table-design/index/inverted-index.md | 1 + .../version-2.1/table-design/index/inverted-index.md | 1 + .../version-3.0/table-design/index/inverted-index.md | 1 + versioned_docs/version-2.0/table-design/index/inverted-index.md | 1 + versioned_docs/version-2.1/table-design/index/inverted-index.md | 1 + versioned_docs/version-3.0/table-design/index/inverted-index.md | 1 + 8 files changed, 8 insertions(+) diff --git a/docs/table-design/index/inverted-index.md b/docs/table-design/index/inverted-index.md index 4b5adfa771c..c0213223f3e 100644 --- a/docs/table-design/index/inverted-index.md +++ b/docs/table-design/index/inverted-index.md @@ -302,6 +302,7 @@ SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3'; SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3+'; -- 2.3 Prefix matching the last word keyword2, with a default limit of 50 prefixes (controlled by session variable inverted_index_max_expansions) +-- It is necessary to ensure that keyword1 and keyword2 remain adjacent in the original text after tokenization, with no other words in between. 
-- 'keyword1 keyword2abc' matches because keyword1 is identical and keyword2 is a prefix of keyword2abc -- 'keyword1 keyword2' also matches because keyword2 is a prefix of keyword2 -- 'keyword1 keyword3' does not match because keyword2 is not a prefix of keyword3 diff --git a/i18n/zh-CN/docusaurus-plugin-content-docs/current/table-design/index/inverted-index.md b/i18n/zh-CN/docusaurus-plugin-content-docs/current/table-design/index/inverted-index.md index 98dc525b983..78b3da13ceb 100644 --- a/i18n/zh-CN/docusaurus-plugin-content-docs/current/table-design/index/inverted-index.md +++ b/i18n/zh-CN/docusaurus-plugin-content-docs/current/table-design/index/inverted-index.md @@ -305,6 +305,7 @@ SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3'; SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3+'; -- 2.3 在保持词顺序的前提下,对最后一个词 keyword2 做前缀匹配,默认找 50 个前缀词(session 变量 inverted_index_max_expansions 控制) +-- 需要保证 keyword1, keyword2 在原文分词后也是相邻的,不能中间有其他词 -- 'keyword1 keyword2abc' 能匹配,因为 keyword1 完全一样,最后一个 keyword2abc 是 keyword2 的前缀 -- 'keyword1 keyword2' 也能匹配,因为 keyword2 也是 keyword2 的前缀 -- 'keyword1 keyword3' 不能匹配,因为 keyword3 不是 keyword2 的前缀 diff --git a/i18n/zh-CN/docusaurus-plugin-content-docs/version-2.0/table-design/index/inverted-index.md b/i18n/zh-CN/docusaurus-plugin-content-docs/version-2.0/table-design/index/inverted-index.md index 00074fa14b3..4f1d1b8d25c 100644 --- a/i18n/zh-CN/docusaurus-plugin-content-docs/version-2.0/table-design/index/inverted-index.md +++ b/i18n/zh-CN/docusaurus-plugin-content-docs/version-2.0/table-design/index/inverted-index.md @@ -305,6 +305,7 @@ SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3'; SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3+'; -- 2.3 在保持词顺序的前提下,对最后一个词 keyword2 做前缀匹配,默认找 50 个前缀词(session 变量 inverted_index_max_expansions 控制) +-- 需要保证 keyword1, keyword2 在原文分词后也是相邻的,不能中间有其他词 -- 'keyword1 keyword2abc' 能匹配,因为 keyword1 完全一样,最后一个 keyword2abc 
是 keyword2 的前缀 -- 'keyword1 keyword2' 也能匹配,因为 keyword2 也是 keyword2 的前缀 -- 'keyword1 keyword3' 不能匹配,因为 keyword3 不是 keyword2 的前缀 diff --git a/i18n/zh-CN/docusaurus-plugin-content-docs/version-2.1/table-design/index/inverted-index.md b/i18n/zh-CN/docusaurus-plugin-content-docs/version-2.1/table-design/index/inverted-index.md index 43e12d40b58..6666a347a35 100644 --- a/i18n/zh-CN/docusaurus-plugin-content-docs/version-2.1/table-design/index/inverted-index.md +++ b/i18n/zh-CN/docusaurus-plugin-content-docs/version-2.1/table-design/index/inverted-index.md @@ -305,6 +305,7 @@ SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3'; SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3+'; -- 2.3 在保持词顺序的前提下,对最后一个词 keyword2 做前缀匹配,默认找 50 个前缀词(session 变量 inverted_index_max_expansions 控制) +-- 需要保证 keyword1, keyword2 在原文分词后也是相邻的,不能中间有其他词 -- 'keyword1 keyword2abc' 能匹配,因为 keyword1 完全一样,最后一个 keyword2abc 是 keyword2 的前缀 -- 'keyword1 keyword2' 也能匹配,因为 keyword2 也是 keyword2 的前缀 -- 'keyword1 keyword3' 不能匹配,因为 keyword3 不是 keyword2 的前缀 diff --git a/i18n/zh-CN/docusaurus-plugin-content-docs/version-3.0/table-design/index/inverted-index.md b/i18n/zh-CN/docusaurus-plugin-content-docs/version-3.0/table-design/index/inverted-index.md index 98dc525b983..78b3da13ceb 100644 --- a/i18n/zh-CN/docusaurus-plugin-content-docs/version-3.0/table-design/index/inverted-index.md +++ b/i18n/zh-CN/docusaurus-plugin-content-docs/version-3.0/table-design/index/inverted-index.md @@ -305,6 +305,7 @@ SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3'; SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3+'; -- 2.3 在保持词顺序的前提下,对最后一个词 keyword2 做前缀匹配,默认找 50 个前缀词(session 变量 inverted_index_max_expansions 控制) +-- 需要保证 keyword1, keyword2 在原文分词后也是相邻的,不能中间有其他词 -- 'keyword1 keyword2abc' 能匹配,因为 keyword1 完全一样,最后一个 keyword2abc 是 keyword2 的前缀 -- 'keyword1 keyword2' 也能匹配,因为 keyword2 也是 keyword2 的前缀 -- 'keyword1 keyword3' 不能匹配,因为 keyword3 不是 
keyword2 的前缀 diff --git a/versioned_docs/version-2.0/table-design/index/inverted-index.md b/versioned_docs/version-2.0/table-design/index/inverted-index.md index 11fe799e9e8..2411fcb137d 100644 --- a/versioned_docs/version-2.0/table-design/index/inverted-index.md +++ b/versioned_docs/version-2.0/table-design/index/inverted-index.md @@ -302,6 +302,7 @@ SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3'; SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3+'; -- 2.3 Prefix matching the last word keyword2, with a default limit of 50 prefixes (controlled by session variable inverted_index_max_expansions) +-- It is necessary to ensure that keyword1 and keyword2 remain adjacent in the original text after tokenization, with no other words in between. -- 'keyword1 keyword2abc' matches because keyword1 is identical and keyword2 is a prefix of keyword2abc -- 'keyword1 keyword2' also matches because keyword2 is a prefix of keyword2 -- 'keyword1 keyword3' does not match because keyword2 is not a prefix of keyword3 diff --git a/versioned_docs/version-2.1/table-design/index/inverted-index.md b/versioned_docs/version-2.1/table-design/index/inverted-index.md index fae75d68110..7e86a2bd50d 100644 --- a/versioned_docs/version-2.1/table-design/index/inverted-index.md +++ b/versioned_docs/version-2.1/table-design/index/inverted-index.md @@ -299,6 +299,7 @@ SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3'; SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3+'; -- 2.3 Prefix matching the last word keyword2, with a default limit of 50 prefixes (controlled by session variable inverted_index_max_expansions) +-- It is necessary to ensure that keyword1 and keyword2 remain adjacent in the original text after tokenization, with no other words in between. 
-- 'keyword1 keyword2abc' matches because keyword1 is identical and keyword2 is a prefix of keyword2abc -- 'keyword1 keyword2' also matches because keyword2 is a prefix of keyword2 -- 'keyword1 keyword3' does not match because keyword2 is not a prefix of keyword3 diff --git a/versioned_docs/version-3.0/table-design/index/inverted-index.md b/versioned_docs/version-3.0/table-design/index/inverted-index.md index 4b5adfa771c..c0213223f3e 100644 --- a/versioned_docs/version-3.0/table-design/index/inverted-index.md +++ b/versioned_docs/version-3.0/table-design/index/inverted-index.md @@ -302,6 +302,7 @@ SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3'; SELECT * FROM table_name WHERE content MATCH_PHRASE 'keyword1 keyword2 ~3+'; -- 2.3 Prefix matching the last word keyword2, with a default limit of 50 prefixes (controlled by session variable inverted_index_max_expansions) +-- It is necessary to ensure that keyword1 and keyword2 remain adjacent in the original text after tokenization, with no other words in between. -- 'keyword1 keyword2abc' matches because keyword1 is identical and keyword2 is a prefix of keyword2abc -- 'keyword1 keyword2' also matches because keyword2 is a prefix of keyword2 -- 'keyword1 keyword3' does not match because keyword2 is not a prefix of keyword3 --------------------------------------------------------------------- To unsubscribe, e-mail: commits-unsubscr...@doris.apache.org For additional commands, e-mail: commits-h...@doris.apache.org