Copilot commented on code in PR #1473:
URL: https://github.com/apache/camel-website/pull/1473#discussion_r2693908652


##########
.docsearch.config.json:
##########
@@ -0,0 +1,125 @@
+{
+  "index": {
+    "name": "apache_camel",
+    "startUrls": [
+      "https://camel.apache.org/"
+    ],
+    "ignoreCanonicalTo": false,
+    "pathsToMatch": [
+      "https://camel.apache.org/**"
+    ],
+    "pathsToIgnore": [
+      "https://camel.apache.org/search",
+      "https://camel.apache.org/404.html"
+    ],
+    "includeHeadingLevels": [1, 2, 3, 4, 5, 6],
+    "stripQueryParameters": true
+  },
+  "crawler": {
+    "userAgent": "Algolia Crawler",
+    "maxDepth": 20,
+    "maxUrls": 50000,
+    "waitUntilFired": true,
+    "timeoutMs": 30000,
+    "sitemapUrls": [
+      "https://camel.apache.org/sitemap.xml"
+    ],
+    "ignoreRobotsTxt": false,
+    "allowedDomains": [
+      "camel.apache.org"
+    ]
+  },
+  "selectors": {
+    "lvl0": {
+      "selector": "h1",
+      "global": true,
+      "default_value": "Documentation"
+    },
+    "lvl1": "h2",
+    "lvl2": "h3",
+    "lvl3": "h4",
+    "lvl4": "h5",
+    "lvl5": "h6",
+    "text": "p, li, td, th, dt, dd, span:not(.tooltip), div:not([class*='hidden']), table tbody, code, pre"
+  },
+  "selectors_exclude": [
+    ".no_index",
+    "[data-no-index]",
+    ".sidebar",
+    ".breadcrumb",
+    "nav",
+    ".navbar",
+    ".menu",
+    ".toc",
+    "footer",
+    ".footer",
+    ".copyright",
+    ".hide",
+    ".hidden",
+    "[aria-hidden='true']",
+    "script",
+    "style",
+    ".language-toggle",
+    ".sidebar-toggle"
+  ],
+  "min_indexed_level": 1,
+  "only_content_level": false,
+  "start_urls": [
+    {
+      "url": "https://camel.apache.org/components/next/",
+      "page_rank": 5
+    },
+    {
+      "url": "https://camel.apache.org/components/latest/",
+      "page_rank": 5
+    },
+    {
+      "url": "https://camel.apache.org/components/\\d+\\.\\d+\\.x/",

Review Comment:
   The regex pattern `\\d+\\.\\d+\\.x` matches a literal `x` as the last version
segment (for example `4.4.x`); the `x` is not treated as a wildcard. If the
intent is to match concrete versions such as `4.4.0` or `4.10.5`, the pattern
should be `\\d+\\.\\d+\\.\\d+`. If the actual URLs do contain a literal `x`
(like `/4.4.x/`), then the pattern is correct as written, but this should be
verified against the actual URL structure.



-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: commits-unsubscribe@camel.apache.org

For queries about this service, please contact Infrastructure at:
users@infra.apache.org

Reply via email to