Skip to content

Commit 896292e

Browse files
committed
Tweak indexing.
1 parent 8ca3ab0 commit 896292e

1 file changed

Lines changed: 31 additions & 3 deletions

File tree

search-server/typesense-scraper/typesense-scraper-config.json

Lines changed: 31 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -3,18 +3,46 @@
33
"allowed_domains": ["172.17.0.2","reference.servicestack.net"],
44
"start_urls": [
55
{
6-
"url": "https://reference.servicestack.net/"
6+
"url": "https://reference.servicestack.net/api/ServiceStack.Blazor/"
7+
},
8+
{
9+
"url": "https://reference.servicestack.net/api/ServiceStack.Blazor.Components/"
10+
},
11+
{
12+
"url": "https://reference.servicestack.net/api/ServiceStack.Blazor.Components.Tailwind/"
713
}
814
],
915
"selectors": {
1016
"default": {
11-
"lvl0": ".theme-doc-sidebar-item-link-level-2 .menu__link--active",
17+
"lvl0": {
18+
"selector": "(//ul[contains(@class,'menu__list')]//a[contains(@class, 'menu__link menu__link--sublist menu__link--active')]/text() | //nav[contains(@class, 'navbar')]//a[contains(@class, 'navbar__link--active')]/text())[last()]",
19+
"type": "xpath",
20+
"global": true,
21+
"default_value": "Documentation"
22+
},
1223
"lvl1": "article h1",
1324
"lvl2": "article h3",
1425
"lvl3": "article h5, article td:first-child",
1526
"text": "article p, article li, article td:last-child"
1627
}
1728
},
1829
"scrape_start_urls": false,
19-
"strip_chars": " .,;:#"
30+
"strip_chars": " .,;:#",
31+
"custom_settings": {
32+
"separatorsToIndex": "_",
33+
"attributesForFaceting": [
34+
"language",
35+
"version",
36+
"type",
37+
"docusaurus_tag"
38+
],
39+
"attributesToRetrieve": [
40+
"hierarchy",
41+
"content",
42+
"anchor",
43+
"url",
44+
"url_without_anchor",
45+
"type"
46+
]
47+
}
2048
}

0 commit comments

Comments
 (0)