-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcrawlerConfig.json
97 lines (97 loc) · 3.1 KB
/
crawlerConfig.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
{
  "appId": "52C6J0MS4V",
  "apiKey": "816dc34de3e9c7f6b2d4f95bb85ba4a5",
  "rateLimit": 8,
  "startUrls": ["https://worldtravel-83q.pages.dev/"],
  "renderJavaScript": false,
  "sitemaps": [],
  "exclusionPatterns": [],
  "ignoreCanonicalTo": false,
  "discoveryPatterns": ["https://worldtravel-83q.pages.dev/**"],
  "schedule": "at 05:10 on Saturday",
  "actions": [
    {
      "indexName": "worldtravel",
      "pathsToMatch": ["https://worldtravel-83q.pages.dev/**"],
      "recordExtractor": {
        "type": "selectorContent",
        "selectors": [
          "title",
          ".content h1",
          ".content h2",
          ".content h3",
          ".content h4",
          ".content h5",
          ".content p",
          ".content li"
        ]
      }
    }
  ],
  "initialIndexSettings": {
    "worldtravel": {
      "attributesForFaceting": ["type", "lang"],
      "attributesToRetrieve": ["hierarchy", "content", "anchor", "url"],
      "attributesToHighlight": ["hierarchy", "hierarchy_camel", "content"],
      "attributesToSnippet": ["content:10"],
      "camelCaseAttributes": ["hierarchy", "hierarchy_radio", "content"],
      "searchableAttributes": [
        "unordered(hierarchy_radio_camel.lvl0)",
        "unordered(hierarchy_radio.lvl0)",
        "unordered(hierarchy_radio_camel.lvl1)",
        "unordered(hierarchy_radio.lvl1)",
        "unordered(hierarchy_radio_camel.lvl2)",
        "unordered(hierarchy_radio.lvl2)",
        "unordered(hierarchy_radio_camel.lvl3)",
        "unordered(hierarchy_radio.lvl3)",
        "unordered(hierarchy_radio_camel.lvl4)",
        "unordered(hierarchy_radio.lvl4)",
        "unordered(hierarchy_radio_camel.lvl5)",
        "unordered(hierarchy_radio.lvl5)",
        "unordered(hierarchy_radio_camel.lvl6)",
        "unordered(hierarchy_radio.lvl6)",
        "unordered(hierarchy_camel.lvl0)",
        "unordered(hierarchy.lvl0)",
        "unordered(hierarchy_camel.lvl1)",
        "unordered(hierarchy.lvl1)",
        "unordered(hierarchy_camel.lvl2)",
        "unordered(hierarchy.lvl2)",
        "unordered(hierarchy_camel.lvl3)",
        "unordered(hierarchy.lvl3)",
        "unordered(hierarchy_camel.lvl4)",
        "unordered(hierarchy.lvl4)",
        "unordered(hierarchy_camel.lvl5)",
        "unordered(hierarchy.lvl5)",
        "unordered(hierarchy_camel.lvl6)",
        "unordered(hierarchy.lvl6)",
        "content"
      ],
      "distinct": true,
      "attributeForDistinct": "url",
      "customRanking": [
        "desc(weight.pageRank)",
        "desc(weight.level)",
        "asc(weight.position)"
      ],
      "ranking": [
        "words",
        "filters",
        "typo",
        "attribute",
        "proximity",
        "exact",
        "custom"
      ],
      "highlightPreTag": "<span class=\"algolia-docsearch-suggestion--highlight\">",
      "highlightPostTag": "</span>",
      "minWordSizefor1Typo": 3,
      "minWordSizefor2Typos": 7,
      "allowTyposOnNumericTokens": false,
      "minProximity": 1,
      "ignorePlurals": true,
      "advancedSyntax": true,
      "attributeCriteriaComputedByMinProximity": true,
      "removeWordsIfNoResults": "allOptional"
    }
  }
}