forked from apify/actor-algolia-website-indexer
-
Notifications
You must be signed in to change notification settings - Fork 0
/
INPUT_SCHEMA.json
132 lines (132 loc) · 3.81 KB
/
INPUT_SCHEMA.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
{
"title": "Algolia Web Crawler input",
"description": "",
"type": "object",
"schemaVersion": 1,
"properties": {
"algoliaAppId": {
"sectionCaption": "Basic",
"title": "Algolia App ID",
"type": "string",
"description": "Your Algolia Application ID",
"editor": "textfield"
},
"algoliaApiKey": {
"title": "Algolia API Key",
"type": "string",
"description": "Your Algolia API key",
"editor": "textfield"
},
"algoliaIndexName": {
"title": "Algolia Index Name",
"type": "string",
"description": "Your Algolia index name",
"editor": "textfield"
},
"crawlerName": {
"title": "Crawler Name",
"type": "string",
"description": "Crawler name, it updates/removes/adds pages into to index regarding this name. In this case, you can have more website in the index.",
"editor": "textfield"
},
"startUrls": {
"title": "Start URLs",
"type": "array",
"description": "URLs where to start crawling",
"prefill": [
{
"url": "http://example.com"
}
],
"editor": "requestListSources"
},
"selectors": {
"title": "Selectors",
"type": "array",
"description": "Pick selectors, which text content you want to index. Key is name of attribute and value is CSS selector.",
"prefill": [
{
"key": "h1",
"value": "body"
}
],
"editor": "keyValue"
},
"requiredAttributes": {
"title": "Required attributes",
"type": "array",
"description": "Pick attributes, which are required in index. By default all attributes from selectors are required.",
"prefill": [],
"editor": "json"
},
"waitForElement": {
"title": "Wait for element",
"type": "string",
"description": "Selector of element to wait on each page.",
"editor": "textfield"
},
"additionalPageAttrs": {
"title": "Additional attributes",
"type": "object",
"description": "Pick additional attributes you want to attach to each record in index.",
"editor": "json",
"prefill": {},
"default": {}
},
"skipIndexUpdate": {
"title": "Skip Index Updated",
"type": "boolean",
"description": "If check crawler will not update Algolia index.",
"default": true
},
"disableCrawlerCascade": {
"title": "Disable crawling links found on pages",
"type": "boolean",
"description": "Disable crawling links found on pages.",
"default": false
},
"listOfUrls": {
"title": "List of URLs to scan (ignore start URLs)",
"type": "array",
"description": "The list of urls to scan (ignore start URLs)",
"editor": "requestListSources"
},
"pseudoUrls": {
"sectionCaption": "Overrides defaults",
"title": "Pseudo-URLs",
"type": "array",
"description": "Overrides default pseudoUrls",
"editor": "pseudoUrls"
},
"pageFunction": {
"title": "Page function",
"type": "string",
"description": "Overrides default pageFunction",
"editor": "javascript"
},
"clickableElements": {
"title": "Clickable elements",
"type": "string",
"description": "Overrides default clickableElements",
"editor": "textfield"
},
"keepUrlFragments": {
"title": "Keep URL fragments",
"type": "boolean",
"description": "Option to switch on enqueueing URL with URL fragments",
"default": false
},
"omitSearchParamsFromUrl": {
"title": "Omit search params from URLs",
"type": "boolean",
"description": "Option to switch off enqueueing with search params.",
"default": false
}
},
"required": [
"algoliaAppId",
"algoliaApiKey",
"algoliaIndexName",
"startUrls"
]
}