forked from vdrmota/Social-Media-and-Contact-Info-Extractor
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathINPUT_SCHEMA.json
59 lines (59 loc) · 2.53 KB
/
INPUT_SCHEMA.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
{
"title": "Contact Info Scraper",
"type": "object",
"schemaVersion": 1,
"properties": {
"startUrls": {
"title": "Start URLs",
"type": "array",
"description": "List of web pages where the actor will start crawling.",
"prefill": [{ "url": "https://apify.com" }],
"editor": "requestListSources"
},
"maxRequests": {
"title": "Maximum pages",
"type": "integer",
"description": "The maximum number of pages the crawler will load. It is always a good idea to limit the number of pages, otherwise the actor might run infinitely or consume too much resources.",
"minimum": 1,
"prefill": 100
},
"maxRequestsPerStartUrl": {
"title": "Maximum pages per start URL",
"type": "integer",
"description": "The maximum number of pages that will be enqueued from each start URL you provide.",
"minimum": 1
},
"maxDepth": {
"title": "Maximum link depth",
"type": "integer",
"description": "The maximum number of links away from the <b>Start URLs</b> that the actor will crawl. If <code>0</code>, the actor will not follow any links. If empty or null, the actor will follow links to arbitrary depth.",
"minimum": 0,
"prefill": 2,
"sectionCaption": "Scraping options",
"sectionDescription": "Here you can specify further conditions for the scrape. However we worked hard to set the best options for you already."
},
"sameDomain": {
"title": "Stay within domain",
"type": "boolean",
"description": "If set, the actor will only follow links within the same domain as the referring page.",
"default": true
},
"considerChildFrames": {
"title": "Probe frames",
"type": "boolean",
"description": "If set, the actor will extract contact information also from IFRAMEs. Sometimes, you might not want that (e.g. this will include data from online ads).",
"default": true
},
"proxyConfig": {
"title": "Proxy",
"type": "object",
"description": "Proxy servers let you bypass website protections, avoid IP address blocking and view content for other countries. Try to use the proxy if you are experiencing timeout errors.",
"default": {
"useApifyProxy": true
},
"editor": "proxy",
"sectionCaption": "Proxy configuration"
}
},
"required": ["startUrls"]
}