# Run the apify/legacy-phantomjs-crawler actor with an inline JSON input.
#
# The JSON document is written with a quoted here-document ('JSON'), which
# disables every shell expansion inside the body. That means:
#   * `$` and single quotes in the embedded JavaScript need no escaping;
#   * the `\n` sequences reach the JSON parser exactly as written, instead of
#     depending on how a particular shell's `echo` treats backslashes.
# The document is piped (rather than redirected) so the CLI receives its input
# on stdin through a pipe, as in the original `echo ... | apify call` form.
#
# Input fields:
#   startUrls                 - key/value pairs; here one entry keyed START.
#   crawlPurls                - key/value pairs; here one entry keyed MY_LABEL
#                               whose value ends in the `[.*]` pattern.
#   clickableElementsSelector - CSS selector; anchors without rel=nofollow.
#   pageFunction              - JavaScript source returning { title, myValue };
#                               the 'TODO' selector is a placeholder to replace.
#   interceptRequest          - JavaScript source returning newRequest unchanged.
cat <<'JSON' |
{
  "startUrls": [
    {
      "key": "START",
      "value": "https://www.example.com/"
    }
  ],
  "crawlPurls": [
    {
      "key": "MY_LABEL",
      "value": "https://www.example.com/[.*]"
    }
  ],
  "clickableElementsSelector": "a:not([rel=nofollow])",
  "pageFunction": "function pageFunction(context) {\n // called on every page the crawler visits, use it to extract data from it\n var $ = context.jQuery;\n var result = {\n title: $('title').text(),\n myValue: $('TODO').text()\n };\n return result;\n}\n",
  "interceptRequest": "function interceptRequest(context, newRequest) {\n // called whenever the crawler finds a link to a new page,\n // use it to override default behavior\n return newRequest;\n}\n"
}
JSON
apify call apify/legacy-phantomjs-crawler --silent --output-dataset