1import { ApifyClient } from 'apify-client';
2
3
4
// Apify API client used for every request made by this script.
// The token is taken from the APIFY_TOKEN environment variable when that is
// set to a non-empty value, so a real secret does not have to be written into
// this file. Otherwise the placeholder below is used and must be replaced by
// hand before the script can authenticate.
const client = new ApifyClient({
    token: process.env.APIFY_TOKEN || '<YOUR_API_TOKEN>',
});
8
9
// Input object for the Actor run: one start URL plus the crawler options.
const input = {
    startUrls: [
        { url: 'https://docs.apify.com/academy/web-scraping-for-beginners' },
    ],
    useSitemaps: false,
    respectRobotsTxtFile: true,
    crawlerType: 'playwright:adaptive',
    includeUrlGlobs: [],
    excludeUrlGlobs: [],
    initialCookies: [],
    customHttpHeaders: {},
    proxyConfiguration: { useApifyProxy: true },
    keepElementsCssSelector: '',
    // The line breaks and leading whitespace inside this template literal are
    // part of the string value, so the continuation lines must not be re-indented.
    removeElementsCssSelector: `nav, footer, script, style, noscript, svg, img[src^='data:'],
 [role="alert"],
 [role="banner"],
 [role="dialog"],
 [role="alertdialog"],
 [role="region"][aria-label*="skip" i],
 [aria-modal="true"]`,
    blockMedia: true,
    clickElementsCssSelector: '[aria-expanded="false"]',
    storeSkippedUrls: false,
};
38
39
// Call the "apify/website-content-crawler" Actor with `input`. The call is
// awaited, so the statements below run only after its promise has resolved.
const run = await client.actor('apify/website-content-crawler').call(input);

// Print a console link to the run's default dataset, then dump each item
// returned by listItems().
console.log('Results from dataset');
console.log(`💾 Check your data here: https://console.apify.com/storage/datasets/${run.defaultDatasetId}`);
const { items } = await client.dataset(run.defaultDatasetId).listItems();
for (const item of items) {
    console.dir(item);
}
49
50