import os

from apify_client import ApifyClient


# Create the API client. The token is taken from the APIFY_TOKEN environment
# variable when it is set and non-empty, so the secret does not have to be
# written into this file; otherwise the placeholder is used and must be
# replaced by hand before running.
client = ApifyClient(os.environ.get("APIFY_TOKEN") or "<YOUR_API_TOKEN>")

# Input document handed to the Actor run.
# NOTE(review): the meaning of each key is defined by the Actor's own input
# schema, which is not visible here — the per-key notes below are assumptions
# based on the key names; confirm against the Actor's documentation.
run_input = {
    "startUrls": ["https://apify.com"],
    # Presumably extra site-relative paths to visit in addition to the start URLs.
    "additionalPaths": [
        "/about",
        "/about-us",
        "/contact",
        "/contact-us",
        "/pages/contact-us",
        "/pages/about-us",
        "/pages/privacy-policy",
        "/privacy-policy",
        "/pages/terms-and-conditions",
        "/terms-and-conditions",
        "/pages/sitemap",
        "/sitemap",
        "/pages/faq",
        "/faq",
        "/pages/our-story",
        "/our-story",
        "/pages/our-team",
        "/our-team",
    ],
    # Presumably substrings that cause a link to be skipped when matched.
    "excludeKeywords": [
        "whatsapp",
        "wa.me",
        "facebook",
        "instagram",
        "linkedin",
        "youtube",
        "twitter",
        "x.com",
        "blog",
        "blogs",
        "news",
        "setting",
        "settings",
        "#",
        "collection",
        "collections",
        "product",
        "products",
        "account",
        "login",
        "logout",
        "signin",
        "signout",
        "cart",
        "checkout",
        "search",
        "compare",
        "wishlist",
    ],
    "proxyConfiguration": {
        "useApifyProxy": True,
        "apifyProxyGroups": ["RESIDENTIAL"],
    },
}

# Start the Actor with the input above and obtain the resulting run object.
run = client.actor("competent_clarinet/website-contact-crawler").call(run_input=run_input)

# The client types the result of `call()` as optional; fail with an explicit
# message rather than a TypeError from subscripting None further down.
if run is None:
    raise RuntimeError("Actor run did not return a run object; no dataset to read.")

# Look the dataset id up once and reuse it for both the link and the fetch.
dataset_id = run["defaultDatasetId"]

print("💾 Check your data here: https://console.apify.com/storage/datasets/" + dataset_id)
for item in client.dataset(dataset_id).iterate_items():
    print(item)