1from apify_client import ApifyClient
2
3
4
# API client used for every request in this script; replace the placeholder
# with a real API token before running.
client = ApifyClient(token="<YOUR_API_TOKEN>")
6
7
# Input payload handed to the actor: an item cap, the domains to look up (in
# this order), and the proxy settings to use.
run_input = {
    "maxItems": 10,
    "domains": [
        "amazon.com", "google.com", "facebook.com", "youtube.com", "twitter.com",
        "instagram.com", "linkedin.com", "wikipedia.org", "reddit.com", "pinterest.com",
        "netflix.com", "microsoft.com", "apple.com", "ebay.com", "cnn.com",
        "bbc.com", "nytimes.com", "walmart.com", "target.com", "bestbuy.com",
        "costco.com", "homedepot.com", "lowes.com", "ikea.com", "nike.com",
        "adidas.com", "uber.com", "airbnb.com", "booking.com", "expedia.com",
        "spotify.com", "hulu.com", "disneyplus.com", "hbomax.com", "twitch.tv",
        "paypal.com", "stripe.com", "shopify.com", "wix.com", "squarespace.com",
        "wordpress.com", "medium.com", "github.com", "stackoverflow.com", "quora.com",
        "tumblr.com", "duolingo.com", "coursera.org", "udemy.com", "khanacademy.org",
    ],
    "proxyConfiguration": {"useApifyProxy": True, "apifyProxyGroups": ["RESIDENTIAL"]},
}
67
68
# Run the actor with the prepared input.
run = client.actor("parseforge/similarweb-scraper").call(run_input=run_input)

# NOTE(review): the client's API reference types `call()` as returning an
# optional run object; fail with a clear message instead of a `TypeError`
# on the subscript below.
if run is None:
    raise RuntimeError(
        "Actor 'parseforge/similarweb-scraper' did not return a run object."
    )

# Look the dataset id up once; it is used for both the console link and the
# item listing.
dataset_id = run["defaultDatasetId"]
print(f"💾 Check your data here: https://console.apify.com/storage/datasets/{dataset_id}")
for item in client.dataset(dataset_id).iterate_items():
    print(item)
75
76