"""Run the ``scrapier/smart-article-extractor`` Apify Actor and print its output.

The script starts the Actor with a fixed input, then prints a link to the
run's default dataset followed by every item stored in that dataset.
"""
from apify_client import ApifyClient

# Replace the placeholder with a real Apify API token before running.
client = ApifyClient("<YOUR_API_TOKEN>")

# Input passed to the Actor as-is.
run_input = {
    "startUrls": ["https://www.theguardian.com"],
    "articleUrls": [],
    "proxyConfiguration": {"useApifyProxy": False},
    # Sent as a plain string; every line of it is commented out, so it is
    # only a template for a custom output-extension function.
    "extendOutputFunction": """# def extend(soup, article, html):
# return {\"pageTitle\": soup.title.string.strip() if soup.title else None}
""",
}

# Start the Actor run with the input above.
run = client.actor("scrapier/smart-article-extractor").call(run_input=run_input)

# The client documents that call() may return None; fail with a clear
# message instead of a TypeError on the subscript below.
if run is None:
    raise RuntimeError("Actor run did not return any run details")

dataset_id = run["defaultDatasetId"]

# \N{FLOPPY DISK} keeps the emoji intact regardless of the file's encoding.
print(
    "\N{FLOPPY DISK} Check your data here: "
    "https://console.apify.com/storage/datasets/" + dataset_id
)
for item in client.dataset(dataset_id).iterate_items():
    print(item)