import os

from apify_client import ApifyClient
2
3
4
# Prefer the token from the APIFY_TOKEN environment variable so the secret
# does not have to live in source; fall back to the inline placeholder
# (replace it with a real token) when the variable is unset.
client = ApifyClient(os.environ.get("APIFY_TOKEN", "<YOUR_API_TOKEN>"))
6
7
# Input payload handed to the actor run: a list of requests plus proxy settings.
# Each "extract" entry carries a field name, a selector and an extract type.
run_input = {
    "requests": [
        # Request with a URL only (no id, no extract rules).
        {"url": "https://www.scrapethissite.com/pages/simple/"},
        # Request with a single extract rule of type "HTML".
        # NOTE(review): the id is "forms" but the URL is /pages/simple/ —
        # confirm this pairing is intended.
        {
            "id": "forms",
            "url": "https://www.scrapethissite.com/pages/simple/",
            "extract": [
                {
                    "field_name": "extracted_html",
                    "selector": "#countries > div > div:nth-child(4) > div:nth-child(1)",
                    "extract_type": "HTML",
                },
            ],
        },
        # Request with three extract rules: two of type "Text" and one that
        # names the "class" attribute.
        {
            "id": "hockey",
            "url": "https://www.scrapethissite.com/pages/forms/",
            "extract": [
                {
                    "field_name": "year1",
                    "selector": "#hockey > div > table > tbody > tr:nth-child(2) > td.year",
                    "extract_type": "Text",
                },
                {
                    "field_name": "year2",
                    "selector": "#hockey > div > table > tbody > tr:nth-child(3) > td.year",
                    "extract_type": "Text",
                },
                {
                    "field_name": "class_name",
                    "selector": "#hockey > div > table > tbody > tr:nth-child(2) > td.year",
                    "extract_type": {"Attribute": "class"},
                },
            ],
        },
    ],
    "proxy_settings": {"useApifyProxy": True},
}
44
45
# Start the actor with the input above and keep the run record it returns.
run = client.actor("danielherman/fast-scraper").call(run_input=run_input)

# call() is typed as returning `dict | None`; fail with a clear message here
# rather than with a TypeError when subscripting None below.
if run is None:
    raise RuntimeError("Actor run did not return a run record; no dataset to read.")

# Look the dataset id up once; it is used for both the console link and the fetch.
dataset_id = run["defaultDatasetId"]

print(f"💾 Check your data here: https://console.apify.com/storage/datasets/{dataset_id}")
for item in client.dataset(dataset_id).iterate_items():
    print(item)
52
53