"""Run the ``getdataforme/pdf-to-text-scraper`` Apify actor and print its output.

The script builds the actor input, starts the actor through the Apify API
client, then prints a console link to the run's default dataset followed by
every item stored in that dataset.
"""

import os

from apify_client import ApifyClient

# Read the API token from the environment when available so the secret does
# not have to be written into the file; otherwise keep the original
# placeholder, which must be replaced by hand before running.
client = ApifyClient(os.environ.get("APIFY_TOKEN", "<YOUR_API_TOKEN>"))

# Input passed verbatim to the actor. The meaning of each key is defined by
# the actor's own input schema, which is not visible from this script.
run_input = {
    "startUrls": [
        {
            "url": "https://ballasalla.sch.im/site/uploads/pages/3/_media/20171107_019647f4/Online_gaming_an_introduction_for_parents_and_carers_2017.pdf"
        }
    ],
    "storage_provider": "none",
    "gcp_auth_method": "hmac",
    "gcp_service_account_json": "",
    "gcp_project_id": "",
    "bucket_name": "",
    "access_key": "",
    "secret_key": "",
    "endpoint": "storage.googleapis.com",
    "file_path": [],
    # NOTE(review): the start URL above is on ballasalla.sch.im, not
    # apify.com - confirm against the actor's input schema whether this
    # setting restricts which URLs are processed.
    "allowedDomains": ["apify.com"],
    "proxyConfiguration": {"useApifyProxy": True},
}

# Start the actor with the input above and keep the run record it returns.
run = client.actor("getdataforme/pdf-to-text-scraper").call(run_input=run_input)

# The client may hand back no run record; fail with a clear message instead
# of an opaque "NoneType is not subscriptable" on the lookup below.
if run is None:
    raise RuntimeError(
        "Actor 'getdataforme/pdf-to-text-scraper' returned no run record; "
        "cannot locate its default dataset."
    )

# Look the dataset id up once and reuse it for both the link and the fetch.
dataset_id = run["defaultDatasetId"]

print(f"💾 Check your data here: https://console.apify.com/storage/datasets/{dataset_id}")
for item in client.dataset(dataset_id).iterate_items():
    print(item)