"""Run the ``apify/rag-web-browser`` Actor and print the items it stored.

The script builds the Actor input, starts the Actor through the Apify API
client, prints a console link to the run's default dataset, and then prints
every item read from that dataset.
"""

from apify_client import ApifyClient

# Initialize the ApifyClient with your API token.
# "<YOUR_API_TOKEN>" is a placeholder and must be replaced before running.
client = ApifyClient("<YOUR_API_TOKEN>")

# Prepare the Actor input.
run_input = {
    "query": "web browser for RAG pipelines -site:reddit.com",
    "proxyConfiguration": {"useApifyProxy": True},
    # Multi-line CSS selector list; the continuation lines are part of the
    # string value, so they must stay flush with the left margin.
    # NOTE(review): presumably the matched elements are stripped from the
    # fetched pages -- confirm against the Actor's input schema.
    "removeElementsCssSelector": """nav, footer, script, style, noscript, svg, img[src^='data:'],
[role=\"alert\"],
[role=\"banner\"],
[role=\"dialog\"],
[role=\"alertdialog\"],
[role=\"region\"][aria-label*=\"skip\" i],
[aria-modal=\"true\"]""",
    "htmlTransformer": "none",
}

# Run the Actor with the prepared input and keep the returned run record.
run = client.actor("apify/rag-web-browser").call(run_input=run_input)

# Look the dataset id up once; it is used for both the link and the fetch.
dataset_id = run["defaultDatasetId"]

# Print a link to the dataset, then each item stored in it.
print(f"💾 Check your data here: https://console.apify.com/storage/datasets/{dataset_id}")
for item in client.dataset(dataset_id).iterate_items():
    print(item)
28
29