import { ApifyClient } from 'apify-client';

// API client used by the rest of this script. The token value is a
// placeholder: substitute your own Apify API token before running.
const client = new ApifyClient({
  token: '<YOUR_API_TOKEN>',
});
8
9
// Input object handed to the actor's `call()` further down in this script.
const input = {
  startUrls: [
    {
      url: 'https://news.ycombinator.com/',
    },
  ],
  // Multi-line prompt; the line breaks inside the template literal are part
  // of the string, so the continuation lines are deliberately not indented
  // to match the surrounding code.
  instructions: `Gets the post with the most points from the page and returns it as JSON in this format:
 postTitle
 postUrl
 pointsCount`,
  model: 'gpt-3.5-turbo',
  includeUrlGlobs: [],
  excludeUrlGlobs: [],
  linkSelector: 'a[href]',
  initialCookies: [],
  proxyConfiguration: {
    useApifyProxy: true,
  },
  targetSelector: '',
  removeElementsCssSelector: 'script, style, noscript, path, svg, xlink',
  skipGptGlobs: [],
  // NOTE(review): this schema describes `title`/`description`, while
  // `instructions` asks for postTitle/postUrl/pointsCount. Confirm whether
  // the actor uses the schema for this run and align the two if it does.
  schema: {
    type: 'object',
    properties: {
      title: {
        type: 'string',
        description: 'Page title',
      },
      description: {
        type: 'string',
        description: 'Page description',
      },
    },
    required: ['title', 'description'],
  },
  schemaDescription: '',
};
50
51
// Start the actor with the prepared input and await the resulting run object.
const run = await client.actor('drobnikj/extended-gpt-scraper').call(input);

// Print a console link to the run's default dataset, then fetch the dataset
// items and dump each one to stdout.
console.log('Results from dataset');
console.log(`💾 Check your data here: https://console.apify.com/storage/datasets/${run.defaultDatasetId}`);
const { items } = await client.dataset(run.defaultDatasetId).listItems();
for (const item of items) {
  console.dir(item);
}
61
62