
Google News Scraper
7 days trial then $20.00/month - No credit card required now

Google News Scraper
7 days trial then $20.00/month - No credit card required now
Gets featured articles from Google News with title, link, source, publication date and image.
You can access the Google News Scraper programmatically from your own applications by using the Apify API. You can choose your preferred language below. To use the Apify API, you’ll need an Apify account and your API token, found in the Integrations settings in Apify Console.
1{
2 "openapi": "3.0.1",
3 "info": {
4 "version": "0.0",
5 "x-build-id": "y80sb8veExmMdgUPB"
6 },
7 "servers": [
8 {
9 "url": "https://api.apify.com/v2"
10 }
11 ],
12 "paths": {
13 "/acts/lhotanova~google-news-scraper/run-sync-get-dataset-items": {
14 "post": {
15 "operationId": "run-sync-get-dataset-items-lhotanova-google-news-scraper",
16 "x-openai-isConsequential": false,
17 "summary": "Executes an Actor, waits for its completion, and returns Actor's dataset items in response.",
18 "tags": [
19 "Run Actor"
20 ],
21 "requestBody": {
22 "required": true,
23 "content": {
24 "application/json": {
25 "schema": {
26 "$ref": "#/components/schemas/inputSchema"
27 }
28 }
29 }
30 },
31 "parameters": [
32 {
33 "name": "token",
34 "in": "query",
35 "required": true,
36 "schema": {
37 "type": "string"
38 },
39 "description": "Enter your Apify token here"
40 }
41 ],
42 "responses": {
43 "200": {
44 "description": "OK"
45 }
46 }
47 }
48 },
49 "/acts/lhotanova~google-news-scraper/runs": {
50 "post": {
51 "operationId": "runs-sync-lhotanova-google-news-scraper",
52 "x-openai-isConsequential": false,
53 "summary": "Executes an Actor and returns information about the initiated run in response.",
54 "tags": [
55 "Run Actor"
56 ],
57 "requestBody": {
58 "required": true,
59 "content": {
60 "application/json": {
61 "schema": {
62 "$ref": "#/components/schemas/inputSchema"
63 }
64 }
65 }
66 },
67 "parameters": [
68 {
69 "name": "token",
70 "in": "query",
71 "required": true,
72 "schema": {
73 "type": "string"
74 },
75 "description": "Enter your Apify token here"
76 }
77 ],
78 "responses": {
79 "200": {
80 "description": "OK",
81 "content": {
82 "application/json": {
83 "schema": {
84 "$ref": "#/components/schemas/runsResponseSchema"
85 }
86 }
87 }
88 }
89 }
90 }
91 },
92 "/acts/lhotanova~google-news-scraper/run-sync": {
93 "post": {
94 "operationId": "run-sync-lhotanova-google-news-scraper",
95 "x-openai-isConsequential": false,
96 "summary": "Executes an Actor, waits for completion, and returns the OUTPUT from Key-value store in response.",
97 "tags": [
98 "Run Actor"
99 ],
100 "requestBody": {
101 "required": true,
102 "content": {
103 "application/json": {
104 "schema": {
105 "$ref": "#/components/schemas/inputSchema"
106 }
107 }
108 }
109 },
110 "parameters": [
111 {
112 "name": "token",
113 "in": "query",
114 "required": true,
115 "schema": {
116 "type": "string"
117 },
118 "description": "Enter your Apify token here"
119 }
120 ],
121 "responses": {
122 "200": {
123 "description": "OK"
124 }
125 }
126 }
127 }
128 },
129 "components": {
130 "schemas": {
131 "inputSchema": {
132 "type": "object",
133 "required": [
134 "query",
135 "language",
136 "proxyConfiguration"
137 ],
138 "properties": {
139 "query": {
140 "title": "Search query",
141 "type": "string",
142 "description": "Enter search query as you would write it to Google News search bar. You can even use an empty query to search for arbitrary news.",
143 "default": ""
144 },
145 "language": {
146 "title": "Language and region",
147 "enum": [
148 "US:en",
149 "SK:sk",
150 "AU:en",
151 "BW:en",
152 "CA:en",
153 "ET:en",
154 "GH:en",
155 "IN:en",
156 "ID:en",
157 "IE:en",
158 "IL:en",
159 "KE:en",
160 "LV:en",
161 "MY:en",
162 "NA:en",
163 "NZ:en",
164 "NG:en",
165 "PK:en",
166 "PH:en",
167 "SG:en",
168 "ZA:en",
169 "TZ:en",
170 "UG:en",
171 "GB:en",
172 "ZW:en",
173 "ID:id",
174 "CZ:cs",
175 "DE:de",
176 "AT:de",
177 "CH:de",
178 "AR:es-419",
179 "CL:es-419",
180 "CO:es-419",
181 "CU:es-419",
182 "ES:es",
183 "US:es-419",
184 "MX:es-419",
185 "PE:es-419",
186 "VE:es-419",
187 "BE:fr",
188 "CA:fr",
189 "FR:fr",
190 "MA:fr",
191 "SN:fr",
192 "CH:fr",
193 "IT:it",
194 "LV:lv",
195 "LT:lt",
196 "HU:hu",
197 "BE:nl",
198 "NL:nl",
199 "NO:no",
200 "PL:pl",
201 "BR:pt-419",
202 "PT:pt-150",
203 "RO:ro",
204 "SI:sl",
205 "SE:sv",
206 "VN:vi",
207 "TR:tr",
208 "GR:el",
209 "BG:bg",
210 "RU:ru",
211 "UA:ru",
212 "RS:sr",
213 "UA:uk",
214 "IL:he",
215 "AE:ar",
216 "SA:ar",
217 "LB:ar",
218 "EG:ar",
219 "IN:mr",
220 "IN:hi",
221 "BD:bn",
222 "IN:bn",
223 "IN:ta",
224 "IN:te",
225 "IN:ml",
226 "TH:th",
227 "CN:zh-Hans",
228 "TW:zh-Hant",
229 "HK:zh-Hant",
230 "JP:ja",
231 "KR:ko"
232 ],
233 "type": "string",
234 "description": "Select your language and region pair.",
235 "default": "US:en"
236 },
237 "maxItems": {
238 "title": "Max items",
239 "minimum": 0,
240 "type": "integer",
241 "description": "Set the maximum number of items you want to scrape. If you leave this field unset, the actor will extract all news since 2005-01-01. If you set this field to a value less than or equal to 100, the date filter won't be used. Otherwise, the scraper will search news for each individual day."
242 },
243 "fetchArticleDetails": {
244 "title": "Fetch article details",
245 "type": "boolean",
246 "description": "Check this option if you want to decode RSS links into actual article links and also fetch images from the article's page metadata. Please note that this option will increase the runtime of the actor because additional requests to article pages will be made. If you don't need decoded links and article images, you can leave this option unchecked and your run will be significantly faster and cheaper.",
247 "default": true
248 },
249 "dateFrom": {
250 "title": "Date from (YYYY-MM-DD)",
251 "pattern": "\\d{4}-\\d{2}-\\d{2}",
252 "type": "string",
253 "description": "Set the starting date. Only news published on or after this date will be scraped. If the `Open-ended date range` field is set, the `Date from` and `Date to` fields will be ignored."
254 },
255 "dateTo": {
256 "title": "Date to (YYYY-MM-DD)",
257 "pattern": "\\d{4}-\\d{2}-\\d{2}",
258 "type": "string",
259 "description": "Set the end date. Only news published on or before this date will be scraped. If the `Open-ended date range` field is set, the `Date from` and `Date to` fields will be ignored."
260 },
261 "openEndedDateRange": {
262 "title": "Open-ended date range",
263 "pattern": "\\d+(h|d|y)",
264 "type": "string",
265 "description": "Set the open-ended date range such as '1h' to scrape news published in the last hour, '2d' for the last two days, or '1y' for the last year. Use a number followed by one of the letters 'h', 'd', or 'y' to specify the time range. If you set this field, the `Date from` and `Date to` fields will be ignored."
266 },
267 "proxyConfiguration": {
268 "title": "Proxy Configuration",
269 "type": "object",
270 "description": "Use either automatic Apify proxies or your own.",
271 "default": {
272 "useApifyProxy": true
273 }
274 }
275 }
276 },
277 "runsResponseSchema": {
278 "type": "object",
279 "properties": {
280 "data": {
281 "type": "object",
282 "properties": {
283 "id": {
284 "type": "string"
285 },
286 "actId": {
287 "type": "string"
288 },
289 "userId": {
290 "type": "string"
291 },
292 "startedAt": {
293 "type": "string",
294 "format": "date-time",
295 "example": "2025-01-08T00:00:00.000Z"
296 },
297 "finishedAt": {
298 "type": "string",
299 "format": "date-time",
300 "example": "2025-01-08T00:00:00.000Z"
301 },
302 "status": {
303 "type": "string",
304 "example": "READY"
305 },
306 "meta": {
307 "type": "object",
308 "properties": {
309 "origin": {
310 "type": "string",
311 "example": "API"
312 },
313 "userAgent": {
314 "type": "string"
315 }
316 }
317 },
318 "stats": {
319 "type": "object",
320 "properties": {
321 "inputBodyLen": {
322 "type": "integer",
323 "example": 2000
324 },
325 "rebootCount": {
326 "type": "integer",
327 "example": 0
328 },
329 "restartCount": {
330 "type": "integer",
331 "example": 0
332 },
333 "resurrectCount": {
334 "type": "integer",
335 "example": 0
336 },
337 "computeUnits": {
338 "type": "integer",
339 "example": 0
340 }
341 }
342 },
343 "options": {
344 "type": "object",
345 "properties": {
346 "build": {
347 "type": "string",
348 "example": "latest"
349 },
350 "timeoutSecs": {
351 "type": "integer",
352 "example": 300
353 },
354 "memoryMbytes": {
355 "type": "integer",
356 "example": 1024
357 },
358 "diskMbytes": {
359 "type": "integer",
360 "example": 2048
361 }
362 }
363 },
364 "buildId": {
365 "type": "string"
366 },
367 "defaultKeyValueStoreId": {
368 "type": "string"
369 },
370 "defaultDatasetId": {
371 "type": "string"
372 },
373 "defaultRequestQueueId": {
374 "type": "string"
375 },
376 "buildNumber": {
377 "type": "string",
378 "example": "1.0.0"
379 },
380 "containerUrl": {
381 "type": "string"
382 },
383 "usage": {
384 "type": "object",
385 "properties": {
386 "ACTOR_COMPUTE_UNITS": {
387 "type": "integer",
388 "example": 0
389 },
390 "DATASET_READS": {
391 "type": "integer",
392 "example": 0
393 },
394 "DATASET_WRITES": {
395 "type": "integer",
396 "example": 0
397 },
398 "KEY_VALUE_STORE_READS": {
399 "type": "integer",
400 "example": 0
401 },
402 "KEY_VALUE_STORE_WRITES": {
403 "type": "integer",
404 "example": 1
405 },
406 "KEY_VALUE_STORE_LISTS": {
407 "type": "integer",
408 "example": 0
409 },
410 "REQUEST_QUEUE_READS": {
411 "type": "integer",
412 "example": 0
413 },
414 "REQUEST_QUEUE_WRITES": {
415 "type": "integer",
416 "example": 0
417 },
418 "DATA_TRANSFER_INTERNAL_GBYTES": {
419 "type": "integer",
420 "example": 0
421 },
422 "DATA_TRANSFER_EXTERNAL_GBYTES": {
423 "type": "integer",
424 "example": 0
425 },
426 "PROXY_RESIDENTIAL_TRANSFER_GBYTES": {
427 "type": "integer",
428 "example": 0
429 },
430 "PROXY_SERPS": {
431 "type": "integer",
432 "example": 0
433 }
434 }
435 },
436 "usageTotalUsd": {
437 "type": "number",
438 "example": 0.00005
439 },
440 "usageUsd": {
441 "type": "object",
442 "properties": {
443 "ACTOR_COMPUTE_UNITS": {
444 "type": "integer",
445 "example": 0
446 },
447 "DATASET_READS": {
448 "type": "integer",
449 "example": 0
450 },
451 "DATASET_WRITES": {
452 "type": "integer",
453 "example": 0
454 },
455 "KEY_VALUE_STORE_READS": {
456 "type": "integer",
457 "example": 0
458 },
459 "KEY_VALUE_STORE_WRITES": {
460 "type": "number",
461 "example": 0.00005
462 },
463 "KEY_VALUE_STORE_LISTS": {
464 "type": "integer",
465 "example": 0
466 },
467 "REQUEST_QUEUE_READS": {
468 "type": "integer",
469 "example": 0
470 },
471 "REQUEST_QUEUE_WRITES": {
472 "type": "integer",
473 "example": 0
474 },
475 "DATA_TRANSFER_INTERNAL_GBYTES": {
476 "type": "integer",
477 "example": 0
478 },
479 "DATA_TRANSFER_EXTERNAL_GBYTES": {
480 "type": "integer",
481 "example": 0
482 },
483 "PROXY_RESIDENTIAL_TRANSFER_GBYTES": {
484 "type": "integer",
485 "example": 0
486 },
487 "PROXY_SERPS": {
488 "type": "integer",
489 "example": 0
490 }
491 }
492 }
493 }
494 }
495 }
496 }
497 }
498 }
499}
Google News Scraper OpenAPI definition
OpenAPI is a standard for designing and describing RESTful APIs, allowing developers to define API structure, endpoints, and data formats in a machine-readable way. It simplifies API development, integration, and documentation.
OpenAPI works well with AI agents and GPTs because it standardizes how these systems interact with various APIs, enabling reliable integrations and efficient communication.
By defining machine-readable API specifications, OpenAPI allows AI models like GPTs to understand and use varied data sources, improving accuracy. This accelerates development, reduces errors, and provides context-aware responses, making OpenAPI a core component for AI applications.
You can download the OpenAPI definitions for Google News Scraper from the options below:
If you’d like to learn more about how OpenAPI powers GPTs, read our blog post.
You can also check out our other API clients:
Actor Metrics
178 monthly users
-
30 bookmarks
>99% runs succeeded
2.5 days response time
Created in Oct 2022
Modified 7 days ago