# First, specify the base Docker image. You can read more about
# the available images at https://sdk.apify.com/docs/guides/docker-images
# You can also use any other image from Docker Hub.
FROM apify/actor-node:16

# Copy only the dependency manifests first. They are the only files that
# affect "npm install" in the next step, so the install layer stays cached
# until package.json or package-lock.json changes.
COPY package*.json ./

# Install production NPM packages only, skipping development and optional
# dependencies to keep the image small. "--omit=dev --omit=optional" replaces
# "--only=prod --no-optional", which npm has deprecated since version 7.
# Progress output is disabled to keep the build log short, and the dependency
# tree plus the Node.js and NPM versions are printed for debugging
# ("npm list" is allowed to fail without breaking the build).
RUN npm --quiet set progress=false \
 && npm install --omit=dev --omit=optional \
 && echo "Installed NPM packages:" \
 && (npm list || true) \
 && echo "Node.js version:" \
 && node --version \
 && echo "NPM version:" \
 && npm --version

# Copy the remaining files and directories with the source code last.
# Because this happens after the NPM install, rebuilds triggered by
# source-only changes reuse the cached dependency layer and finish quickly.
COPY . ./

# Optionally, specify how to launch the source code of your actor.
# By default, Apify's base Docker images define the CMD instruction
# that runs the Node.js source code using the command specified
# in the "scripts.start" section of the package.json file.
# In short, the instruction looks something like this:
#
# CMD npm start

main.js

// This is the main Node.js source code file of your actor.
// It is referenced from the "scripts" section of the package.json file.

const Apify = require('apify');

Apify.main(async () => {
    // Get input of the actor. Input fields can be modified in INPUT_SCHEMA.json file.
    // For more information, see https://docs.apify.com/actors/development/input-schema
    const input = await Apify.getInput();
    console.log('Input:');
    console.dir(input);

    // Fail early with a readable message instead of a TypeError on
    // "input.maxRequestRetries" when the actor is started without any input.
    if (!input) {
        throw new Error('Actor input is missing; expected an object with "startUrls".');
    }

    // Prepare the input for the actor apify/web-scraper. This input is based on
    // the actor task that was used as the starting point.
    const metamorphInput = {
        "breakpointLocation": "NONE",
        "browserLog": false,
        "debugLog": false,
        "downloadCss": true,
        "downloadMedia": true,
        "ignoreCorsAndCsp": false,
        "ignoreSslErrors": false,
        "injectJQuery": true,
        "keepUrlFragments": false,
        "maxRequestRetries": input.maxRequestRetries,
        // The function accepts a single argument: the "context" object.
        // For a complete list of its properties and functions,
        // see https://apify.com/apify/web-scraper#page-function
        "pageFunction": async function pageFunction(context) {
            // To debug, add a "debugger;" statement here. It works as a
            // breakpoint only with Run mode: DEVELOPMENT.
            const search = "#SearchProductCardComponent";

            // Wait 2 seconds before querying the DOM
            // (presumably to let the product cards render -- confirm).
            await context.waitFor(2000);

            const products = document.querySelectorAll(search);
            const results = [];

            // Evaluates a DOM lookup and falls back to "" when the lookup throws
            // (for example, when an expected child node is missing).
            const readOrEmpty = (lookup) => {
                try {
                    return lookup();
                } catch (error) {
                    return "";
                }
            };

            // NOTE(review): the bound "products.length - 1" skips the last matched
            // element. It is kept as-is to preserve the current output; confirm
            // whether the last card should be scraped as well.
            for (let i = 0; i < products.length - 1; i++) {
                const card = products[i];
                results.push({
                    "name": readOrEmpty(() => card.childNodes[1].childNodes[0].text),
                    "url": readOrEmpty(() => card.childNodes[1].childNodes[0].href),
                    "logoURL": readOrEmpty(() => card.getElementsByTagName('img')[0].src),
                    "category": readOrEmpty(() => card.childNodes[1].childNodes[1].text),
                });
            }

            // Return an object with the data extracted from the page.
            // It will be stored to the resulting dataset.
            return {
                results: results
            };
        },
        "postNavigationHooks": `// We need to return array of (possibly async) functions here.
            // The functions accept a single argument: the "crawlingContext" object.
            [
                async (crawlingContext) => {
                    // ...
                },
            ]`,
        "preNavigationHooks": `// We need to return array of (possibly async) functions here.
            // The functions accept two arguments: the "crawlingContext" object
            // and "gotoOptions".
            [
                async (crawlingContext, gotoOptions) => {
                    // ...
                },
            ]`,
        "proxyConfiguration": {
            "useApifyProxy": true,
            "apifyProxyCountry": "US"
        },
        "startUrls": input.startUrls,
        "runMode": "PRODUCTION",
        "useChrome": false,
        "waitUntil": [
            "networkidle2"
        ]
    };

    // Now let's metamorph into actor apify/web-scraper using the created input.
    await Apify.metamorph('apify/web-scraper', metamorphInput);
});

package.json

{
    "name": "my-actor",
    "version": "0.0.1",
    "dependencies": {
        "apify": "^2.2.2"
    },
    "scripts": {
        "start": "node main.js"
    },
    "author": "Me!"
}

Google Maps Scraper

compass/crawler-google-places

Extract data from thousands of Google Maps locations and businesses, including reviews, reviewer details, images, contact info, opening hours, location, prices & more. Export scraped data, run the scraper via API, schedule and monitor runs, or integrate with other tools.

Compass

183K

4.7

Pitchbook Investors Scraper

parseforge/pitchbook-investors-scraper

Supercharge your private equity and venture capital research with our comprehensive PitchBook Investors Scraper! Access detailed investor data from 687,000+ investors across all regions. Perfect for fund managers, researchers, and analysts who need precise investor intelligence.

ParseForge

5.0

Amazon Reviews Scraper (By Product Url)

scrapingshark/amazon-reviews-scraper-by-product-url

Scrape detailed Amazon product reviews from any product URL with ease. Get review text, ratings, author info, review dates, helpful votes, and more—perfect for sentiment analysis, competitor research, and e-commerce insights.

ScrapingShark

Zillow Property Info Scraper

aknahin/zillow-property-info-scraper

This actor takes multiple property addresses (one per line) and fetches detailed information for each using Zillow’s internal APIs. Whether you’re analyzing comps, scouting investment properties, or automating real estate workflows, this tool is designed to save you hours of manual research.

Technivis

5.0

Moz Domain Authority Checker

jdtpnjtp/moz-domain-authority-checker

The MOZ Domain Authority API provides comprehensive domain analysis and SEO metrics through a simple REST interface. Analyze any domain to retrieve critical SEO indicators including Domain Authority (DA), Page Authority

Data Collector

GMGN Token Stat Scraper

muhammetakkurtt/gmgn-token-stat-scraper

Automate token data extraction from GMGN.ai with this powerful scraper. Supports Solana, Ethereum, BSC, Base, and Tron. Get real-time price, liquidity, trading volume, and holder stats for comprehensive crypto market analysis, investment research, and portfolio tracking. Boost your insights now!

Muhammet Akkurt

5.0

Allabolag Business Search Scraper

ecomscrape/allabolag-business-search-scraper

Extract Swedish business data from Allabolag.se efficiently with our automated scraper. Get company details, contact info, financials & more in JSON/CSV/Excel formats. Perfect for lead generation, market research & CRM integration. Easy-to-use tool processes thousands of records instantly.

ecomscrape

Youtube Video Transcript Scraper

turboscraper/youtube-transcript-scrap

Tired of manual transcript extraction? The YouTube-Transcript-Scraper makes it effortless! 🚀 Get full transcripts and valuable data in seconds. Let’s automate your workflow — it’s time to scrape smarter! 💻🔍

Ihor Dudnyk

Extract Email from Any Webpage | $1 per month

extensionkit.rdt001/email-scraper

Effortlessly uncover publicly accessible email addresses linked to specific domains. This tool performs an intelligent web scan, making it ideal for discovering contacts, generating leads, and conducting market analysis.

web automation lover

n8n Template Scraper

datavoyantlab/n8n-templates-scraper

Scrape n8n.io workflow templates with this Apify actor. Filter by category (AI, Marketing, DevOps), sort by popularity, and get structured data with importable JSONs for developers and businesses.