You can access the Best Data Extractor API programmatically from your own applications by using the Apify API. You can also choose your preferred language from the options below. To use the Apify API, you’ll need an Apify account and your API token, found in the Integrations settings in Apify Console.

Python

JavaScript

CLI

OpenAPI

HTTP

MCP

{
  "openapi": "3.0.1",
  "info": {
    "title": "Best Data Extractor API",
    "version": "0.0",
    "x-build-id": "jElwKpACbcVgfl6vR"
  },
  "servers": [
    {
      "url": "https://api.apify.com/v2"
    }
  ],
  "paths": {
    "/acts/crawlkit~best-data-extractor-api/run-sync-get-dataset-items": {
      "post": {
        "operationId": "run-sync-get-dataset-items-crawlkit-best-data-extractor-api",
        "x-openai-isConsequential": false,
        "summary": "Executes an Actor, waits for its completion, and returns Actor's dataset items in response.",
        "tags": [
          "Run Actor"
        ],
        "requestBody": {
          "required": true,
          "content": {
            "application/json": {
              "schema": {
                "$ref": "#/components/schemas/inputSchema"
              }
            }
          }
        },
        "parameters": [
          {
            "name": "token",
            "in": "query",
            "required": true,
            "schema": {
              "type": "string"
            },
            "description": "Enter your Apify token here"
          }
        ],
        "responses": {
          "200": {
            "description": "OK"
          }
        }
      }
    },
    "/acts/crawlkit~best-data-extractor-api/runs": {
      "post": {
        "operationId": "runs-sync-crawlkit-best-data-extractor-api",
        "x-openai-isConsequential": false,
        "summary": "Executes an Actor and returns information about the initiated run in response.",
        "tags": [
          "Run Actor"
        ],
        "requestBody": {
          "required": true,
          "content": {
            "application/json": {
              "schema": {
                "$ref": "#/components/schemas/inputSchema"
              }
            }
          }
        },
        "parameters": [
          {
            "name": "token",
            "in": "query",
            "required": true,
            "schema": {
              "type": "string"
            },
            "description": "Enter your Apify token here"
          }
        ],
        "responses": {
          "200": {
            "description": "OK",
            "content": {
              "application/json": {
                "schema": {
                  "$ref": "#/components/schemas/runsResponseSchema"
                }
              }
            }
          }
        }
      }
    },
    "/acts/crawlkit~best-data-extractor-api/run-sync": {
      "post": {
        "operationId": "run-sync-crawlkit-best-data-extractor-api",
        "x-openai-isConsequential": false,
        "summary": "Executes an Actor, waits for completion, and returns the OUTPUT from Key-value store in response.",
        "tags": [
          "Run Actor"
        ],
        "requestBody": {
          "required": true,
          "content": {
            "application/json": {
              "schema": {
                "$ref": "#/components/schemas/inputSchema"
              }
            }
          }
        },
        "parameters": [
          {
            "name": "token",
            "in": "query",
            "required": true,
            "schema": {
              "type": "string"
            },
            "description": "Enter your Apify token here"
          }
        ],
        "responses": {
          "200": {
            "description": "OK"
          }
        }
      }
    }
  },
  "components": {
    "schemas": {
      "inputSchema": {
        "type": "object",
        "required": [
          "url",
          "schema"
        ],
        "properties": {
          "url": {
            "title": "Target URL",
            "type": "string",
            "description": "The URL of the website to extract data from."
          },
          "schema": {
            "title": "Extraction Schema (JSON)",
            "type": "object",
            "description": "JSON Schema defining the structure for LLM extraction. Required."
          },
          "options": {
            "title": "Options (JSON)",
            "type": "object",
            "description": "Configuration options like timeout, headers, etc."
          }
        }
      },
      "runsResponseSchema": {
        "type": "object",
        "properties": {
          "data": {
            "type": "object",
            "properties": {
              "id": {
                "type": "string"
              },
              "actId": {
                "type": "string"
              },
              "userId": {
                "type": "string"
              },
              "startedAt": {
                "type": "string",
                "format": "date-time",
                "example": "2025-01-08T00:00:00.000Z"
              },
              "finishedAt": {
                "type": "string",
                "format": "date-time",
                "example": "2025-01-08T00:00:00.000Z"
              },
              "status": {
                "type": "string",
                "example": "READY"
              },
              "meta": {
                "type": "object",
                "properties": {
                  "origin": {
                    "type": "string",
                    "example": "API"
                  },
                  "userAgent": {
                    "type": "string"
                  }
                }
              },
              "stats": {
                "type": "object",
                "properties": {
                  "inputBodyLen": {
                    "type": "integer",
                    "example": 2000
                  },
                  "rebootCount": {
                    "type": "integer",
                    "example": 0
                  },
                  "restartCount": {
                    "type": "integer",
                    "example": 0
                  },
                  "resurrectCount": {
                    "type": "integer",
                    "example": 0
                  },
                  "computeUnits": {
                    "type": "number",
                    "example": 0
                  }
                }
              },
              "options": {
                "type": "object",
                "properties": {
                  "build": {
                    "type": "string",
                    "example": "latest"
                  },
                  "timeoutSecs": {
                    "type": "integer",
                    "example": 300
                  },
                  "memoryMbytes": {
                    "type": "integer",
                    "example": 1024
                  },
                  "diskMbytes": {
                    "type": "integer",
                    "example": 2048
                  }
                }
              },
              "buildId": {
                "type": "string"
              },
              "defaultKeyValueStoreId": {
                "type": "string"
              },
              "defaultDatasetId": {
                "type": "string"
              },
              "defaultRequestQueueId": {
                "type": "string"
              },
              "buildNumber": {
                "type": "string",
                "example": "1.0.0"
              },
              "containerUrl": {
                "type": "string"
              },
              "usage": {
                "type": "object",
                "properties": {
                  "ACTOR_COMPUTE_UNITS": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATASET_READS": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATASET_WRITES": {
                    "type": "integer",
                    "example": 0
                  },
                  "KEY_VALUE_STORE_READS": {
                    "type": "integer",
                    "example": 0
                  },
                  "KEY_VALUE_STORE_WRITES": {
                    "type": "integer",
                    "example": 1
                  },
                  "KEY_VALUE_STORE_LISTS": {
                    "type": "integer",
                    "example": 0
                  },
                  "REQUEST_QUEUE_READS": {
                    "type": "integer",
                    "example": 0
                  },
                  "REQUEST_QUEUE_WRITES": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATA_TRANSFER_INTERNAL_GBYTES": {
                    "type": "integer",
                    "example": 0
                  },
                  "DATA_TRANSFER_EXTERNAL_GBYTES": {
                    "type": "integer",
                    "example": 0
                  },
                  "PROXY_RESIDENTIAL_TRANSFER_GBYTES": {
                    "type": "integer",
                    "example": 0
                  },
                  "PROXY_SERPS": {
                    "type": "integer",
                    "example": 0
                  }
                }
              },
              "usageTotalUsd": {
                "type": "number",
                "example": 0.00005
              },
              "usageUsd": {
                "type": "object",
                "properties": {
                  "ACTOR_COMPUTE_UNITS": {
                    "type": "number",
                    "example": 0
                  },
                  "DATASET_READS": {
                    "type": "number",
                    "example": 0
                  },
                  "DATASET_WRITES": {
                    "type": "number",
                    "example": 0
                  },
                  "KEY_VALUE_STORE_READS": {
                    "type": "number",
                    "example": 0
                  },
                  "KEY_VALUE_STORE_WRITES": {
                    "type": "number",
                    "example": 0.00005
                  },
                  "KEY_VALUE_STORE_LISTS": {
                    "type": "number",
                    "example": 0
                  },
                  "REQUEST_QUEUE_READS": {
                    "type": "number",
                    "example": 0
                  },
                  "REQUEST_QUEUE_WRITES": {
                    "type": "number",
                    "example": 0
                  },
                  "DATA_TRANSFER_INTERNAL_GBYTES": {
                    "type": "number",
                    "example": 0
                  },
                  "DATA_TRANSFER_EXTERNAL_GBYTES": {
                    "type": "number",
                    "example": 0
                  },
                  "PROXY_RESIDENTIAL_TRANSFER_GBYTES": {
                    "type": "number",
                    "example": 0
                  },
                  "PROXY_SERPS": {
                    "type": "number",
                    "example": 0
                  }
                }
              }
            }
          }
        }
      }
    }
  }
}

Best Data Extractor API OpenAPI definition

OpenAPI is a standard for designing and describing RESTful APIs, allowing developers to define API structure, endpoints, and data formats in a machine-readable way. It simplifies API development, integration, and documentation.

OpenAPI works well with AI agents and GPTs because it standardizes how these systems interact with various APIs, enabling reliable integrations and efficient communication.

By defining machine-readable API specifications, OpenAPI allows AI models like GPTs to understand and use varied data sources, improving accuracy. This accelerates development, reduces errors, and enables context-aware responses, making OpenAPI a core component for AI applications.

You can download the OpenAPI definitions for Best Data Extractor API from the options below:

OpenAPI.json

If you’d like to learn more about how OpenAPI powers GPTs, read our blog post.

You can also check out our other API clients:

Best Data Extractor API in Python

Best Data Extractor API in JavaScript

Best Data Extractor API through CLI

Best Data Extractor API

Zocdoc Scraper

fresh_cliff/zocdoc-scraper

Zocdoc Doctor Scraper - Extract doctor profiles, ratings, locations & availability from Zocdoc API. Search by location & specialty. Get clean structured data for healthcare research, competitor analysis & lead generation. Fast, reliable & bot-resistant scraping.

Brennan Crawford

Free Mcp Ai Linkedin Jobs Scraper Data Api

fresh_cliff/free-mcp-ai-linkedin-jobs-scraper-data-api

🚀 FREE MCP AI LinkedIn Jobs Scraper Data API. Extract job postings automatically with Model Context Protocol technology. Professional MCP-powered AI job scraper & data extractor. Get job titles, companies, locations, salaries, descriptions. Free automated LinkedIn scraping tool with MCP technology.

Brennan Crawford

TikTok Shop Scraper | Product Data Extractor API

charitable_aquarium/tiktok-shop-scraper

The fastest TikTok Shop Product Data Extractor. Scalable and stealthy data extraction tool for TikTok Shop products.

Md Faiyaz Bin Mohiuddin

228

1.6

(2)

Facebook Pages Scraper

apify/facebook-pages-scraper

Extract basic data from multiple Facebook Pages or Profiles. Extract Facebook page details, website, email, address, messenger, likes, followers, rating, ad running status, and other public data. Export scraped data, schedule scraper via API, integrate with other tools or AI workflows.

Apify

53K

4.6

(49)

Best Tiktok Scraper

scrape-creators/best-tiktok-scraper

Scrape TikTok data from profiles, videos, hashtags, search results, and the trending feed using URLs or keywords. Access video transcripts, view counts, likes, comments, music info, and more. Export data, run scrapes via API, schedule and monitor runs, or integrate with your existing tools.

Scrape Creators

518

Kakao Map Scraper - Korea Local Businesses & Reviews

haketa/kakao-map-scraper

Kakao Map scraper & data API for South Korea local businesses: search any category or keyword by area and export name, category, phone, address, GPS, rating, reviews, business hours, amenities, homepage & photos. Korea local business data, lead generation & market research — fast, no login.

Haketa

India MCA Company Data Scraper - CIN, Directors & Charges

haketa/india-mca-scraper

India company data scraper & API (MCA / CIN lookup): enrich any Indian company by CIN and export name, status, incorporation date, RoC, category, authorized & paid-up capital, address, email, directors with DIN & registered charges. India KYC, due-diligence & B2B lead data — fast, no login.

Haketa

Polymarket API no limit | Scraper/Screener | API V3

yellowchimp/polymarket

API for Agentic AI on Polymarket. Automate data extraction for markets, events, and price feeds. Features high-speed crawling and clean JSON formatting designed for developers building trading bots and market analysis tools. Structured JSON and Apify Dataset. Awarded best 2026.

INFO-YC Studios

Olx Product Listings Scraper

fresh_cliff/olx-product-listings-scraper

🔥 FREE OLX scraper PL,PT,RO,UA,BG,BA,KZ,UZ. Extract titles, prices, images, locations 99.9% accuracy. $19.99/month unlimited scraping. Enterprise anti-bot protection. How to scrape OLX data? Best OLX scraper for cars, real estate, electronics. Price monitoring, market research, competitor analysis.

Brennan Crawford

Apple App Store Scraper - Rankings, Reviews & Apps

haketa/app-store-scraper

Apple App Store scraper & data API: export top-chart rankings (Top Free, Paid, Grossing, New) by category & country, scrape app reviews & ratings, full app details, metadata and ASO keyword search. iOS app market intelligence & competitor tracking — fast, no login. Pairs with a Google Play scraper.

Haketa

Naver Land Scraper - Korea Apartments & Officetels

haketa/naver-land-scraper

Naver Land scraper & data API for South Korea real estate: search apartments, officetels & villas for sale (매매), jeonse (전세) & monthly rent (월세); export price, area, floor, direction, location, tags & the listing agent. Korea property market data & lead generation — fast.

Haketa