Dataset Schema Super Actor
Pricing
Pay per usage
Pricing
Pay per usage
Rating
0.0
(0)
Developer

Zuzka Pelechová
Actor stats
0
Bookmarked
1
Total users
0
Monthly active users
14 days ago
Last modified
Categories
Share
Pricing
Pay per usage
Pricing
Pay per usage
Rating
0.0
(0)
Developer

Zuzka Pelechová
Actor stats
0
Bookmarked
1
Total users
0
Monthly active users
14 days ago
Last modified
Categories
Share
You can access the Dataset Schema Super Actor programmatically from your own applications by using the Apify API. You can also choose the language preference from below. To use the Apify API, you’ll need an Apify account and your API token, found in Integrations settings in Apify Console.
{ "openapi": "3.0.1", "info": { "version": "1.0", "x-build-id": "oGsnxJ1gsKhZLIub7" }, "servers": [ { "url": "https://api.apify.com/v2" } ], "paths": { "/acts/zuzka~dataset-schema-super-actor/run-sync-get-dataset-items": { "post": { "operationId": "run-sync-get-dataset-items-zuzka-dataset-schema-super-actor", "x-openai-isConsequential": false, "summary": "Executes an Actor, waits for its completion, and returns Actor's dataset items in response.", "tags": [ "Run Actor" ], "requestBody": { "required": true, "content": { "application/json": { "schema": { "$ref": "#/components/schemas/inputSchema" } } } }, "parameters": [ { "name": "token", "in": "query", "required": true, "schema": { "type": "string" }, "description": "Enter your Apify token here" } ], "responses": { "200": { "description": "OK" } } } }, "/acts/zuzka~dataset-schema-super-actor/runs": { "post": { "operationId": "runs-sync-zuzka-dataset-schema-super-actor", "x-openai-isConsequential": false, "summary": "Executes an Actor and returns information about the initiated run in response.", "tags": [ "Run Actor" ], "requestBody": { "required": true, "content": { "application/json": { "schema": { "$ref": "#/components/schemas/inputSchema" } } } }, "parameters": [ { "name": "token", "in": "query", "required": true, "schema": { "type": "string" }, "description": "Enter your Apify token here" } ], "responses": { "200": { "description": "OK", "content": { "application/json": { "schema": { "$ref": "#/components/schemas/runsResponseSchema" } } } } } } }, "/acts/zuzka~dataset-schema-super-actor/run-sync": { "post": { "operationId": "run-sync-zuzka-dataset-schema-super-actor", "x-openai-isConsequential": false, "summary": "Executes an Actor, waits for completion, and returns the OUTPUT from Key-value store in response.", "tags": [ "Run Actor" ], "requestBody": { "required": true, "content": { "application/json": { "schema": { "$ref": "#/components/schemas/inputSchema" } } } }, "parameters": [ { "name": "token", "in": "query", "required": true, "schema": { "type": "string" }, "description": "Enter your Apify token here" } ], "responses": { "200": { "description": "OK" } } } } }, "components": { "schemas": { "inputSchema": { "type": "object", "required": [ "actorTechnicalName" ], "properties": { "actorTechnicalName": { "title": "Actor Technical Name", "pattern": "^[a-zA-Z0-9_-]+/[a-zA-Z0-9_-]+$", "type": "string", "description": "The technical name of the Actor to generate schema for (e.g., 'compass/Instagram-Scraper')" }, "generateInputs": { "title": "Generate Test Inputs", "type": "boolean", "description": "Generate test inputs for the Actor (Step 1)" }, "generateSchema": { "title": "Generate Initial Schema", "type": "boolean", "description": "Generate initial dataset schema from Actor runs (Step 2)" }, "existingMinimalInput": { "title": "Existing Minimal Input (JSON)", "type": "string", "description": "Provide existing minimal test input as JSON. Leave empty to use generated input." }, "existingNormalInput": { "title": "Existing Normal Input (JSON)", "type": "string", "description": "Provide existing normal test input as JSON. Leave empty to use generated input." }, "existingMaximalInput": { "title": "Existing Maximal Input (JSON)", "type": "string", "description": "Provide existing maximal test input as JSON. Leave empty to use generated input." }, "existingEdgeInput": { "title": "Existing Edge Input (JSON)", "type": "string", "description": "Provide existing edge test input as JSON. Leave empty to use generated input." }, "useRealDatasetIds": { "title": "Use Real Dataset IDs Instead", "type": "boolean", "description": "Generate schema from real Redash datasets instead of test inputs. Requires Redash credentials from Step 4." }, "enhanceSchema": { "title": "Enhance Schema with AI", "type": "boolean", "description": "Enhance schema using Claude Sonnet 4 (Step 3)" }, "existingEnhancedSchema": { "title": "Existing Enhanced Schema (JSON)", "type": "string", "description": "Provide existing enhanced schema as JSON to skip Step 3. Leave empty to generate new enhanced schema." }, "generateViews": { "title": "Generate Views", "type": "boolean", "description": "Whether to generate dataset views in the schema. Skip if you already have views in the schema." }, "validateSchema": { "title": "Validate Schema", "type": "boolean", "description": "Validate schema against real dataset data (Step 4)" }, "daysBack": { "title": "Days Back for Validation", "minimum": 1, "maximum": 14, "type": "integer", "description": "Number of days back to look for datasets in validation", "default": 5 }, "maximumResults": { "title": "Maximum Results for Validation", "minimum": 1, "maximum": 100, "type": "integer", "description": "Maximum number of results to fetch for validation", "default": 10 }, "minimumResults": { "title": "Minimum Results for Validation", "minimum": 1, "maximum": 100, "type": "integer", "description": "Minimum number of results required for validation", "default": 1 }, "runsPerUser": { "title": "Runs Per User for Validation", "minimum": 1, "maximum": 10, "type": "integer", "description": "Number of runs per user to consider in validation", "default": 2 }, "maxResultsPerQuery": { "title": "Max results per query", "minimum": 0, "maximum": 300, "type": "integer", "description": "Maximum number of rows to fetch from Redash chart query (0 = unlimited)", "default": 100 }, "createPR": { "title": "Create GitHub PR", "type": "boolean", "description": "Create GitHub pull request with the schema (Step 5)" }, "githubLink": { "title": "GitHub Repository Link", "pattern": "^https://github\\.com/[a-zA-Z0-9_-]+/[a-zA-Z0-9_-]+/?$", "type": "string", "description": "URL to the GitHub repository where the PR should be created" }, "githubToken": { "title": "GitHub Personal Access Token", "type": "string", "description": "GitHub Personal Access Token for creating PRs" } } }, "runsResponseSchema": { "type": "object", "properties": { "data": { "type": "object", "properties": { "id": { "type": "string" }, "actId": { "type": "string" }, "userId": { "type": "string" }, "startedAt": { "type": "string", "format": "date-time", "example": "2025-01-08T00:00:00.000Z" }, "finishedAt": { "type": "string", "format": "date-time", "example": "2025-01-08T00:00:00.000Z" }, "status": { "type": "string", "example": "READY" }, "meta": { "type": "object", "properties": { "origin": { "type": "string", "example": "API" }, "userAgent": { "type": "string" } } }, "stats": { "type": "object", "properties": { "inputBodyLen": { "type": "integer", "example": 2000 }, "rebootCount": { "type": "integer", "example": 0 }, "restartCount": { "type": "integer", "example": 0 }, "resurrectCount": { "type": "integer", "example": 0 }, "computeUnits": { "type": "integer", "example": 0 } } }, "options": { "type": "object", "properties": { "build": { "type": "string", "example": "latest" }, "timeoutSecs": { "type": "integer", "example": 300 }, "memoryMbytes": { "type": "integer", "example": 1024 }, "diskMbytes": { "type": "integer", "example": 2048 } } }, "buildId": { "type": "string" }, "defaultKeyValueStoreId": { "type": "string" }, "defaultDatasetId": { "type": "string" }, "defaultRequestQueueId": { "type": "string" }, "buildNumber": { "type": "string", "example": "1.0.0" }, "containerUrl": { "type": "string" }, "usage": { "type": "object", "properties": { "ACTOR_COMPUTE_UNITS": { "type": "integer", "example": 0 }, "DATASET_READS": { "type": "integer", "example": 0 }, "DATASET_WRITES": { "type": "integer", "example": 0 }, "KEY_VALUE_STORE_READS": { "type": "integer", "example": 0 }, "KEY_VALUE_STORE_WRITES": { "type": "integer", "example": 1 }, "KEY_VALUE_STORE_LISTS": { "type": "integer", "example": 0 }, "REQUEST_QUEUE_READS": { "type": "integer", "example": 0 }, "REQUEST_QUEUE_WRITES": { "type": "integer", "example": 0 }, "DATA_TRANSFER_INTERNAL_GBYTES": { "type": "integer", "example": 0 }, "DATA_TRANSFER_EXTERNAL_GBYTES": { "type": "integer", "example": 0 }, "PROXY_RESIDENTIAL_TRANSFER_GBYTES": { "type": "integer", "example": 0 }, "PROXY_SERPS": { "type": "integer", "example": 0 } } }, "usageTotalUsd": { "type": "number", "example": 0.00005 }, "usageUsd": { "type": "object", "properties": { "ACTOR_COMPUTE_UNITS": { "type": "integer", "example": 0 }, "DATASET_READS": { "type": "integer", "example": 0 }, "DATASET_WRITES": { "type": "integer", "example": 0 }, "KEY_VALUE_STORE_READS": { "type": "integer", "example": 0 }, "KEY_VALUE_STORE_WRITES": { "type": "number", "example": 0.00005 }, "KEY_VALUE_STORE_LISTS": { "type": "integer", "example": 0 }, "REQUEST_QUEUE_READS": { "type": "integer", "example": 0 }, "REQUEST_QUEUE_WRITES": { "type": "integer", "example": 0 }, "DATA_TRANSFER_INTERNAL_GBYTES": { "type": "integer", "example": 0 }, "DATA_TRANSFER_EXTERNAL_GBYTES": { "type": "integer", "example": 0 }, "PROXY_RESIDENTIAL_TRANSFER_GBYTES": { "type": "integer", "example": 0 }, "PROXY_SERPS": { "type": "integer", "example": 0 } } } } } } } } }}OpenAPI is a standard for designing and describing RESTful APIs, allowing developers to define API structure, endpoints, and data formats in a machine-readable way. It simplifies API development, integration, and documentation.
OpenAPI is effective when used with AI agents and GPTs by standardizing how these systems interact with various APIs, for reliable integrations and efficient communication.
By defining machine-readable API specifications, OpenAPI allows AI models like GPTs to understand and use varied data sources, improving accuracy. This accelerates development, reduces errors, and provides context-aware responses, making OpenAPI a core component for AI applications.
You can download the OpenAPI definitions for Dataset Schema Super Actor from the options below:
If you’d like to learn more about how OpenAPI powers GPTs, read our blog post.
You can also check out our other API clients: