This actor uses the GPT-2 language model to generate text.
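For context, here is a minimal sketch of how a user might start this actor through the Apify API client for Python and read the generated text from the run's default dataset. The actor ID is a placeholder, and the exact client calls may differ between client versions.

import os
from apify_client import ApifyClient

# Placeholder actor ID and API token - replace with your own values
client = ApifyClient(os.environ['APIFY_TOKEN'])
run = client.actor('<username>/<actor-name>').call(run_input={
    'prompt': 'My name is Apify and I like to',
    'max_length': 30,
})

# The actor pushes the generated text to its default dataset (see main.py below)
for item in client.dataset(run['defaultDatasetId']).iterate_items():
    print(item['generated_text'])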

.dockerignore
# configurations
.idea
# crawlee and apify storage folders
apify_storage
crawlee_storage
storage
# installed files
node_modules
# git folder
.git
Dockerfile
FROM huggingface/transformers-pytorch-gpu
COPY requirements.txt ./
RUN echo "Python version:" \
&& python3 --version \
&& echo "Pip version:" \
&& pip --version \
&& echo "Installing dependencies from requirements.txt:" \
&& pip install -r requirements.txt \
&& echo "All installed Python packages:" \
&& pip freeze
COPY . ./
# Pre-download the GPT-2 model so its weights are cached inside the image instead of being fetched on every run
RUN python3 -c 'from transformers import pipeline; generator = pipeline("text-generation", model="gpt2")'
CMD python3 main.py
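The last RUN instruction downloads the GPT-2 weights while the image is being built, so actor runs do not have to fetch them from the Hugging Face Hub on every start. A quick local check of that cache is sketched below; it assumes the installed transformers version supports the TRANSFORMERS_OFFLINE environment variable.

import os

# Allow only locally cached model files (assumption: offline mode is supported by the installed transformers version)
os.environ['TRANSFORMERS_OFFLINE'] = '1'

from transformers import pipeline

# Loads from the cache baked into the image; this would raise an error if the model files were missing
generator = pipeline('text-generation', model='gpt2')
print(generator('My name is Apify and I like to', max_length=30, num_return_sequences=1))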
INPUT_SCHEMA.json
{
    "title": "Generate text",
    "description": "This is the input schema of the actor",
    "type": "object",
    "schemaVersion": 1,
    "properties": {
        "prompt": {
            "title": "Initial prompt",
            "type": "string",
            "description": "The initial prompt used as the basis for text generation",
            "default": "My name is Apify and I like to",
            "editor": "textarea"
        },
        "max_length": {
            "title": "Maximum sequence length",
            "type": "integer",
            "description": "The maximum length of the generated sequence",
            "default": 30,
            "editor": "number"
        }
    },
    "required": [
        "prompt",
        "max_length"
    ]
}
README.md
# GPT-2 text generation
This actor uses the GPT-2 language model to generate text.
For more information about the model, see [https://huggingface.co/gpt2](https://huggingface.co/gpt2).
main.py
import os
from transformers import pipeline
from apify_client import ApifyClient
if __name__ == '__main__':
    # Initialize the Apify client from the environment variables provided by the platform
    client = ApifyClient(os.environ['APIFY_TOKEN'], api_url=os.environ['APIFY_API_BASE_URL'])

    # Read the actor input from the default key-value store
    default_kv_store_client = client.key_value_store(os.environ['APIFY_DEFAULT_KEY_VALUE_STORE_ID'])
    actor_input = default_kv_store_client.get_record(os.environ['APIFY_INPUT_KEY'])['value']

    # Generate one sequence from the prompt with the GPT-2 text-generation pipeline
    generator = pipeline('text-generation', model='gpt2')
    output = generator(actor_input["prompt"], max_length=actor_input["max_length"], num_return_sequences=1)

    # Store the generated text in the actor's default dataset
    default_dataset_client = client.dataset(os.environ['APIFY_DEFAULT_DATASET_ID'])
    default_dataset_client.push_items(output)
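For reference, the text-generation pipeline returns a list with one dictionary per generated sequence, so with num_return_sequences=1 the dataset receives a single item with a generated_text field, shaped roughly like this (the text itself is just a placeholder):

# Illustrative shape of `output` as pushed to the default dataset; the actual text will vary
output = [
    {'generated_text': 'My name is Apify and I like to ...'}
]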
requirements.txt
# Add your dependencies here.
# See https://pip.pypa.io/en/latest/cli/pip_install/#requirements-file-format
# for how to format them
# transformers and torch are not listed here because the huggingface/transformers-pytorch-gpu base image already provides them
apify_client