# Extract Reddit Comments for Sentiment Analysis

**Use case:** Pull the full comment thread from a Reddit post — scores, authors, depth, and timestamps — ready for sentiment or NLP analysis.

## Input

```json
{
  "postUrls": [
    {
      "url": "https://www.reddit.com/r/technology/comments/1abcd23/example_thread/"
    }
  ],
  "maxCommentsPerPost": 2000,
  "includeNSFW": false,
  "proxy": {
    "useApifyProxy": true,
    "apifyProxyGroups": [
      "RESIDENTIAL"
    ]
  }
}
```

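## Output

The block below is a field reference rather than a sample record: each key is an output field name, mapped to its display label and value format.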

```json
{
  "dataType": {
    "label": "Type",
    "format": "text"
  },
  "title": {
    "label": "Title",
    "format": "text"
  },
  "name": {
    "label": "Name",
    "format": "text"
  },
  "body": {
    "label": "Content",
    "format": "text"
  },
  "authorName": {
    "label": "Author",
    "format": "text"
  },
  "communityName": {
    "label": "Community",
    "format": "text"
  },
  "subredditName": {
    "label": "Subreddit",
    "format": "text"
  },
  "upVotes": {
    "label": "Upvotes",
    "format": "number"
  },
  "commentUpVotes": {
    "label": "Comment Upvotes",
    "format": "number"
  },
  "membersCount": {
    "label": "Members",
    "format": "number"
  },
  "commentsCount": {
    "label": "Comments Count",
    "format": "number"
  },
  "onlineUsersCount": {
    "label": "Online Users",
    "format": "number"
  },
  "postUrl": {
    "label": "Post URL",
    "format": "link"
  },
  "url": {
    "label": "URL",
    "format": "link"
  },
  "createdAt": {
    "label": "Created",
    "format": "date"
  },
  "commentCreatedAt": {
    "label": "Comment Created",
    "format": "date"
  },
  "crawledAt": {
    "label": "Crawled",
    "format": "date"
  },
  "searchTerm": {
    "label": "Search Term",
    "format": "text"
  },
  "id": {
    "label": "ID",
    "format": "text"
  },
  "parsedId": {
    "label": "Parsed ID",
    "format": "text"
  },
  "postTitle": {
    "label": "Post Title",
    "format": "text"
  },
  "postType": {
    "label": "Post Type",
    "format": "text"
  },
  "flair": {
    "label": "Flair",
    "format": "text"
  },
  "contentUrl": {
    "label": "Content URL",
    "format": "link"
  },
  "images": {
    "label": "Images",
    "format": "array"
  },
  "bodyHtml": {
    "label": "Content HTML",
    "format": "text"
  },
  "authorId": {
    "label": "Author ID",
    "format": "text"
  },
  "parsedAuthorId": {
    "label": "Parsed Author ID",
    "format": "text"
  },
  "communityId": {
    "label": "Community ID",
    "format": "text"
  },
  "parsedCommunityId": {
    "label": "Parsed Community ID",
    "format": "text"
  },
  "parsedCommunityName": {
    "label": "Parsed Community",
    "format": "text"
  },
  "subredditId": {
    "label": "Subreddit ID",
    "format": "text"
  },
  "parsedSubredditId": {
    "label": "Parsed Subreddit ID",
    "format": "text"
  },
  "postId": {
    "label": "Post ID",
    "format": "text"
  },
  "parsedPostId": {
    "label": "Parsed Post ID",
    "format": "text"
  },
  "parentId": {
    "label": "Parent ID",
    "format": "text"
  },
  "parsedParentId": {
    "label": "Parsed Parent ID",
    "format": "text"
  },
  "postUpVotes": {
    "label": "Post Upvotes",
    "format": "number"
  },
  "postCommentsCount": {
    "label": "Post Comments",
    "format": "number"
  },
  "postCreatedAt": {
    "label": "Post Created",
    "format": "date"
  },
  "description": {
    "label": "Description",
    "format": "text"
  },
  "publicDescription": {
    "label": "Public Description",
    "format": "text"
  },
  "communityIcon": {
    "label": "Community Icon",
    "format": "image"
  },
  "bannerImage": {
    "label": "Banner Image",
    "format": "image"
  },
  "nsfw": {
    "label": "NSFW",
    "format": "boolean"
  },
  "username": {
    "label": "Username",
    "format": "text"
  },
  "totalKarma": {
    "label": "Total Karma",
    "format": "number"
  },
  "linkKarma": {
    "label": "Link Karma",
    "format": "number"
  },
  "commentKarma": {
    "label": "Comment Karma",
    "format": "number"
  },
  "awardeeKarma": {
    "label": "Awardee Karma",
    "format": "number"
  },
  "awarderKarma": {
    "label": "Awarder Karma",
    "format": "number"
  },
  "isGold": {
    "label": "Gold",
    "format": "boolean"
  },
  "isMod": {
    "label": "Moderator",
    "format": "boolean"
  },
  "isEmployee": {
    "label": "Reddit Employee",
    "format": "boolean"
  },
  "hasVerifiedEmail": {
    "label": "Verified Email",
    "format": "boolean"
  },
  "verified": {
    "label": "Verified",
    "format": "boolean"
  },
  "iconImg": {
    "label": "Avatar",
    "format": "image"
  },
  "snoovatarImg": {
    "label": "Snoovatar",
    "format": "image"
  },
  "acceptFollowers": {
    "label": "Accepts Followers",
    "format": "boolean"
  },
  "bio": {
    "label": "Bio",
    "format": "text"
  },
  "followersCount": {
    "label": "Followers",
    "format": "number"
  },
  "bannerImg": {
    "label": "Banner Image",
    "format": "image"
  },
  "profileUrl": {
    "label": "Profile URL",
    "format": "link"
  },
  "score": {
    "label": "Score",
    "format": "number"
  },
  "upvoteRatio": {
    "label": "Upvote Ratio",
    "format": "number"
  },
  "over18": {
    "label": "NSFW (18+)",
    "format": "boolean"
  },
  "isSelf": {
    "label": "Self Post",
    "format": "boolean"
  },
  "isVideo": {
    "label": "Video",
    "format": "boolean"
  },
  "isGallery": {
    "label": "Gallery",
    "format": "boolean"
  },
  "spoiler": {
    "label": "Spoiler",
    "format": "boolean"
  },
  "locked": {
    "label": "Locked",
    "format": "boolean"
  },
  "hidden": {
    "label": "Hidden",
    "format": "boolean"
  },
  "archived": {
    "label": "Archived",
    "format": "boolean"
  },
  "pinned": {
    "label": "Pinned",
    "format": "boolean"
  },
  "stickied": {
    "label": "Stickied",
    "format": "boolean"
  },
  "edited": {
    "label": "Edited",
    "format": "boolean"
  },
  "editedAt": {
    "label": "Edited At",
    "format": "date"
  },
  "distinguished": {
    "label": "Distinguished",
    "format": "text"
  },
  "scoreHidden": {
    "label": "Score Hidden",
    "format": "boolean"
  },
  "isOriginalContent": {
    "label": "Original Content (OC)",
    "format": "boolean"
  },
  "numCrossposts": {
    "label": "Crossposts",
    "format": "number"
  },
  "totalAwardsReceived": {
    "label": "Awards",
    "format": "number"
  },
  "gilded": {
    "label": "Gilded",
    "format": "number"
  },
  "domain": {
    "label": "Domain",
    "format": "text"
  },
  "thumbnail": {
    "label": "Thumbnail",
    "format": "image"
  },
  "urlOverriddenByDest": {
    "label": "Outbound URL",
    "format": "link"
  },
  "subredditSubscribers": {
    "label": "Subreddit Subscribers",
    "format": "number"
  },
  "authorFlairText": {
    "label": "Author Flair",
    "format": "text"
  },
  "authorPremium": {
    "label": "Author Premium",
    "format": "boolean"
  },
  "numDuplicates": {
    "label": "Duplicates",
    "format": "number"
  },
  "removedByCategory": {
    "label": "Removed By Category",
    "format": "text"
  },
  "removedBy": {
    "label": "Removed By",
    "format": "text"
  },
  "bannedBy": {
    "label": "Banned By",
    "format": "text"
  },
  "removalReason": {
    "label": "Removal Reason",
    "format": "text"
  },
  "modReasonTitle": {
    "label": "Mod Reason Title",
    "format": "text"
  },
  "isRobotIndexable": {
    "label": "Robot Indexable",
    "format": "boolean"
  },
  "mediaType": {
    "label": "Media Type",
    "format": "text"
  },
  "hasMedia": {
    "label": "Has Media",
    "format": "boolean"
  },
  "galleryCount": {
    "label": "Gallery Count",
    "format": "number"
  },
  "galleryImages": {
    "label": "Gallery Images",
    "format": "array"
  },
  "mediaAssets": {
    "label": "Media Assets",
    "format": "array"
  },
  "videoUrl": {
    "label": "Video URL",
    "format": "link"
  },
  "media": {
    "label": "Media (raw)",
    "format": "object"
  },
  "secureMedia": {
    "label": "Secure Media (raw)",
    "format": "object"
  },
  "mediaMetadata": {
    "label": "Media Metadata (raw)",
    "format": "object"
  },
  "galleryData": {
    "label": "Gallery Data (raw)",
    "format": "object"
  },
  "ageHours": {
    "label": "Age (hours)",
    "format": "number"
  },
  "scorePerHour": {
    "label": "Score / Hour",
    "format": "number"
  },
  "commentsPerHour": {
    "label": "Comments / Hour",
    "format": "number"
  },
  "engagementTotal": {
    "label": "Engagement Total",
    "format": "number"
  },
  "commentToScoreRatio": {
    "label": "Comment:Score Ratio",
    "format": "number"
  },
  "isHighEngagement": {
    "label": "High Engagement",
    "format": "boolean"
  },
  "titleLength": {
    "label": "Title Length",
    "format": "number"
  },
  "bodyLength": {
    "label": "Body Length",
    "format": "number"
  },
  "wordCount": {
    "label": "Word Count",
    "format": "number"
  },
  "outboundUrlHost": {
    "label": "Outbound Host",
    "format": "text"
  },
  "authorFullname": {
    "label": "Author Fullname",
    "format": "text"
  },
  "parentKind": {
    "label": "Parent Kind",
    "format": "text"
  },
  "depth": {
    "label": "Comment Depth",
    "format": "number"
  },
  "controversiality": {
    "label": "Controversiality",
    "format": "number"
  },
  "isSubmitter": {
    "label": "Is OP",
    "format": "boolean"
  },
  "collapsed": {
    "label": "Collapsed",
    "format": "boolean"
  },
  "collapsedReason": {
    "label": "Collapsed Reason",
    "format": "text"
  }
}
```

## About this Actor

This example demonstrates how to use [Reddit Comment Scraper - Export Comments & Replies ($1.5/1k)](https://apify.com/harshmaur/reddit-comments-scraper) with a specific input configuration. Visit the [Actor detail page](https://apify.com/harshmaur/reddit-comments-scraper) to learn more, explore other use cases, and run it yourself.