Reddit Data Huge
A dataset of Reddit posts and comments collected from a variety of subreddits.
@kaggle.prakharrathi25_reddit_data_huge
A dataset of Reddit posts and comments collected from a variety of subreddits.
@kaggle.prakharrathi25_reddit_data_huge
Reddit is a collection of forums where people can share news and content as a thread or comment on other people’s posts. Reddit is broken up into more than a million communities known as “subreddits,” each of which covers a different topic. The name of a subreddit begins with /r/, which is part of the URLs that Reddit uses. For example, /r/nba is a subreddit where people talk about the National Basketball Association, while /r/boardgames is a subreddit for people to discuss board games.
In this dataset, I have added data from many different subreddits. It is intended as an NLP gold mine for social media analysis, and it can help people understand what young people are talking about.
I collected the data myself, following the method described in this article.
-- adviceforteens_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE adviceforteens_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- anxiety_reddit_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE anxiety_reddit_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- applyingtocollege_data: Reddit posts and their comments, one of the
-- per-subreddit tables of this dataset (presumably the subreddit named in the
-- table name; verify against the "subreddit" column).
CREATE TABLE applyingtocollege_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- astrology_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE astrology_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- business_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE business_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- careerguidance_data: Reddit posts and their comments, one of the
-- per-subreddit tables of this dataset (presumably the subreddit named in the
-- table name; verify against the "subreddit" column).
CREATE TABLE careerguidance_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- college: Reddit posts and their comments. Unlike the "*_data" tables in this
-- file, this table has no "unnamed_0" column and lists its columns in a
-- different order.
CREATE TABLE college (
    "id"            VARCHAR,
    "title"         VARCHAR,
    "body"          VARCHAR,
    "subreddit"     VARCHAR,
    "upvotes"       BIGINT,
    "url"           VARCHAR,
    "is_original"   BOOLEAN,
    "flair"         VARCHAR,
    "num_comments"  BIGINT,
    "comments"      VARCHAR,
    "creation_date" TIMESTAMP
);

-- college_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE college_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- colombia_reddit_data: Reddit posts and their comments, one of the
-- per-subreddit tables of this dataset (presumably the subreddit named in the
-- table name; verify against the "subreddit" column).
CREATE TABLE colombia_reddit_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- computer_science_data: Reddit posts and their comments, one of the
-- per-subreddit tables of this dataset (presumably the subreddit named in the
-- table name; verify against the "subreddit" column).
CREATE TABLE computer_science_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- covid19_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE covid19_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- dating_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE dating_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- depression_reddit_data: Reddit posts and their comments, one of the
-- per-subreddit tables of this dataset (presumably the subreddit named in the
-- table name; verify against the "subreddit" column).
CREATE TABLE depression_reddit_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- employment_reddit_data: Reddit posts and their comments, one of the
-- per-subreddit tables of this dataset (presumably the subreddit named in the
-- table name; verify against the "subreddit" column).
CREATE TABLE employment_reddit_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- engineering_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE engineering_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- entrepreneur_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE entrepreneur_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- feminism_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE feminism_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- gradschool_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE gradschool_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- high_school: Reddit posts and their comments. Unlike the "*_data" tables in
-- this file, this table has no "unnamed_0" column and lists its columns in a
-- different order.
CREATE TABLE high_school (
    "id"            VARCHAR,
    "title"         VARCHAR,
    "body"          VARCHAR,
    "subreddit"     VARCHAR,
    "upvotes"       BIGINT,
    "url"           VARCHAR,
    "is_original"   BOOLEAN,
    "flair"         VARCHAR,
    "num_comments"  BIGINT,
    "comments"      VARCHAR,
    "creation_date" TIMESTAMP
);

-- kidsrights_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE kidsrights_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- merged_reddit_data: a differently shaped table with "text" and "sentiment"
-- columns in place of the title/body/comments columns of the per-subreddit
-- tables (presumably a merged, sentiment-labelled view of them -- confirm).
-- NOTE(review): "unnamed_0" is VARCHAR here but BIGINT in the other tables.
CREATE TABLE merged_reddit_data (
    "unnamed_0" VARCHAR, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "flair" VARCHAR,
    "subreddit" VARCHAR,
    "text" VARCHAR,
    "sentiment" VARCHAR,
    "creation_date" TIMESTAMP,
    "upvotes" BIGINT
);

-- mexico_spanishlanguage_reddit_data: Reddit posts and their comments, one of
-- the per-subreddit tables of this dataset (presumably the subreddit(s) named
-- in the table name; verify against the "subreddit" column).
CREATE TABLE mexico_spanishlanguage_reddit_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- neutralpolitics_data: Reddit posts and their comments, one of the
-- per-subreddit tables of this dataset (presumably the subreddit named in the
-- table name; verify against the "subreddit" column).
CREATE TABLE neutralpolitics_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- povertyfinance_data: Reddit posts and their comments, one of the
-- per-subreddit tables of this dataset (presumably the subreddit named in the
-- table name; verify against the "subreddit" column).
CREATE TABLE povertyfinance_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);

-- science_data: Reddit posts and their comments, one of the per-subreddit
-- tables of this dataset (presumably the subreddit named in the table name;
-- verify against the "subreddit" column).
CREATE TABLE science_data (
    "unnamed_0" BIGINT, -- source column label: "Unnamed: 0"
    "id" VARCHAR,
    "is_original" BOOLEAN,
    "flair" VARCHAR,
    "num_comments" BIGINT,
    "title" VARCHAR,
    "subreddit" VARCHAR,
    "body" VARCHAR,
    "url" VARCHAR,
    "upvotes" BIGINT,
    "comments" VARCHAR,
    "creation_date" TIMESTAMP
);
Anyone who has the link will be able to view this.