diff options
| author | Bobby <[email protected]> | 2022-12-04 17:39:01 -0500 |
|---|---|---|
| committer | Bobby <[email protected]> | 2022-12-04 17:39:01 -0500 |
| commit | 131ca6891b9941da42c729168481296eaab4a47e (patch) | |
| tree | 3b393dda127afa13923b9de34064d639c3e340ac /src/helpers | |
| parent | 6c4431b68b3accd51bc32b98a828d1b149213d85 (diff) | |
| download | RedditEngagementPrediction-131ca6891b9941da42c729168481296eaab4a47e.tar.xz RedditEngagementPrediction-131ca6891b9941da42c729168481296eaab4a47e.zip | |
Fixed Plots
Diffstat (limited to 'src/helpers')
| -rw-r--r-- | src/helpers/preprocessor.py | 2 |
1 files changed, 1 insertions, 1 deletions
```diff
diff --git a/src/helpers/preprocessor.py b/src/helpers/preprocessor.py
index d358d69..9c58b24 100644
--- a/src/helpers/preprocessor.py
+++ b/src/helpers/preprocessor.py
@@ -62,7 +62,7 @@ class Preprocessor:
         self.df['day'] = self.df['created_utc'].dt.day_name()
         # self.df.drop('created_utc', axis=1, inplace=True)
 
-        cols_to_keep = ['title', 'selftext', 'link_flair_text', 'subreddit', 'ups', 'num_comments', 'hour', 'day', 'distinguished', 'author_premium', 'subreddit_subscribers', 'author', 'score', 'created_utc', 'upvote_ratio']
+        cols_to_keep = ['title', 'selftext', 'link_flair_text', 'subreddit', 'ups', 'num_comments', 'hour', 'day', 'distinguished', 'author_premium', 'subreddit_subscribers', 'author', 'score', 'created_utc', 'upvote_ratio', 'total_awards_received']
         self.df = self.df[cols_to_keep]
 
         # "distinguished" coloumn has 2 values - "moderator" and "" - We can convert this to a boolean column
```
