diff options
| author | Bobby <[email protected]> | 2022-12-02 19:02:33 -0500 |
|---|---|---|
| committer | GitHub <[email protected]> | 2022-12-02 19:02:33 -0500 |
| commit | 6496fb95432618f64cf23be0cd0eac362b3af3ed (patch) | |
| tree | 2b55c918af459621d2a0d15f3f345171e6721520 /src/windows/modeltrainer.py | |
| parent | af2ada7022d75411f2d74a4a4d2c95dfe3eb2e3a (diff) | |
| parent | 2fbbc2c07f306c6edd1ab543b03b6fc905b9fa3a (diff) | |
| download | RedditEngagementPrediction-6496fb95432618f64cf23be0cd0eac362b3af3ed.tar.xz RedditEngagementPrediction-6496fb95432618f64cf23be0cd0eac362b3af3ed.zip | |
Merge pull request #9 from luciferreeves/main
Reqs added
Diffstat (limited to 'src/windows/modeltrainer.py')
| -rw-r--r-- | src/windows/modeltrainer.py | 2 |
1 files changed, 1 insertions, 1 deletions
diff --git a/src/windows/modeltrainer.py b/src/windows/modeltrainer.py
index 25b49c9..1d332fe 100644
--- a/src/windows/modeltrainer.py
+++ b/src/windows/modeltrainer.py
@@ -148,7 +148,7 @@ class ModelTrainer(customtkinter.CTkToplevel):
         # select only text, subreddit, link_flair_text, distinguished, hour, day, ups, num_comments
         self.posts_ups = self.posts[self.categorical_features + self.text_features + ['ups']]
         self.posts_num_comments = self.posts[self.categorical_features + self.text_features + ['num_comments']]
-        self.tfidf = TfidfVectorizer(sublinear_tf=True, min_df=5, norm='l2', encoding='latin-1', ngram_range=(1, 2), stop_words='english')
+        self.tfidf = TfidfVectorizer()
         self.label_binarizer = LabelBinarizer()
 
         self.edit_textbox('Preparing Data (Upvotes)', 1, 'wait')
