diff options
| -rw-r--r-- | .DS_Store | bin | 0 -> 6148 bytes | |||
| -rw-r--r-- | Report/report.aux | 32 | ||||
| -rw-r--r-- | Report/report.fdb_latexmk | 63 | ||||
| -rw-r--r-- | Report/report.fls | 210 | ||||
| -rw-r--r-- | Report/report.log | 219 | ||||
| -rw-r--r-- | Report/report.pdf | bin | 0 -> 11378187 bytes | |||
| -rw-r--r-- | Report/report.synctex.gz | bin | 0 -> 28856 bytes | |||
| -rw-r--r-- | Report/report.tex | 201 | ||||
| -rw-r--r-- | images/author_rank.png | bin | 0 -> 2006057 bytes | |||
| -rw-r--r-- | images/awards_per_subreddit.png | bin | 0 -> 1125589 bytes | |||
| -rw-r--r-- | images/best_time.png | bin | 0 -> 4431386 bytes | |||
| -rw-r--r-- | images/boxplot_scores.png | bin | 0 -> 242999 bytes | |||
| -rw-r--r-- | images/num_authors_multiple_subreddit.png | bin | 0 -> 129562 bytes | |||
| -rw-r--r-- | images/num_posts_per_day_per_subreddit.png | bin | 0 -> 1512397 bytes | |||
| -rw-r--r-- | images/num_posts_per_day_per_subreddit_bar.png | bin | 0 -> 1055979 bytes | |||
| -rw-r--r-- | images/num_posts_per_subreddit.png | bin | 0 -> 37293 bytes | |||
| -rw-r--r-- | images/num_subscribers_per_subreddit.png | bin | 0 -> 243280 bytes | |||
| -rw-r--r-- | images/pie_comments.png | bin | 0 -> 731818 bytes | |||
| -rw-r--r-- | images/post_multiple.png | bin | 0 -> 153345 bytes | |||
| -rw-r--r-- | images/scatterplot_scores.png | bin | 0 -> 1262190 bytes | |||
| -rw-r--r-- | project.ipynb | 6 |
21 files changed, 728 insertions, 3 deletions
diff --git a/.DS_Store b/.DS_Store Binary files differnew file mode 100644 index 0000000..e865e23 --- /dev/null +++ b/.DS_Store diff --git a/Report/report.aux b/Report/report.aux new file mode 100644 index 0000000..bc9d848 --- /dev/null +++ b/Report/report.aux @@ -0,0 +1,32 @@ +\relax +\@writefile{toc}{\contentsline {section}{\numberline {1}Motivation \& Problem Statement}{1}{}\protected@file@percent } +\@writefile{toc}{\contentsline {subsection}{\numberline {1.1}Motivation}{1}{}\protected@file@percent } +\@writefile{toc}{\contentsline {subsection}{\numberline {1.2}Problem Statement}{1}{}\protected@file@percent } +\@writefile{toc}{\contentsline {section}{\numberline {2}Data Collection}{2}{}\protected@file@percent } +\@writefile{toc}{\contentsline {section}{\numberline {3}Data Cleaning \& Preprocessing}{2}{}\protected@file@percent } +\@writefile{toc}{\contentsline {section}{\numberline {4}Expolaratory Data Analysis}{4}{}\protected@file@percent } +\@writefile{lof}{\contentsline {figure}{\numberline {1}{\ignorespaces Number of Posts per Subreddit}}{4}{}\protected@file@percent } +\newlabel{fig:posts_per_subreddit}{{1}{4}} +\@writefile{lof}{\contentsline {figure}{\numberline {2}{\ignorespaces Number of Subscribers per Subreddit}}{4}{}\protected@file@percent } +\newlabel{fig:subscribers_per_subreddit}{{2}{4}} +\@writefile{lof}{\contentsline {figure}{\numberline {3}{\ignorespaces Number of Authors who post in multiple subreddits}}{5}{}\protected@file@percent } +\newlabel{fig:authors_per_subreddit}{{3}{5}} +\@writefile{lof}{\contentsline {figure}{\numberline {4}{\ignorespaces Does posting in multiple subreddits drives more upvotes?}}{5}{}\protected@file@percent } +\newlabel{fig:upvotes_per_subreddit}{{4}{5}} +\@writefile{lof}{\contentsline {figure}{\numberline {5}{\ignorespaces History of posts per day per subreddit}}{6}{}\protected@file@percent } +\newlabel{fig:history_posts_per_day}{{5}{6}} +\@writefile{lof}{\contentsline {figure}{\numberline {6}{\ignorespaces Number of 
posts per day per subreddit}}{7}{}\protected@file@percent } +\newlabel{fig:posts_per_day}{{6}{7}} +\@writefile{lof}{\contentsline {figure}{\numberline {7}{\ignorespaces Top 10 Authors Per Subreddit}}{8}{}\protected@file@percent } +\newlabel{fig:top_authors_per_subreddit}{{7}{8}} +\@writefile{lof}{\contentsline {figure}{\numberline {8}{\ignorespaces Best Time to Post on each Subreddit}}{9}{}\protected@file@percent } +\newlabel{fig:best_time_to_post}{{8}{9}} +\@writefile{lof}{\contentsline {figure}{\numberline {9}{\ignorespaces Scatterplot of the scores vs number of comments in each subreddit}}{10}{}\protected@file@percent } +\newlabel{fig:score_vs_comments}{{9}{10}} +\@writefile{lof}{\contentsline {figure}{\numberline {10}{\ignorespaces \% of Authors opted to receive comment notifications per Subreddit}}{11}{}\protected@file@percent } +\newlabel{fig:comment_notifications}{{10}{11}} +\@writefile{lof}{\contentsline {figure}{\numberline {11}{\ignorespaces Total Awards Received vs Upvotes per Subreddit}}{12}{}\protected@file@percent } +\newlabel{fig:awards_vs_upvotes}{{11}{12}} +\@writefile{lof}{\contentsline {figure}{\numberline {12}{\ignorespaces Boxplot of the scores in each subreddit}}{13}{}\protected@file@percent } +\newlabel{fig:boxplot}{{12}{13}} +\gdef \@abspage@last{13} diff --git a/Report/report.fdb_latexmk b/Report/report.fdb_latexmk new file mode 100644 index 0000000..0ad9fcd --- /dev/null +++ b/Report/report.fdb_latexmk @@ -0,0 +1,63 @@ +# Fdb version 3 +["pdflatex"] 1666048237 "/Users/lucifer/Documents/projects/EAS_504/Report/report.tex" "report.pdf" "report" 1666048261 + "../images//author_rank.png" 1666045294 2006057 345c0b5d7d2bb0a0e926c00e389b9612 "" + "../images//awards_per_subreddit.png" 1666045387 1125589 022c541cb180b8fe49ebbd79db07c94d "" + "../images//best_time.png" 1666045309 4431386 c75b5a1b588df07ca81e6921bdeb2700 "" + "../images//boxplot_scores.png" 1666045330 242999 380a6526c63ceb5362a485227f201b06 "" + 
"../images//num_authors_multiple_subreddit.png" 1666045233 129562 dc750bcef04fb6fef25719efdff1a8f1 "" + "../images//num_posts_per_day_per_subreddit.png" 1666045280 1512397 067710348f63aced645f9134b0fd4e97 "" + "../images//num_posts_per_day_per_subreddit_bar.png" 1666045414 1055979 282192d6073c5fd035498015f019fa67 "" + "../images//num_posts_per_subreddit.png" 1666044839 37293 65a67f600c625d9b6342f3f02d7c37b6 "" + "../images//num_subscribers_per_subreddit.png" 1666045213 243280 255c720ac174b7f4f4928b6915591fc3 "" + "../images//pie_comments.png" 1666045361 731818 270554f72eabe179f1bb8f628dcf4e8a "" + "../images//post_multiple.png" 1666045255 153345 e95c92a767ac26dfce6aeb8a81cfc324 "" + "../images//scatterplot_scores.png" 1666045346 1262190 4d28182fe25b1f07c52d432f475d9a14 "" + "/Users/lucifer/Documents/projects/EAS_504/Report/report.tex" 1666048217 10957 eafabae6bfd1c4c26dbaf75b6088d89c "" + "/usr/local/texlive/2022/texmf-dist/fonts/enc/dvips/cm-super/cm-super-ts1.enc" 1136849721 2900 1537cc8184ad1792082cd229ecc269f4 "" + "/usr/local/texlive/2022/texmf-dist/fonts/map/fontname/texfonts.map" 1577235249 3524 cb3e574dea2d1052e39280babc910dc8 "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/jknappen/ec/tcrm1200.tfm" 1136768653 1536 74b7293ec3713bb7fdca8dd1bd1f469c "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmbx12.tfm" 1136768653 1324 c910af8c371558dc20f2d7822f66fe64 "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmmi12.tfm" 1136768653 1524 4414a8315f39513458b80dfc63bff03a "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmmi6.tfm" 1136768653 1512 f21f83efb36853c0b70002322c1ab3ad "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmmi8.tfm" 1136768653 1520 eccf95517727cb11801f4f1aee3a21b4 "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr12.tfm" 1136768653 1288 655e228510b4c2a1abe905c368440826 "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr17.tfm" 1136768653 1292 
296a67155bdbfc32aa9c636f21e91433 "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr6.tfm" 1136768653 1300 b62933e007d01cfd073f79b963c01526 "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr8.tfm" 1136768653 1292 21c1c5bfeaebccffdb478fd231a0997d "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmsy10.tfm" 1136768653 1124 6c73e740cf17375f03eec0ee63599741 "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmsy6.tfm" 1136768653 1116 933a60c408fc0a863a92debe84b2d294 "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmsy8.tfm" 1136768653 1120 8b7d695260f3cff42e636090a8002094 "" + "/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmtt12.tfm" 1136768653 772 9a936b7f5e2ff0557fce0f62822f0bbf "" + "/usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmbx12.pfb" 1248133631 32080 340ef9bf63678554ee606688e7b5339d "" + "/usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr10.pfb" 1248133631 35752 024fb6c41858982481f6968b5fc26508 "" + "/usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr12.pfb" 1248133631 32722 d7379af29a190c3f453aba36302ff5a9 "" + "/usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr17.pfb" 1248133631 32362 179c33bbf43f19adbb3825bb4e36e57a "" + "/usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr7.pfb" 1248133631 32762 224316ccc9ad3ca0423a14971cfa7fc1 "" + "/usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr8.pfb" 1248133631 32726 0a1aea6fcd6468ee2cf64d891f5c43c8 "" + "/usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmsy10.pfb" 1248133631 32569 5e5ddc8df908dea60932f3c484a54c0d "" + "/usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmtt12.pfb" 1248133631 24252 1e4e051947e12dfb50fee0b7f4e26e3a "" + "/usr/local/texlive/2022/texmf-dist/fonts/type1/public/cm-super/sfrm1200.pfb" 1215737283 136101 f533469f523533d38317ab5729d00c8a "" + 
"/usr/local/texlive/2022/texmf-dist/tex/context/base/mkii/supp-pdf.mkii" 1461363279 71627 94eb9990bed73c364d7f53f960cc8c5b "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls" 1654720880 20144 7555b7429d80bef287ebb82117811acc "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/base/size12.clo" 1654720880 8449 7fbdc9c8596083427317c1e525489c81 "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty" 1579991033 13886 d1306dcf79a944f6988e688c1785f9ce "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty" 1137110151 6749 16d2656a1984957e674b149555f1ea1d "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/graphics-cfg/graphics.cfg" 1465944070 1224 978390e9c2234eab29404bc21b268d1e "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/graphics-def/pdftex.def" 1601931164 19103 48d29b6e2a64cb717117ef65f107b404 "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty" 1654720880 18387 8f900a490197ebaf93c02ae9476d4b09 "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty" 1654720880 8010 a8d949cbdbc5c983593827c9eec252e1 "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty" 1654720880 2671 7e67d78d9b88c845599a85b2d41f2e39 "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty" 1654720880 4023 293ea1c16429fc0c4cf605f4da1791a9 "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def" 1661977202 30282 33c465a64f2bd5ad4a68a7b2f555a29b "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/latexconfig/epstopdf-sys.cfg" 1279039959 678 4792914a8f45be57bb98413425e4c7af "" + "/usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty" 1137110779 22423 d476012cd03f82f9475ad54ba6cd3267 "" + "/usr/local/texlive/2022/texmf-dist/web2c/texmf.cnf" 1646502317 40171 cdab547de63d26590bebb3baff566530 "" + "/usr/local/texlive/2022/texmf-var/fonts/map/pdftex/updmap/pdftex.map" 1663570351 4595816 106c4e272f709332e200b7ab82c17944 "" + 
"/usr/local/texlive/2022/texmf-var/web2c/pdftex/pdflatex.fmt" 1663570397 3058617 cd9771818186ae15ff6f2cbe82ec8a81 "" + "/usr/local/texlive/2022/texmf.cnf" 1647878952 577 209b46be99c9075fd74d4c0369380e8c "" + "report.aux" 1666048261 2985 cbf72b8d9c61d13f3f276ab9706b09c8 "pdflatex" + "report.tex" 1666048217 10957 eafabae6bfd1c4c26dbaf75b6088d89c "" + (generated) + "report.aux" + "report.log" + "report.pdf" diff --git a/Report/report.fls b/Report/report.fls new file mode 100644 index 0000000..ff5052c --- /dev/null +++ b/Report/report.fls @@ -0,0 +1,210 @@ +PWD /Users/lucifer/Documents/projects/EAS_504/Report +INPUT /usr/local/texlive/2022/texmf.cnf +INPUT /usr/local/texlive/2022/texmf-dist/web2c/texmf.cnf +INPUT /usr/local/texlive/2022/texmf-var/web2c/pdftex/pdflatex.fmt +INPUT /Users/lucifer/Documents/projects/EAS_504/Report/report.tex +OUTPUT report.log +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/size12.clo +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/size12.clo +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/size12.clo +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/base/size12.clo +INPUT /usr/local/texlive/2022/texmf-dist/fonts/map/fontname/texfonts.map +INPUT 
/usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr12.tfm +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT 
/usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics-cfg/graphics.cfg +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics-cfg/graphics.cfg +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics-cfg/graphics.cfg +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics-cfg/graphics.cfg +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics-def/pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics-def/pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics-def/pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/graphics-def/pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT 
/usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT 
/usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +INPUT ./report.aux +INPUT report.aux +INPUT report.aux +OUTPUT report.aux +INPUT /usr/local/texlive/2022/texmf-dist/tex/context/base/mkii/supp-pdf.mkii +INPUT /usr/local/texlive/2022/texmf-dist/tex/context/base/mkii/supp-pdf.mkii +INPUT /usr/local/texlive/2022/texmf-dist/tex/context/base/mkii/supp-pdf.mkii +INPUT /usr/local/texlive/2022/texmf-dist/tex/context/base/mkii/supp-pdf.mkii +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/latexconfig/epstopdf-sys.cfg +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/latexconfig/epstopdf-sys.cfg +INPUT /usr/local/texlive/2022/texmf-dist/tex/latex/latexconfig/epstopdf-sys.cfg +INPUT 
/usr/local/texlive/2022/texmf-dist/tex/latex/latexconfig/epstopdf-sys.cfg +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr17.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr12.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmmi12.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmsy10.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr17.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmbx12.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmbx12.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/jknappen/ec/tcrm1200.tfm +OUTPUT report.pdf +INPUT /usr/local/texlive/2022/texmf-var/fonts/map/pdftex/updmap/pdftex.map +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr8.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmr6.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmmi12.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmmi8.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmmi6.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmsy10.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmsy8.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmsy6.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmtt12.tfm +INPUT /usr/local/texlive/2022/texmf-dist/fonts/tfm/public/cm/cmbx12.tfm +INPUT ../images//num_posts_per_subreddit.png +INPUT ../images//num_posts_per_subreddit.png +INPUT ../images//num_posts_per_subreddit.png +INPUT ../images//num_posts_per_subreddit.png +INPUT ../images//num_subscribers_per_subreddit.png +INPUT ../images//num_subscribers_per_subreddit.png +INPUT ../images//num_subscribers_per_subreddit.png +INPUT ../images//num_subscribers_per_subreddit.png +INPUT ../images//num_authors_multiple_subreddit.png +INPUT ../images//num_authors_multiple_subreddit.png +INPUT 
../images//num_authors_multiple_subreddit.png +INPUT ../images//num_authors_multiple_subreddit.png +INPUT ../images//post_multiple.png +INPUT ../images//post_multiple.png +INPUT ../images//post_multiple.png +INPUT ../images//post_multiple.png +INPUT ../images//num_posts_per_day_per_subreddit.png +INPUT ../images//num_posts_per_day_per_subreddit.png +INPUT ../images//num_posts_per_day_per_subreddit.png +INPUT ../images//num_posts_per_day_per_subreddit.png +INPUT ../images//num_posts_per_day_per_subreddit_bar.png +INPUT ../images//num_posts_per_day_per_subreddit_bar.png +INPUT ../images//num_posts_per_day_per_subreddit_bar.png +INPUT ../images//num_posts_per_day_per_subreddit_bar.png +INPUT ../images//author_rank.png +INPUT ../images//author_rank.png +INPUT ../images//author_rank.png +INPUT ../images//author_rank.png +INPUT ../images//best_time.png +INPUT ../images//best_time.png +INPUT ../images//best_time.png +INPUT ../images//best_time.png +INPUT ../images//scatterplot_scores.png +INPUT ../images//scatterplot_scores.png +INPUT ../images//scatterplot_scores.png +INPUT ../images//scatterplot_scores.png +INPUT ../images//pie_comments.png +INPUT ../images//pie_comments.png +INPUT ../images//pie_comments.png +INPUT ../images//pie_comments.png +INPUT ../images//awards_per_subreddit.png +INPUT ../images//awards_per_subreddit.png +INPUT ../images//awards_per_subreddit.png +INPUT ../images//awards_per_subreddit.png +INPUT ../images//boxplot_scores.png +INPUT ../images//boxplot_scores.png +INPUT ../images//boxplot_scores.png +INPUT ../images//boxplot_scores.png +INPUT report.aux +INPUT /usr/local/texlive/2022/texmf-dist/fonts/enc/dvips/cm-super/cm-super-ts1.enc +INPUT /usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmbx12.pfb +INPUT /usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr10.pfb +INPUT /usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr12.pfb +INPUT 
/usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr17.pfb +INPUT /usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr7.pfb +INPUT /usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr8.pfb +INPUT /usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmsy10.pfb +INPUT /usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmtt12.pfb +INPUT /usr/local/texlive/2022/texmf-dist/fonts/type1/public/cm-super/sfrm1200.pfb diff --git a/Report/report.log b/Report/report.log new file mode 100644 index 0000000..7feb76c --- /dev/null +++ b/Report/report.log @@ -0,0 +1,219 @@ +This is pdfTeX, Version 3.141592653-2.6-1.40.24 (TeX Live 2022) (preloaded format=pdflatex 2022.9.19) 17 OCT 2022 19:10 +entering extended mode + restricted \write18 enabled. + file:line:error style messages enabled. + %&-line parsing enabled. +**/Users/lucifer/Documents/projects/EAS_504/Report/report.tex +(/Users/lucifer/Documents/projects/EAS_504/Report/report.tex +LaTeX2e <2022-06-01> patch level 5 +L3 programming layer <2022-08-30> (/usr/local/texlive/2022/texmf-dist/tex/latex/base/article.cls +Document Class: article 2021/10/04 v1.4n Standard LaTeX document class +(/usr/local/texlive/2022/texmf-dist/tex/latex/base/size12.clo +File: size12.clo 2021/10/04 v1.4n Standard LaTeX file (size option) +) +\c@part=\count185 +\c@section=\count186 +\c@subsection=\count187 +\c@subsubsection=\count188 +\c@paragraph=\count189 +\c@subparagraph=\count190 +\c@figure=\count191 +\c@table=\count192 +\abovecaptionskip=\skip47 +\belowcaptionskip=\skip48 +\bibindent=\dimen138 +) (/usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphicx.sty +Package: graphicx 2021/09/16 v1.2d Enhanced LaTeX Graphics (DPC,SPQR) + (/usr/local/texlive/2022/texmf-dist/tex/latex/graphics/keyval.sty +Package: keyval 2022/05/29 v1.15 key=value parser (DPC) +\KV@toks@=\toks16 +) (/usr/local/texlive/2022/texmf-dist/tex/latex/graphics/graphics.sty +Package: graphics 
2022/03/10 v1.4e Standard LaTeX Graphics (DPC,SPQR) + (/usr/local/texlive/2022/texmf-dist/tex/latex/graphics/trig.sty +Package: trig 2021/08/11 v1.11 sin cos tan (DPC) +) (/usr/local/texlive/2022/texmf-dist/tex/latex/graphics-cfg/graphics.cfg +File: graphics.cfg 2016/06/04 v1.11 sample graphics configuration +) +Package graphics Info: Driver file: pdftex.def on input line 107. + (/usr/local/texlive/2022/texmf-dist/tex/latex/graphics-def/pdftex.def +File: pdftex.def 2020/10/05 v1.2a Graphics/color driver for pdftex +)) +\Gin@req@height=\dimen139 +\Gin@req@width=\dimen140 +) (/usr/local/texlive/2022/texmf-dist/tex/latex/float/float.sty +Package: float 2001/11/08 v1.3d Float enhancements (AL) +\c@float@type=\count193 +\float@exts=\toks17 +\float@box=\box51 +\@float@everytoks=\toks18 +\@floatcapt=\box52 +) (/usr/local/texlive/2022/texmf-dist/tex/latex/sectsty/sectsty.sty +Package: sectsty 2002/02/25 v2.0.2 Commands to change all sectional heading styles + + +LaTeX Warning: Command \underbar has changed. + Check if current package is valid. + + +LaTeX Warning: Command \underline has changed. + Check if current package is valid. + +) (/usr/local/texlive/2022/texmf-dist/tex/latex/l3backend/l3backend-pdftex.def +File: l3backend-pdftex.def 2022-08-30 L3 backend support: PDF output (pdfTeX) +\l__color_backend_stack_int=\count194 +\l__pdf_internal_box=\box53 +) + +LaTeX Warning: Unused global option(s): + [letterpage]. + +(./report.aux) +\openout1 = `report.aux'. + +LaTeX Font Info: Checking defaults for OML/cmm/m/it on input line 17. +LaTeX Font Info: ... okay on input line 17. +LaTeX Font Info: Checking defaults for OMS/cmsy/m/n on input line 17. +LaTeX Font Info: ... okay on input line 17. +LaTeX Font Info: Checking defaults for OT1/cmr/m/n on input line 17. +LaTeX Font Info: ... okay on input line 17. +LaTeX Font Info: Checking defaults for T1/cmr/m/n on input line 17. +LaTeX Font Info: ... okay on input line 17. 
+LaTeX Font Info: Checking defaults for TS1/cmr/m/n on input line 17. +LaTeX Font Info: ... okay on input line 17. +LaTeX Font Info: Checking defaults for OMX/cmex/m/n on input line 17. +LaTeX Font Info: ... okay on input line 17. +LaTeX Font Info: Checking defaults for U/cmr/m/n on input line 17. +LaTeX Font Info: ... okay on input line 17. + (/usr/local/texlive/2022/texmf-dist/tex/context/base/mkii/supp-pdf.mkii +[Loading MPS to PDF converter (version 2006.09.02).] +\scratchcounter=\count195 +\scratchdimen=\dimen141 +\scratchbox=\box54 +\nofMPsegments=\count196 +\nofMParguments=\count197 +\everyMPshowfont=\toks19 +\MPscratchCnt=\count198 +\MPscratchDim=\dimen142 +\MPnumerator=\count199 +\makeMPintoPDFobject=\count266 +\everyMPtoPDFconversion=\toks20 +) (/usr/local/texlive/2022/texmf-dist/tex/latex/epstopdf-pkg/epstopdf-base.sty +Package: epstopdf-base 2020-01-24 v2.11 Base part for package epstopdf +Package epstopdf-base Info: Redefining graphics rule for `.eps' on input line 485. + (/usr/local/texlive/2022/texmf-dist/tex/latex/latexconfig/epstopdf-sys.cfg +File: epstopdf-sys.cfg 2010/07/13 v1.3 Configuration of (r)epstopdf for TeX Live +)) +LaTeX Font Info: External font `cmex10' loaded for size +(Font) <14.4> on input line 18. +LaTeX Font Info: External font `cmex10' loaded for size +(Font) <7> on input line 18. + [1 + +{/usr/local/texlive/2022/texmf-var/fonts/map/pdftex/updmap/pdftex.map}] +LaTeX Font Info: External font `cmex10' loaded for size +(Font) <12> on input line 38. +LaTeX Font Info: External font `cmex10' loaded for size +(Font) <8> on input line 38. +LaTeX Font Info: External font `cmex10' loaded for size +(Font) <6> on input line 38. +LaTeX Font Info: External font `cmex10' loaded for size +(Font) <5> on input line 38. 
+ +Underfull \hbox (badness 6461) in paragraph at lines 40--45 +[]\OT1/cmtt/m/n/12 python\OT1/cmr/m/n/12 , \OT1/cmtt/m/n/12 datascience\OT1/cmr/m/n/12 , \OT1/cmtt/m/n/12 javascript\OT1/cmr/m/n/12 , \OT1/cmtt/m/n/12 linux\OT1/cmr/m/n/12 , \OT1/cmtt/m/n/12 opensource\OT1/cmr/m/n/12 , \OT1/cmtt/m/n/12 node\OT1/cmr/m/n/12 , + [] + + +Underfull \hbox (badness 10000) in paragraph at lines 48--49 + + [] + +[2] [3] +<../images//num_posts_per_subreddit.png, id=20, 1174.3875pt x 555.07375pt> +File: ../images//num_posts_per_subreddit.png Graphic file (type png) +<use ../images//num_posts_per_subreddit.png> +Package pdftex.def Info: ../images//num_posts_per_subreddit.png used on input line 76. +(pdftex.def) Requested size: 312.00119pt x 147.4665pt. +<../images//num_subscribers_per_subreddit.png, id=22, 1162.1016pt x 555.2745pt> +File: ../images//num_subscribers_per_subreddit.png Graphic file (type png) +<use ../images//num_subscribers_per_subreddit.png> +Package pdftex.def Info: ../images//num_subscribers_per_subreddit.png used on input line 84. +(pdftex.def) Requested size: 312.00119pt x 149.07884pt. +<../images//num_authors_multiple_subreddit.png, id=23, 1181.1327pt x 497.2176pt> +File: ../images//num_authors_multiple_subreddit.png Graphic file (type png) +<use ../images//num_authors_multiple_subreddit.png> +Package pdftex.def Info: ../images//num_authors_multiple_subreddit.png used on input line 92. +(pdftex.def) Requested size: 312.00119pt x 131.33716pt. + [4 <../images//num_posts_per_subreddit.png> <../images//num_subscribers_per_subreddit.png>] +<../images//post_multiple.png, id=29, 1181.1327pt x 497.2176pt> +File: ../images//post_multiple.png Graphic file (type png) +<use ../images//post_multiple.png> +Package pdftex.def Info: ../images//post_multiple.png used on input line 102. +(pdftex.def) Requested size: 312.00119pt x 131.33716pt. 
+<../images//num_posts_per_day_per_subreddit.png, id=30, 1438.173pt x 1420.1055pt> +File: ../images//num_posts_per_day_per_subreddit.png Graphic file (type png) +<use ../images//num_posts_per_day_per_subreddit.png> +Package pdftex.def Info: ../images//num_posts_per_day_per_subreddit.png used on input line 113. +(pdftex.def) Requested size: 390.0pt x 385.10213pt. + [5 <../images//num_authors_multiple_subreddit.png> <../images//post_multiple.png>] +<../images//num_posts_per_day_per_subreddit_bar.png, id=36, 1436.9685pt x 1420.1055pt> +File: ../images//num_posts_per_day_per_subreddit_bar.png Graphic file (type png) +<use ../images//num_posts_per_day_per_subreddit_bar.png> +Package pdftex.def Info: ../images//num_posts_per_day_per_subreddit_bar.png used on input line 124. +(pdftex.def) Requested size: 390.0pt x 385.42717pt. + [6 <../images//num_posts_per_day_per_subreddit.png>] +<../images//author_rank.png, id=41, 1434.0777pt x 1420.1055pt> +File: ../images//author_rank.png Graphic file (type png) +<use ../images//author_rank.png> +Package pdftex.def Info: ../images//author_rank.png used on input line 135. +(pdftex.def) Requested size: 370.49881pt x 366.87846pt. + [7 <../images//num_posts_per_day_per_subreddit_bar.png>] +<../images//best_time.png, id=47, 1438.173pt x 1420.1055pt> +File: ../images//best_time.png Graphic file (type png) +<use ../images//best_time.png> +Package pdftex.def Info: ../images//best_time.png used on input line 150. +(pdftex.def) Requested size: 390.0pt x 385.10213pt. + [8 <../images//author_rank.png>] +<../images//scatterplot_scores.png, id=53, 1437.6912pt x 1420.1055pt> +File: ../images//scatterplot_scores.png Graphic file (type png) +<use ../images//scatterplot_scores.png> +Package pdftex.def Info: ../images//scatterplot_scores.png used on input line 161. +(pdftex.def) Requested size: 390.0pt x 385.21048pt. 
+ [9 <../images//best_time.png>] +<../images//pie_comments.png, id=58, 1131.9891pt x 1420.1055pt> +File: ../images//pie_comments.png Graphic file (type png) +<use ../images//pie_comments.png> +Package pdftex.def Info: ../images//pie_comments.png used on input line 172. +(pdftex.def) Requested size: 390.0pt x 489.2652pt. + [10 <../images//scatterplot_scores.png>] +Overfull \vbox (19.1485pt too high) has occurred while \output is active [] + + [11 <../images//pie_comments.png>] +<../images//awards_per_subreddit.png, id=67, 1437.6912pt x 1420.1055pt> +File: ../images//awards_per_subreddit.png Graphic file (type png) +<use ../images//awards_per_subreddit.png> +Package pdftex.def Info: ../images//awards_per_subreddit.png used on input line 183. +(pdftex.def) Requested size: 390.0pt x 385.21048pt. + [12 <../images//awards_per_subreddit.png>] +<../images//boxplot_scores.png, id=72, 1181.1327pt x 555.2745pt> +File: ../images//boxplot_scores.png Graphic file (type png) +<use ../images//boxplot_scores.png> +Package pdftex.def Info: ../images//boxplot_scores.png used on input line 194. +(pdftex.def) Requested size: 390.0pt x 183.34282pt. 
+ [13 <../images//boxplot_scores.png>] (./report.aux) ) +Here is how much of TeX's memory you used: + 1627 strings out of 475075 + 29322 string characters out of 5779003 + 371189 words of memory out of 5000000 + 23039 multiletter control sequences out of 15000+600000 + 474933 words of font info for 47 fonts, out of 8000000 for 9000 + 1141 hyphenation exceptions out of 8191 + 55i,8n,62p,471b,228s stack positions out of 10000i,1000n,20000p,200000b,200000s +{/usr/local/texlive/2022/texmf-dist/fonts/enc/dvips/cm-super/cm-super-ts1.enc}</usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmbx12.pfb></usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr10.pfb></usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr12.pfb></usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr17.pfb></usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr7.pfb></usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmr8.pfb></usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmsy10.pfb></usr/local/texlive/2022/texmf-dist/fonts/type1/public/amsfonts/cm/cmtt12.pfb></usr/local/texlive/2022/texmf-dist/fonts/type1/public/cm-super/sfrm1200.pfb> +Output written on report.pdf (13 pages, 11378187 bytes). +PDF statistics: + 118 PDF objects out of 1000 (max. 8388607) + 60 compressed objects within 1 object stream + 0 named destinations out of 1000 (max. 500000) + 61 words of extra memory for PDF output out of 10000 (max. 
10000000) + diff --git a/Report/report.pdf b/Report/report.pdf Binary files differnew file mode 100644 index 0000000..c343db4 --- /dev/null +++ b/Report/report.pdf diff --git a/Report/report.synctex.gz b/Report/report.synctex.gz Binary files differnew file mode 100644 index 0000000..afb7158 --- /dev/null +++ b/Report/report.synctex.gz diff --git a/Report/report.tex b/Report/report.tex new file mode 100644 index 0000000..dc0c3b7 --- /dev/null +++ b/Report/report.tex @@ -0,0 +1,201 @@ +\documentclass[12pt, letterpaper]{article} +\usepackage{graphicx} +\usepackage{float} +\usepackage{sectsty} + +\title{EAS 4/587 – Data Intensive Computing\\Phase 1 Report} +\author{ + Kumar Priyansh \\ + \footnotesize UBIT Name: kumarpri + \and Ritu Dimri\\ + \footnotesize UBIT Name: ritudimr +} +\date{} +\sloppy +\graphicspath{{../images/}} + +\begin{document} +\maketitle + +\section{Motivation \& Problem Statement} + +\subsection{Motivation} +\begin{itemize} + \item Reddit is a social media website where users can post links to articles, images, videos, etc.\ and other users can comment on them. Authors of the posts generally look to drive maximum engagement from their posts. + \item Unlike other social media websites, Reddit has a unique feature of upvoting and downvoting the posts. Also, since the posts are publicly visible, factors like the time of posting, the number of upvotes, the number of comments, etc.\ matter a lot. + \item Since there are a lot of posts being made every minute, significant posts can get lost in the crowd. Also, the posts that are made at a particular time of the day may not be visible to the users who are active at a different time of the day. +\end{itemize} + +\subsection{Problem Statement} +\begin{itemize} + \item Fetch the data using the Reddit Developer API from different programming-related subreddits (communities). Since there are a lot of subreddits on Reddit, we will keep the scope of the project limited.
+ \item Analyze the data and find relevant insights after cleaning and preprocessing the data. + \item Build a model to predict the engagement a post will likely receive, given the time of posting, the number of upvotes, the number of comments, and other factors. +\end{itemize} + +\section{Data Collection} + +The data was collected from the Reddit Developer API\footnote{https://www.reddit.com/dev/api/}. The API provides access to the data of the posts made on Reddit. The data was collected from the following subreddits: + +\texttt{python}, +\texttt{datascience}, \texttt{javascript}, +\texttt{linux}, \texttt{opensource}, \texttt{node}, +\texttt{programming}, \texttt{computerscience}, +\texttt{webdev}, \texttt{statistics}, \texttt{machinelearning}, \texttt{compsci}, \texttt{java}, \texttt{rust}, \texttt{typescript}. + +\section{Data Cleaning \& Preprocessing} + +\textbf{Note:} Since the data is coming from a live API, the data is not static. Hence, the plots and the results may vary from the ones shown in the report. \\ + +After collecting the data, we got more than 15,700 rows and 118 columns. The data was cleaned and preprocessed to remove the unnecessary columns and to make the data more readable. The data was cleaned and preprocessed using the following steps: + +\begin{enumerate} + \item \textbf{Dropping Saturated Columns}: Saturated columns are the columns that have a single value for all the rows. These columns do not provide any useful information and hence, they were dropped. + \item \textbf{Fixing Data Types}: Some columns can have an incorrect data type when converted into a Pandas DataFrame. All data was converted to \texttt{string} type, except numeric (\texttt{int} \& \texttt{float}) and \texttt{boolean} columns. Some boolean columns like \texttt{distinguished} and \texttt{author\_premium} required forced type conversion to \texttt{boolean} type. + \item \textbf{Drop Duplicates}: Sometimes, the same post is copied and pasted in multiple subreddits.
These posts are duplicates and hence, they were dropped, keeping only one copy of the post. + \item \textbf{Check for Missing and Null Values}: The data was checked for missing and null values. After the above steps, there were no missing or null values in the data. + \item \textbf{Handling Flairs}: Flairs are the tags that are assigned to the posts. They are used to categorize the posts. For example, a post can be tagged as \texttt{help}, \texttt{discussion}, \texttt{news}, etc.\ Only the relevant flair columns were kept. The flairs might also contain emojis, which were also removed in a later step. + \item \textbf{Handling Deleted Posts \& Posts by Deleted Users}: Posts that were deleted by the author or the moderators were removed from the data. Also, posts by deleted users were removed. + \item \textbf{Handling Polls}: Polls are posts that are used to collect votes from the users. These posts were removed from the data as they do not provide any useful information for text analysis. + \item \textbf{Dropping Unnecessary Columns}: Some columns were dropped as they were not relevant for the analysis. For example, columns like \texttt{thumbnail\_height} and \texttt{thumbnail\_width} were dropped as they do not provide any useful information. + \item \textbf{Lowercasing Text Columns}: All text columns were converted to lowercase. + \item \textbf{Removing HTML Entities, Escape Characters and URLs}: HTML entities, escape characters and URLs were removed from the text columns. + \item \textbf{Removing Punctuation, Numbers and Emojis}: Punctuation, numbers and emojis were removed from the text columns. + \item \textbf{Removing Stopwords \& Contractions}: Stopwords and contractions were removed from the text columns. + \item \textbf{Lemmatization \& Stemming}: Lemmatization and stemming were performed on the text columns to reduce the words to their root form.
+\end{enumerate} + +\pagebreak +\section{Exploratory Data Analysis} + +After cleaning and preprocessing the data, we were left with more than 8,000 rows and 28 columns. The data was analyzed to find relevant insights. The data was analyzed using the following steps: + +\subsection*{Number of Posts Fetched per Subreddit} +\begin{figure}[H] + \centering + \includegraphics[width=0.8\textwidth]{num_posts_per_subreddit.png} + \caption{Number of Posts per Subreddit} + \label{fig:posts_per_subreddit} +\end{figure} + +\subsection*{Number of Subscribers per Subreddit} +\begin{figure}[H] + \centering + \includegraphics[width=0.8\textwidth]{num_subscribers_per_subreddit.png} + \caption{Number of Subscribers per Subreddit} + \label{fig:subscribers_per_subreddit} +\end{figure} + +\subsection*{Number of Authors who post in multiple subreddits} +\begin{figure}[H] + \centering + \includegraphics[width=0.8\textwidth]{num_authors_multiple_subreddit.png} + \caption{Number of Authors who post in multiple subreddits} + \label{fig:authors_per_subreddit} +\end{figure} + +From the above figure, it seems like most of the authors post in only one subreddit. + +\subsection*{Does posting in multiple subreddits drive more upvotes?} +\begin{figure}[H] + \centering + \includegraphics[width=0.8\textwidth]{post_multiple.png} + \caption{Does posting in multiple subreddits drive more upvotes?} + \label{fig:upvotes_per_subreddit} +\end{figure} + +From the above figure, it seems like authors who post in multiple subreddits get more upvotes, generally. + +\subsection*{History of posts per day per subreddit (Past 6 months)} + +\begin{figure}[H] + \centering + \includegraphics[width=1\textwidth]{num_posts_per_day_per_subreddit.png} + \caption{History of posts per day per subreddit} + \label{fig:history_posts_per_day} +\end{figure} + +From the above figure, it seems like the number of posts per day is increasing for most of the subreddits.
+ +\subsection*{Number of posts per subreddit, categorized by days of the week} + +\begin{figure}[H] + \centering + \includegraphics[width=1\textwidth]{num_posts_per_day_per_subreddit_bar.png} + \caption{Number of posts per day per subreddit} + \label{fig:posts_per_day} +\end{figure} + +The above figure presents the total number of posts per subreddit, categorized by the days of the week. + +\subsection*{Top 10 Authors Per Subreddit} + +\begin{figure}[H] + \centering + \includegraphics[width=0.95\textwidth]{author_rank.png} + \caption{Top 10 Authors Per Subreddit} + \label{fig:top_authors_per_subreddit} +\end{figure} + +The above plot was generated by creating an author ranking system. The authors were then sorted in descending order of their rank. The top 10 authors were then plotted. The ranking system uses the following simple formula to rank the authors: + +\begin{equation} + \textnormal{Rank} = \textnormal{Post Score} \times \textnormal{Upvote Ratio} + \textnormal{Number of Comments} +\end{equation} + +\subsection*{Finding the best time to post on each subreddit} + +\begin{figure}[H] + \centering + \includegraphics[width=1\textwidth]{best_time.png} + \caption{Best Time to Post on each Subreddit} + \label{fig:best_time_to_post} +\end{figure} + +The above plot was generated by finding the total hourly engagement on each subreddit, categorized by each day. It seems like the best time to post on each subreddit is different and there happens to be a peak in the engagement at different times of the day. + +\subsection*{Scatterplot of the scores vs number of comments in each subreddit} + +\begin{figure}[H] + \centering + \includegraphics[width=1\textwidth]{scatterplot_scores.png} + \caption{Scatterplot of the scores vs number of comments in each subreddit} + \label{fig:score_vs_comments} +\end{figure} + +The above plot was generated by plotting the scores vs number of comments in each subreddit.
It seems like there is a positive correlation between the scores and the number of comments, except for some controversial posts, which tend to receive more comments than their scores would suggest. + +\subsection*{\% of Authors opted to receive comment notifications per Subreddit} + +\begin{figure}[H] + \centering + \includegraphics[width=1\textwidth]{pie_comments.png} + \caption{\% of Authors opted to receive comment notifications per Subreddit} + \label{fig:comment_notifications} +\end{figure} + +The above plot was generated by finding the percentage of authors who opted to receive comment notifications in each subreddit. It seems like most of the authors opted to receive comment notifications. + +\subsection*{Total Awards Received vs Upvotes per Subreddit} + +\begin{figure}[H] + \centering + \includegraphics[width=1\textwidth]{awards_per_subreddit.png} + \caption{Total Awards Received vs Upvotes per Subreddit} + \label{fig:awards_vs_upvotes} +\end{figure} + +Good posts are usually awarded with ``awards''. The above plot was generated by plotting the total awards received vs upvotes in each subreddit. It seems like there is a positive correlation between the total awards received and the upvotes. + +\subsection*{Boxplot of the scores in each subreddit} + +\begin{figure}[H] + \centering + \includegraphics[width=1\textwidth]{boxplot_scores.png} + \caption{Boxplot of the scores in each subreddit} + \label{fig:boxplot} +\end{figure} + +The above plot was generated by plotting the boxplot of the scores in each subreddit. It seems like most of the scores are concentrated in the lower range, except for a few outliers – they are the posts that went viral. It means that most of the posts are not very popular. + +\end{document}
\ No newline at end of file diff --git a/images/author_rank.png b/images/author_rank.png Binary files differnew file mode 100644 index 0000000..da01bd1 --- /dev/null +++ b/images/author_rank.png diff --git a/images/awards_per_subreddit.png b/images/awards_per_subreddit.png Binary files differnew file mode 100644 index 0000000..9ba0c5c --- /dev/null +++ b/images/awards_per_subreddit.png diff --git a/images/best_time.png b/images/best_time.png Binary files differnew file mode 100644 index 0000000..646a8a4 --- /dev/null +++ b/images/best_time.png diff --git a/images/boxplot_scores.png b/images/boxplot_scores.png Binary files differnew file mode 100644 index 0000000..5c292f3 --- /dev/null +++ b/images/boxplot_scores.png diff --git a/images/num_authors_multiple_subreddit.png b/images/num_authors_multiple_subreddit.png Binary files differnew file mode 100644 index 0000000..ac5137e --- /dev/null +++ b/images/num_authors_multiple_subreddit.png diff --git a/images/num_posts_per_day_per_subreddit.png b/images/num_posts_per_day_per_subreddit.png Binary files differnew file mode 100644 index 0000000..e68c653 --- /dev/null +++ b/images/num_posts_per_day_per_subreddit.png diff --git a/images/num_posts_per_day_per_subreddit_bar.png b/images/num_posts_per_day_per_subreddit_bar.png Binary files differnew file mode 100644 index 0000000..13100e3 --- /dev/null +++ b/images/num_posts_per_day_per_subreddit_bar.png diff --git a/images/num_posts_per_subreddit.png b/images/num_posts_per_subreddit.png Binary files differnew file mode 100644 index 0000000..7e85a73 --- /dev/null +++ b/images/num_posts_per_subreddit.png diff --git a/images/num_subscribers_per_subreddit.png b/images/num_subscribers_per_subreddit.png Binary files differnew file mode 100644 index 0000000..64d56d0 --- /dev/null +++ b/images/num_subscribers_per_subreddit.png diff --git a/images/pie_comments.png b/images/pie_comments.png Binary files differnew file mode 100644 index 0000000..f7892e2 --- /dev/null +++ 
b/images/pie_comments.png diff --git a/images/post_multiple.png b/images/post_multiple.png Binary files differnew file mode 100644 index 0000000..3422be0 --- /dev/null +++ b/images/post_multiple.png diff --git a/images/scatterplot_scores.png b/images/scatterplot_scores.png Binary files differnew file mode 100644 index 0000000..b0731d2 --- /dev/null +++ b/images/scatterplot_scores.png diff --git a/project.ipynb b/project.ipynb index fdfccab..0fbfbbe 100644 --- a/project.ipynb +++ b/project.ipynb @@ -1614,7 +1614,7 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3.9.10 64-bit", + "display_name": "Python 3.10.7 64-bit", "language": "python", "name": "python3" }, @@ -1628,12 +1628,12 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.9.10" + "version": "3.10.7" }, "orig_nbformat": 4, "vscode": { "interpreter": { - "hash": "aee8b7b246df8f9039afb4144a1f6fd8d2ca17a180786b69acc140d282b71a49" + "hash": "b0fa6594d8f4cbf19f97940f81e996739fb7646882a419484c72d19e05852a7e" } } }, |
