diff --git a/document.aux b/document.aux
index 973abbe..4255b0d 100644
--- a/document.aux
+++ b/document.aux
@@ -75,13 +75,13 @@
\abx@aux@segm{0}{0}{6}
\abx@aux@cite{10}
\abx@aux@segm{0}{0}{10}
-\abx@aux@cite{11}
-\abx@aux@segm{0}{0}{11}
\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Tweepy Python Package}{14}{section*.17}}
\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Sentiment Analysis}{14}{section*.18}}
\newlabel{sentiment}{{}{14}{Sentiment Analysis}{section*.18}{}}
\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Natural Language Processing}{14}{section*.19}}
\newlabel{algorithms}{{}{14}{Natural Language Processing}{section*.19}{}}
+\abx@aux@cite{11}
+\abx@aux@segm{0}{0}{11}
\abx@aux@cite{12}
\abx@aux@segm{0}{0}{12}
\abx@aux@segm{0}{0}{12}
@@ -147,46 +147,56 @@
\abx@aux@cite{31}
\abx@aux@segm{0}{0}{31}
\abx@aux@segm{0}{0}{30}
+\abx@aux@cite{32}
+\abx@aux@segm{0}{0}{32}
\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Machine Learning}{20}{section*.26}}
\newlabel{machine}{{}{20}{Machine Learning}{section*.26}{}}
\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Naive Bayes}{20}{section*.27}}
+\abx@aux@segm{0}{0}{32}
+\abx@aux@cite{33}
+\abx@aux@segm{0}{0}{33}
+\abx@aux@segm{0}{0}{8}
\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{Solution Approach}{22}{section*.28}}
\newlabel{solution}{{}{22}{Solution Approach}{section*.28}{}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Solution Summary}{22}{section*.29}}
-\newlabel{sumary}{{}{22}{Solution Summary}{section*.29}{}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Requirements}{22}{section*.30}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Data flow Overview}{22}{section*.31}}
-\newlabel{data-flow}{{}{22}{Data flow Overview}{section*.31}{}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Packages, Tools and Techniques}{22}{section*.32}}
-\newlabel{tools}{{}{22}{Packages, Tools and Techniques}{section*.32}{}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{System Design and Implementation}{23}{section*.33}}
-\newlabel{implementation}{{}{23}{System Design and Implementation}{section*.33}{}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Data collection}{23}{section*.34}}
-\newlabel{collection}{{}{23}{Data collection}{section*.34}{}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Price Time-series Data}{23}{section*.35}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Data processing}{23}{section*.36}}
-\newlabel{processing}{{}{23}{Data processing}{section*.36}{}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Preprocessing}{23}{section*.37}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Tweet Filtering}{23}{section*.38}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Text Cleaning}{23}{section*.39}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Ngram based Language detection filtering}{23}{section*.40}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Spam Filtering}{23}{section*.41}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Tweet Processing}{23}{section*.42}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Naive Bayes model}{23}{section*.43}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Sentiment Analysis}{23}{section*.44}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{VADER}{23}{section*.45}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Recurrent Neural Network - LSTM}{23}{section*.46}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Training and Testing Model}{23}{section*.47}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Scoring and Validation}{23}{section*.48}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Future Prediction Forecasting}{23}{section*.49}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{Testing: Verification and Reflection}{24}{section*.50}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{Discussion: Contribution and Reflection}{25}{section*.51}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Limitations}{25}{section*.52}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{Conclusion and Future Improvements}{26}{section*.53}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Conclusion}{26}{section*.54}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Future Improvements}{26}{section*.55}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{Appendices}{29}{section*.57}}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Appendix A - Project Initiation Document}{29}{section*.58}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Data gathering}{22}{section*.29}}
+\abx@aux@segm{0}{0}{23}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Spam Filtering}{23}{section*.30}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Language Detection}{23}{section*.31}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Solution Summary}{23}{section*.32}}
+\newlabel{sumary}{{}{23}{Solution Summary}{section*.32}{}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Requirements}{23}{section*.33}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Data flow Overview}{23}{section*.34}}
+\newlabel{data-flow}{{}{23}{Data flow Overview}{section*.34}{}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Packages, Tools and Techniques}{23}{section*.35}}
+\newlabel{tools}{{}{23}{Packages, Tools and Techniques}{section*.35}{}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{System Design and Implementation}{24}{section*.36}}
+\newlabel{implementation}{{}{24}{System Design and Implementation}{section*.36}{}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Data collection}{24}{section*.37}}
+\newlabel{collection}{{}{24}{Data collection}{section*.37}{}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Price Time-series Data}{24}{section*.38}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Data processing}{24}{section*.39}}
+\newlabel{processing}{{}{24}{Data processing}{section*.39}{}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Preprocessing}{24}{section*.40}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Tweet Filtering}{24}{section*.41}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Text Cleaning}{24}{section*.42}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Ngram based Language detection filtering}{24}{section*.43}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Spam Filtering}{24}{section*.44}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Tweet Processing}{24}{section*.45}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {paragraph}{Naive Bayes model}{24}{section*.46}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Sentiment Analysis}{24}{section*.47}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{VADER}{24}{section*.48}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Recurrent Neural Network - LSTM}{24}{section*.49}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Training and Testing Model}{24}{section*.50}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Scoring and Validation}{24}{section*.51}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsubsection}{Future Prediction Forecasting}{24}{section*.52}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{Testing: Verification and Reflection}{25}{section*.53}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{Discussion: Contribution and Reflection}{26}{section*.54}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Limitations}{26}{section*.55}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{Conclusion and Future Improvements}{27}{section*.56}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Conclusion}{27}{section*.57}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Future Improvements}{27}{section*.58}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {section}{Appendices}{31}{section*.60}}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Appendix A - Project Initiation Document}{31}{section*.61}}
\abx@aux@refcontextdefaultsdone
\abx@aux@defaultrefcontext{0}{1}{none/global//global/global}
\abx@aux@defaultrefcontext{0}{2}{none/global//global/global}
@@ -220,4 +230,5 @@
\abx@aux@defaultrefcontext{0}{30}{none/global//global/global}
\abx@aux@defaultrefcontext{0}{31}{none/global//global/global}
\abx@aux@defaultrefcontext{0}{32}{none/global//global/global}
-\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Appendix B - Log book}{42}{section*.59}}
+\abx@aux@defaultrefcontext{0}{33}{none/global//global/global}
+\@writefile{toc}{\defcounter {refsection}{0}\relax }\@writefile{toc}{\contentsline {subsection}{Appendix B - Log book}{44}{section*.62}}
diff --git a/document.bbl b/document.bbl
index 04f6158..219c395 100644
--- a/document.bbl
+++ b/document.bbl
@@ -1081,8 +1081,8 @@
\strng{authorbibnamehash}{baa9695b2bf77f7b33bb07b5d116d7e1}
\strng{authornamehash}{baa9695b2bf77f7b33bb07b5d116d7e1}
\strng{authorfullhash}{baa9695b2bf77f7b33bb07b5d116d7e1}
- \field{sortinit}{8}
- \field{sortinithash}{07edf88d4ea82509b9c4b4d13f41c452}
+ \field{sortinit}{5}
+ \field{sortinithash}{3c19c3776b658b3558e9e2e4840c01e2}
\field{labelnamesource}{author}
\field{labeltitlesource}{title}
\field{booktitle}{IJCAI 2001 workshop on empirical methods in artificial intelligence}
@@ -1099,6 +1099,33 @@
\verb https://www.cc.gatech.edu/~isbell/reading/papers/Rish.pdf
\endverb
\endentry
+ \entry{33}{inproceedings}{}
+ \name{author}{1}{}{%
+ {{hash=1e48a059b3f2c3703bea8d54a9e002c9}{%
+ family={Roesslein},
+ familyi={R\bibinitperiod},
+ given={Joshua},
+ giveni={J\bibinitperiod}}}%
+ }
+ \strng{namehash}{1e48a059b3f2c3703bea8d54a9e002c9}
+ \strng{fullhash}{1e48a059b3f2c3703bea8d54a9e002c9}
+ \strng{bibnamehash}{1e48a059b3f2c3703bea8d54a9e002c9}
+ \strng{authorbibnamehash}{1e48a059b3f2c3703bea8d54a9e002c9}
+ \strng{authornamehash}{1e48a059b3f2c3703bea8d54a9e002c9}
+ \strng{authorfullhash}{1e48a059b3f2c3703bea8d54a9e002c9}
+ \field{sortinit}{5}
+ \field{sortinithash}{3c19c3776b658b3558e9e2e4840c01e2}
+ \field{labelnamesource}{author}
+ \field{labeltitlesource}{title}
+ \field{title}{Tweepy Documentation}
+ \field{year}{2009}
+ \verb{urlraw}
+ \verb http://docs.tweepy.org/en/v3.5.0/
+ \endverb
+ \verb{url}
+ \verb http://docs.tweepy.org/en/v3.5.0/
+ \endverb
+ \endentry
\enddatalist
\endrefsection
\endinput
diff --git a/document.bcf b/document.bcf
index 7611244..5325cd5 100644
--- a/document.bcf
+++ b/document.bcf
@@ -1977,6 +1977,11 @@
30
31
30
+ 32
+ 32
+ 33
+ 8
+ 23
*
diff --git a/document.blg b/document.blg
index fc06e6e..9403f39 100644
--- a/document.blg
+++ b/document.blg
@@ -1,20 +1,20 @@
[0] Config.pm:302> INFO - This is Biber 2.9
[0] Config.pm:305> INFO - Logfile is 'document.blg'
-[18] biber:313> INFO - === Tue Apr 23, 2019, 18:58:50
-[34] Biber.pm:371> INFO - Reading 'document.bcf'
-[79] Biber.pm:854> INFO - Using all citekeys in bib section 0
-[88] Biber.pm:3981> INFO - Processing section 0
-[96] Biber.pm:4154> INFO - Looking for bibtex format file 'report.bib' for section 0
-[97] bibtex.pm:1468> INFO - LaTeX decoding ...
-[124] bibtex.pm:1294> INFO - Found BibTeX data source 'report.bib'
-[167] Utils.pm:169> WARN - year field 'Mar 13, 2016' in entry '23' is not an integer - this will probably not sort properly.
-[199] Utils.pm:169> WARN - Name "Mairal, J., Ponce, J., Sapiro, G., Zisserman, A." has too many commas: skipping name
-[228] Utils.pm:169> WARN - BibTeX subsystem: warning: comma(s) at end of name (removing)
-[228] Utils.pm:169> WARN - BibTeX subsystem: author, warning: comma(s) at end of name (removing)
-[245] UCollate.pm:68> INFO - Overriding locale 'en-US' defaults 'variable = shifted' with 'variable = non-ignorable'
-[245] UCollate.pm:68> INFO - Overriding locale 'en-US' defaults 'normalization = NFD' with 'normalization = prenormalized'
-[245] Biber.pm:3809> INFO - Sorting list 'none/global//global/global' of type 'entry' with template 'none' and locale 'en-US'
-[245] Biber.pm:3815> INFO - No sort tailoring available for locale 'en-US'
-[262] bbl.pm:617> INFO - Writing 'document.bbl' with encoding 'ascii'
-[273] bbl.pm:720> INFO - Output to document.bbl
-[273] Biber.pm:110> INFO - WARNINGS: 4
+[20] biber:313> INFO - === Tue Apr 23, 2019, 21:27:28
+[37] Biber.pm:371> INFO - Reading 'document.bcf'
+[87] Biber.pm:854> INFO - Using all citekeys in bib section 0
+[97] Biber.pm:3981> INFO - Processing section 0
+[106] Biber.pm:4154> INFO - Looking for bibtex format file 'report.bib' for section 0
+[108] bibtex.pm:1468> INFO - LaTeX decoding ...
+[139] bibtex.pm:1294> INFO - Found BibTeX data source 'report.bib'
+[203] Utils.pm:169> WARN - year field 'Mar 13, 2016' in entry '23' is not an integer - this will probably not sort properly.
+[245] Utils.pm:169> WARN - Name "Mairal, J., Ponce, J., Sapiro, G., Zisserman, A." has too many commas: skipping name
+[260] Utils.pm:169> WARN - BibTeX subsystem: warning: comma(s) at end of name (removing)
+[260] Utils.pm:169> WARN - BibTeX subsystem: author, warning: comma(s) at end of name (removing)
+[279] UCollate.pm:68> INFO - Overriding locale 'en-US' defaults 'variable = shifted' with 'variable = non-ignorable'
+[280] UCollate.pm:68> INFO - Overriding locale 'en-US' defaults 'normalization = NFD' with 'normalization = prenormalized'
+[280] Biber.pm:3809> INFO - Sorting list 'none/global//global/global' of type 'entry' with template 'none' and locale 'en-US'
+[280] Biber.pm:3815> INFO - No sort tailoring available for locale 'en-US'
+[300] bbl.pm:617> INFO - Writing 'document.bbl' with encoding 'ascii'
+[312] bbl.pm:720> INFO - Output to document.bbl
+[312] Biber.pm:110> INFO - WARNINGS: 4
diff --git a/document.log b/document.log
index b27cb0c..73c02d5 100644
--- a/document.log
+++ b/document.log
@@ -1,4 +1,4 @@
-This is pdfTeX, Version 3.14159265-2.6-1.40.18 (TeX Live 2017/Debian) (preloaded format=pdflatex 2018.10.16) 23 APR 2019 20:26
+This is pdfTeX, Version 3.14159265-2.6-1.40.18 (TeX Live 2017/Debian) (preloaded format=pdflatex 2018.10.16) 23 APR 2019 21:45
entering extended mode
restricted \write18 enabled.
%&-line parsing enabled.
@@ -945,7 +945,7 @@ LaTeX Info: Redefining \nameref on input line 63.
\@outlinefile=\write5
\openout5 = `document.out'.
-
+
File: images/reading_logo.png Graphic file (type png)