forked from dataBikeHsUlm/report
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathDSPRReport.tex
157 lines (147 loc) · 8.06 KB
/
DSPRReport.tex
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
\documentclass[12pt]{report}
\usepackage{graphicx}
\usepackage{caption}
\usepackage[english]{babel}
\usepackage{caption}
\usepackage{capt-of}
\usepackage{color, colortbl}
\usepackage[hidelinks]{hyperref}
\usepackage[numbers]{natbib}
\usepackage[nohyperlinks, printonlyused, withpage, smaller]{acronym}
\usepackage[ngerman]{datetime}
\usepackage{chngcntr}
\usepackage{pdfpages}
\usepackage{enumitem}
\usepackage{amsmath}
\usepackage{tikz}
\usepackage[skins]{tcolorbox}
\usepackage{rotating}
\usepackage{framed}
\counterwithin{figure}{section}
\usepackage{lipsum}
\usepackage{float}
\usepackage{listings}
\usepackage{xcolor}
\usepackage{listing}
\usepackage{hyperref}
\usepackage{lscape}
\usepackage{longtable}
\usepackage{upquote}
% \frontmatter -- numbering scheme for the pages before the main text:
% lower-case roman page numbers starting at 1, and section numbers printed
% as upper-case roman numerals.
% Deliberately kept as \def, exactly like the original definition.
\def\frontmatter{%
  \renewcommand{\thesection}{\Roman{section}}
  \pagenumbering{roman}
  \setcounter{page}{1}
}%
% \mainmatter -- numbering scheme for the main text: arabic page numbers
% restarting at 1, section counter reset to 0, section numbers printed as
% plain arabic numerals.
%
% The page in progress is finished with \clearpage *before* the numbering is
% switched.  \pagenumbering affects whichever page is shipped out next, so
% without this the still-open page before the call (e.g. the last page of the
% table of contents) would be printed with arabic number 1 and the main text
% would start on page 2.  The book class's \mainmatter clears the page for
% the same reason.  A \newpage issued right after \mainmatter is then a
% no-op, because the new page is still empty.
\def\mainmatter{%
  \clearpage
  \pagenumbering{arabic}
  \setcounter{page}{1}
  \setcounter{section}{0}
  \renewcommand{\thesection}{\arabic{section}}
}%
% \backmatter -- appendix-style numbering: sections are printed as capital
% letters (\Alph) and the section counter restarts from 0.  Page numbering
% is left untouched.
% Deliberately kept as \def, exactly like the original definition.
\def\backmatter{%
  \renewcommand{\thesection}{\Alph{section}}
  \setcounter{section}{0}
}%
% Heading printed by \listoffigures.
%
% The earlier definition expanded to \tocchapter, \tocfile and
% \listoffigurename.  None of these is defined by the packages loaded above
% (\tocchapter and \tocfile appear to be tocbibind commands, and tocbibind is
% not loaded), so expanding it would have stopped with "Undefined control
% sequence".  A plain \renewcommand in the preamble is also overwritten when
% babel activates the document language at \begin{document}.  Hooking the
% title into \captionsenglish makes it take effect and survive language
% switches.
\addto\captionsenglish{%
  \renewcommand{\listfigurename}{B Illustration Directory}%
}
\begin{document}
% Apply the front-matter numbering scheme defined by \frontmatter in the
% preamble.
\frontmatter
% ---------------------------------------------------------------------------
% Title page: logo, document type, subject line, report title, contributors,
% the three experts and the date.
% ---------------------------------------------------------------------------
\begin{titlepage}
% Full-width rule, 1.5mm thick.  Defined inside the titlepage environment, so
% it is local to it.  NOTE(review): not used anywhere on this title page.
\newcommand{\HRule}{\rule{\linewidth}{1.5mm}}
% \center is the opening command of the center environment, used here without
% a matching end; presumably meant to centre everything that follows until
% the titlepage group closes.
\center{}
% Logo at half the text width.
% NOTE(review): this is a float without \caption, so its position is chosen by
% LaTeX and \label{pic:Logo} has no figure number to refer to -- confirm this
% is intended.
\begin{figure}
\centering
\includegraphics[width=0.5\textwidth]{img/hslogo}\label{pic:Logo}
\end{figure}
% The empty center environments below contain nothing; presumably they are
% used only for the vertical space they add.
\begin{center}
\end{center}
{\huge Masterproject}\\[0.4cm]
\begin{center}
\end{center}
{\Large Data Science }\\
{Analytics and Prediction for Rental Bike Usage in London}
\vfill
% Contributors.
\begin{center}
{Contributors:}\ \\
\vspace{0.25\baselineskip}
{\Large Anass Khaldi, Guillaume Goni, Kathi Rodi, Pascal Riedel}
\end{center}
\vfill
% Experts, one center environment each.
\begin{center}
{\large Expert: Prof.\ Dr.\ von Schwerin }\\
\end{center}
\begin{center}
{\large Expert: Prof.\ Dr.\ Herbort}
\end{center}
\begin{center}
{\large Expert: Prof.\ Dr.\ Goldstein}
\end{center}
\vfill
% Date of compilation.
{\Large \today}
\end{titlepage}
% ---------------------------------------------------------------------------
% Table of contents, followed by the switch to the main-text numbering scheme
% defined by \mainmatter in the preamble.
% ---------------------------------------------------------------------------
\newpage
\tableofcontents
\mainmatter{}
\newpage
% ---------------------------------------------------------------------------
% Chapter 1.  The content of every chapter is pulled in from separate files
% with \input; the order of the \input lines is the order in the report.
% ---------------------------------------------------------------------------
\chapter{Project Presentation and Organization}
% TODO: reorganize, rewrite
\input{./01_introduction.tex}
\input{./02_task_description.tex}
\input{./03_task_description_2.tex}
\input{./04_collaboration_technologies.tex}
\input{./05_responsabilities.tex}
% ---------------------------------------------------------------------------
% Chapter 2.  Note that file 13 (Graphhopper) is included before file 12
% (database), i.e. not in filename order.
% ---------------------------------------------------------------------------
\chapter{Postal Code Database (Nominatim and Graphhopper)}
\input{./11_nominatim.tex}
\input{./13_graphhopper.tex}
\input{./12_database.tex}
\input{./14_2_digits_db.tex}
\input{./15_django.tex}
% ---------------------------------------------------------------------------
% Chapter 3.
% ---------------------------------------------------------------------------
\chapter{Bike Rental in London}
\input{./21_evaluation_of_hadoop_distros.tex}
\input{./22_data_profiling.tex}
\input{./23_data_prediction.tex}
\input{./24_hourly.tex}
\input{./25_additional.tex}
% ---------------------------------------------------------------------------
% Chapter 4.
% ---------------------------------------------------------------------------
\chapter{Postal Code Database (Junior)}
% TODO: other things ?
\input{./31_junior_task_description.tex}
\input{./32_junior_conclusion.tex}
% ---------------------------------------------------------------------------
% Bibliography, built from ./bibtex/library with the "plain" BibTeX style.
% ---------------------------------------------------------------------------
\newpage
\bibliographystyle{plain}
\bibliography{./bibtex/library}
% List of figures.  Its heading is set here, immediately before it is
% printed; the letter "B" is part of the hand-written title.
\renewcommand{\listfigurename}{B Illustration Directory}
\listoffigures
% ---------------------------------------------------------------------------
% Appendix C: list of abbreviations.
% The heading is unnumbered, so the letter "C" is written by hand and the
% table-of-contents entry is added manually.
% ---------------------------------------------------------------------------
\section*{C List of Abbreviations}
\addcontentsline{toc}{section}{C List of Abbreviations}
% One entry per abbreviation: \acro{<key>}[<short form>]{<long form>}.
% The acronym package is loaded with "printonlyused" in the preamble, so an
% entry should only show up in the printed list if it is used in the text.
% Each key must be defined exactly once: the second \acro{osm} that used to
% follow the HDFS entry was a duplicate of the one below and has been removed.
\begin{acronym}
  \acro{yarn}[YARN]{Yet Another Resource Negotiator}
  \acro{sql}[SQL]{Structured Query Language}
  \acro{nsql}[NoSQL]{Not only SQL}
  \acro{pl}[PL/pgSQL]{Procedural Language/PostgreSQL}
  \acro{osm}[OSM]{OpenStreetMap}
  \acro{hdp}[HDP]{Hortonworks Data Platform}
  \acro{hdfs}[HDFS]{Hadoop Distributed File System}
  \acro{dfsio}[DFSIO]{Data File System I/O}
  \acro{mlp}[MLPRegressor]{Multi-layer Perceptron Regressor}
  \acro{rmse}[RMSE]{Root Mean Square Error}
\end{acronym}
% ---------------------------------------------------------------------------
% Appendix D: attachments.
% The heading is unnumbered, so the letter "D" is written by hand and the
% table-of-contents entry is added manually.
% ---------------------------------------------------------------------------
\newpage
\section*{D Attachments}
\addcontentsline{toc}{section}{D Attachments}
\subsection*{Attachment 1:\\ Responsibilities}\label{resp}
% Responsibilities matrix on a landscape page: one row per team member, one
% column per sprint.  Every cell is a nested single-column tabular so that
% each task sits on its own line.
% Typos in the printed text were corrected: "installGraphhopper" ->
% "install Graphhopper", "reserach" -> "research", "weightened" -> "weighted".
\begin{landscape}
\begin{table}[]
\begin{tabular}{l|l|l|l|}
\cline{2-4}
& Sprint 1 & Sprint 2 & Sprint 3 \\ \hline
\multicolumn{1}{|l|}{Anass} & \begin{tabular}[c]{@{}l@{}}hadoop docu\\ creation of users in hadoop\\ install nominatim/ components\\ import planet database\\ compute postcodes\\ reverse geocoding in bulk\end{tabular} & \begin{tabular}[c]{@{}l@{}}design big picture\\ research maps for WebApp\\ research Django\end{tabular} & \begin{tabular}[c]{@{}l@{}}Fixing dead hadoop node\\ install Graphhopper\\ docu Graphhopper\\ import OSM data to Graphhopper\\ write report part of edited tasks\end{tabular} \\ \hline
\multicolumn{1}{|l|}{Guillaume} & \begin{tabular}[c]{@{}l@{}}create user for nominatim\\ uploading SSH keys\\ querying centroids\\ distances by route\\ distances in bulk\end{tabular} & \begin{tabular}[c]{@{}l@{}}create GitHub repos\\ unioned all notebooks\\ connect geopy with nominatim\\ research Django\\ Django tutorial\\ script for initializing database\\ initialize db with postcodes\end{tabular} & \begin{tabular}[c]{@{}l@{}}research postcodes in PostgresDB\\ script for filling zipcodes in db\\ write report part of edited tasks\end{tabular} \\ \hline
\multicolumn{1}{|l|}{Kathi} & \begin{tabular}[c]{@{}l@{}}creating team Box\\ creating templates\\ documentation OSM API\\ geocoding/reverse Geocoding\\ distances as the crow flies\\ design ER model\\ create presentation for sprint review\\ Scrum Master tasks\end{tabular} & \begin{tabular}[c]{@{}l@{}}design \& finalize Big Picture\\ Graphhopper docu \& example\\ install x2go server\\ docu access vms via x2go client\\ define mockup structure\\ create mockup\\ install mysql database\\ create presentation for sprint review\\ Scrum Master tasks\end{tabular} & \begin{tabular}[c]{@{}l@{}}latex template for project report\\ write report part of edited tasks\\ union texts of team members to report\\ reorganize GitHub repositories\\ create presentation for sprint review\\ Scrum Master tasks\end{tabular} \\ \hline
\multicolumn{1}{|l|}{Pascal} & \begin{tabular}[c]{@{}l@{}}research hadoop distributions\\ find weighted comparison data\\ hadoop documentation\\ Installation of HDP\\ Implement Map Reduce Job\end{tabular} & \begin{tabular}[c]{@{}l@{}}Solving Hadoop issues\\ collect TFL data \& \\ data munging on Hadoop\\ create mockup\\ installed Django server\end{tabular} & \begin{tabular}[c]{@{}l@{}}create spark file sizing notebook\\ CycleRoutes prepared \& collected \\ plotting statistics of cycle usage\\ solving hadoop errors\\ plotting routes of cycle data\\ write report part of edited tasks\end{tabular} \\ \hline
\end{tabular}
\end{table}
\end{landscape}
\end{document}