-
Notifications
You must be signed in to change notification settings - Fork 72
/
DataScienceEssentials.tex
78 lines (61 loc) · 3.48 KB
/
DataScienceEssentials.tex
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
% Master file for the "Data Science Essentials" lab manual: selects the
% document class, loads the shared definitions, and typesets the front matter.
%
% Request PDF version 1.4 output (pdfTeX primitive). It is set first so that it
% takes effect before anything is written to the PDF file.
\pdfminorversion=4
% HJnewsiambook is not a standard LaTeX class, so the meaning of the options
% (opener-c, labs, grey, nociteref) is defined by that class file.
% NOTE(review): presumably shipped alongside this file -- confirm.
\documentclass[opener-c,labs,grey,nociteref]{HJnewsiambook}
% See command.tex for all package imports, environments, and special commands.
\input{command}
% Enable recording of index entries during the run (standard LaTeX writes them
% to \jobname.idx).
\makeindex
% Title and author data consumed by \maketitle below.
\title{Data Science Essentials}
\author{Jeffrey Humpherys \& Tyler J.~Jarvis, managing editors}
\begin{document} % ============================================================
% \thispagestyle{empty} is issued both before and after \maketitle.
% NOTE(review): presumably because \maketitle may reset the page style and/or
% end the page -- confirm against the class before removing either one.
\thispagestyle{empty} % Book cover and Front matter ---------------------------
\maketitle
\thispagestyle{empty}
% Switch to front-matter conventions (in the standard book class: roman page
% numbers and unnumbered chapters; this class may differ).
\frontmatter
% \include reads contributors.tex and forces a page break before and after it.
\include{contributors}
\begin{thepreface} % Preface --------------------------------------------------
This lab manual is designed to accompany the textbook \emph{Foundations of Applied Mathematics} by Humpherys and Jarvis.
While the Volume 3 text focuses on statistics and rigorous data analysis, these labs aim to introduce experienced Python programmers to common tools for obtaining, cleaning, organizing, and presenting data.
The reader should be familiar with Python~\cite{vanrossum2010python} and its NumPy~\cite{oliphant2006guide,ascher2001numerical,oliphant2007python} and Matplotlib~\cite{Hunter:2007} packages before attempting these labs.
See the Python Essentials manual for introductions to these topics.
\vfill
\copyright{This work is licensed under the Creative Commons Attribution 3.0 United States License.
You may copy, distribute, and display this copyrighted work only if you give credit to Dr.~J.~Humpherys.
All derivative works must include an attribution to Dr.~J.~Humpherys as the owner of this work as well as the web address to
\\\centerline{\url{https://github.com/Foundations-of-Applied-Mathematics/Labs}}\\as the original source of this work.
\\To view a copy of the Creative Commons Attribution 3.0 License, visit
\\\centerline{\url{http://creativecommons.org/licenses/by/3.0/us/}} or send a letter to Creative Commons, 171 Second Street, Suite 300, San Francisco, California, 94105, USA.}
\vfill
\centering\includegraphics[height=1.2cm]{by.pdf}
\vfill
\end{thepreface}
% Limit the table of contents to sectioning levels <= 1 (in book-like classes:
% parts, chapters, and sections; subsections and below are omitted).
\setcounter{tocdepth}{1}
\tableofcontents
\mainmatter % LABS ============================================================
\part{Labs}
% One \subimport per lab; the order of these lines is the order in which the
% labs appear in the manual.
% \subimport{<dir>}{<file>} (import package) reads <dir><file>.tex and makes
% files referenced inside it resolve relative to <dir>.
% NOTE(review): the import package is presumably loaded by command.tex -- confirm.
% Entries that are commented out are labs currently left out of the build.
\subimport{./DataScienceEssentials/UnixShell1/}{UnixShell1}
\subimport{./DataScienceEssentials/UnixShell2/}{UnixShell2}
\subimport{./DataScienceEssentials/SQL1/}{SQL1}
\subimport{./DataScienceEssentials/SQL2/}{SQL2}
\subimport{./DataScienceEssentials/RegularExpressions/}{RegularExpressions}
% \subimport{./DataScienceEssentials/WebTechnologies/}{WebTechnologies}
\subimport{./DataScienceEssentials/WebScraping/}{WebScraping}
% \subimport{./DataScienceEssentials/WebCrawling/}{WebCrawling}
\subimport{./DataScienceEssentials/Pandas1/}{Pandas1}
\subimport{./DataScienceEssentials/Pandas2/}{Pandas2}
\subimport{./DataScienceEssentials/Pandas3/}{Pandas3}
\subimport{./DataScienceEssentials/Pandas4/}{Pandas4}
\subimport{./DataScienceEssentials/DataCleaning/}{DataCleaning}
% \subimport{./DataScienceEssentials/MongoDB/}{MongoDB}
% NOTE(review): from here on the file names (parallel1, mpi, spark) are
% lowercase and do not mirror their directory names as the entries above do.
% Confirm they match the files on disk; case matters on case-sensitive
% filesystems.
\subimport{./DataScienceEssentials/Parallel_Intro/}{parallel1}
\subimport{./DataScienceEssentials/MPI/}{mpi}
% \subimport{./DataScienceEssentials/Ethics/}{ethics}
\subimport{./DataScienceEssentials/Spark/}{spark}
\part{Appendices} % Relevant Appendices ---------------------------------------
% The appendices environment is not defined in this file.
% NOTE(review): presumably provided by the class, command.tex, or the appendix
% package -- confirm.
\begin{appendices}
% Appendix chapters, imported the same way as the labs; the order of these
% lines is the order of the appendices.
\subimport{./Appendices/NumpyVisualGuide/}{NumpyVisualGuide}
\subimport{./Appendices/MatplotlibCustomization/}{MatplotlibCustomization}
% \subimport{./Appendices/SklearnGuide/}{SklearnGuide}
\end{appendices}
% Bibliography
% BibTeX bibliography using the "alpha" style; entries are read from
% references.bib.
\bibliographystyle{alpha}
\bibliography{references}
\end{document}