% Preamble for a two-column cheat sheet: document class, packages,
% PDF metadata and page geometry.
% Each statement sits on its own line: a `%` comment runs to the end of the
% physical line, so code must never follow a comment on the same line.
\documentclass[10pt,a4paper]{article}

% Packages
\usepackage{fancyhdr} % For header and footer
\usepackage{multicol} % Allows multicols in tables
\usepackage{tabularx} % Intelligent column widths
\usepackage{tabulary} % Used in header and footer
\usepackage{hhline} % Border under tables
\usepackage{graphicx} % For images
\usepackage{xcolor} % For hex colours
%\usepackage[utf8x]{inputenc} % For unicode character support
\usepackage[T1]{fontenc} % Without this we get weird character replacements
\usepackage{colortbl} % For coloured tables
\usepackage{setspace} % For line height
\usepackage{lastpage} % Needed for total page number
\usepackage{seqsplit} % Splits long words.
%\usepackage{opensans} % Can't make this work so far. Shame. Would be lovely.
\usepackage[normalem]{ulem} % For underlining links
% Most of the following are not required for the majority
% of cheat sheets but are needed for some symbol support.
\usepackage{amsmath} % Symbols
\usepackage{MnSymbol} % Symbols
\usepackage{wasysym} % Symbols
%\usepackage[english,german,french,spanish,italian]{babel} % Languages

% Document Info
\author{nova-cane98}
\pdfinfo{
  /Title (data-analytics-exam-1.pdf)
  /Creator (Cheatography)
  /Author (nova-cane98)
  /Subject (Data Analytics Exam 1 Cheat Sheet)
}

% Lengths and widths
\addtolength{\textwidth}{6cm}
\addtolength{\textheight}{-1cm}
\addtolength{\hoffset}{-3cm}
\addtolength{\voffset}{-2cm}
\setlength{\tabcolsep}{0.2cm} % Space between columns
\setlength{\headsep}{-12pt} % Reduce space between header and content
\setlength{\headheight}{85pt} % If less, LaTeX automatically increases it
\renewcommand{\footrulewidth}{0pt} % Remove footer line
\renewcommand{\headrulewidth}{0pt} % Remove header line
\renewcommand{\seqinsert}{\ifmmode\allowbreak\else\-\fi} % Hyphens in seqsplit
% These two commands together give roughly
% the right line height in the tables
\renewcommand{\arraystretch}{1.3}
\onehalfspacing

% Commands
% Table helper macros, colour palette, page header/footer, start of the
% document body and the first part of the "IMPACT Model" table.
% One statement or comment per line, so no `%` comment can swallow code.
\newcommand{\SetRowColor}[1]{\noalign{\gdef\RowColorName{#1}}\rowcolor{\RowColorName}} % Shortcut for row colour
\newcommand{\mymulticolumn}[3]{\multicolumn{#1}{>{\columncolor{\RowColorName}}#2}{#3}} % For coloured multi-cols
\newcolumntype{x}[1]{>{\raggedright}p{#1}} % New column types for ragged-right paragraph columns
\newcommand{\tn}{\tabularnewline} % Required as custom column type in use

% Font and Colours
\definecolor{HeadBackground}{HTML}{333333}
\definecolor{FootBackground}{HTML}{666666}
\definecolor{TextColor}{HTML}{333333}
\definecolor{DarkBackground}{HTML}{FC8721}
\definecolor{LightBackground}{HTML}{FEF7F1}
\renewcommand{\familydefault}{\sfdefault}
\color{TextColor}

% Header and Footer
\pagestyle{fancy}
\fancyhead{} % Set header to blank
\fancyfoot{} % Set footer to blank
\fancyhead[L]{
\noindent
\begin{multicols}{3}
\begin{tabulary}{5.8cm}{C}
    \SetRowColor{DarkBackground}
    \vspace{-7pt}
    % NOTE(review): the logo is loaded from an absolute filesystem path;
    % presumably it only exists on the generating server -- confirm before building elsewhere.
    {\parbox{\dimexpr\textwidth-2\fboxsep\relax}{\noindent
        \hspace*{-6pt}\includegraphics[width=5.8cm]{/web/www.cheatography.com/public/images/cheatography_logo.pdf}}
    }
\end{tabulary}
\columnbreak
\begin{tabulary}{11cm}{L}
    \vspace{-2pt}\large{\bf{\textcolor{DarkBackground}{\textrm{Data Analytics Exam 1 Cheat Sheet}}}} \\
    \normalsize{by \textcolor{DarkBackground}{nova-cane98} via \textcolor{DarkBackground}{\uline{cheatography.com/217313/cs/47738/}}}
\end{tabulary}
\end{multicols}}

\fancyfoot[L]{ \footnotesize
\noindent
\begin{multicols}{3}
\begin{tabulary}{5.8cm}{LL}
  \SetRowColor{FootBackground}
  \mymulticolumn{2}{p{5.377cm}}{\bf\textcolor{white}{Cheatographer}} \\
  \vspace{-2pt}nova-cane98 \\
  \uline{cheatography.com/nova-cane98} \\
\end{tabulary}
\vfill
\columnbreak
\begin{tabulary}{5.8cm}{L}
  \SetRowColor{FootBackground}
  \mymulticolumn{1}{p{5.377cm}}{\bf\textcolor{white}{Cheat Sheet}} \\
  \vspace{-2pt}Not Yet Published.\\
  Updated 28th February, 2026.\\
  Page {\thepage} of \pageref{LastPage}.
\end{tabulary}
\vfill
\columnbreak
\begin{tabulary}{5.8cm}{L}
  \SetRowColor{FootBackground}
  \mymulticolumn{1}{p{5.377cm}}{\bf\textcolor{white}{Sponsor}} \\
  \SetRowColor{white}
  \vspace{-5pt}
  %\includegraphics[width=48px,height=48px]{dave.jpeg}
  Measure your website readability!\\
  www.readability-score.com
\end{tabulary}
\end{multicols}}

\begin{document}
\raggedright
\raggedcolumns

% Set font size to small. Switch to any value
% from this page to resize cheat sheet text:
% www.emerson.emory.edu/services/latex/latex_169.html
\footnotesize % Small font.

\begin{multicols*}{2}

% NOTE(review): tokens such as \{\{bb=1\}\} or \{\{fa-arrow-right\}\} typeset as
% literal "{{...}}" text; they look like unconverted Cheatography markup -- confirm.
\begin{tabularx}{8.4cm}{x{2.48 cm} x{5.52 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{IMPACT Model}} \tn
% Row 0
\SetRowColor{LightBackground}
I & ID the questions \tn
% Row Count 1 (+ 1)
% Row 1
\SetRowColor{white}
M & Master the data \tn
% Row Count 2 (+ 1)
% Row 2
\SetRowColor{LightBackground}
P & Perform test plan \tn
% Row Count 3 (+ 1)
% Row 3
\SetRowColor{white}
A & Address and refine results \tn
% Row Count 4 (+ 1)
% Row 4
\SetRowColor{LightBackground}
C & Communicate insights \tn
% Row Count 5 (+ 1)
% Row 5
\SetRowColor{white}
T\{\{bb=1\}\} & Track outcomes \{\{bb=1\}\} \tn
% Row Count 6 (+ 1)
% Row 6
\SetRowColor{LightBackground}
Identify & \{\{fa-arrow-right\}\}understand the problem that needs addressing \tn
% Row Count 9 (+ 3)
% Row 7
\SetRowColor{white}
& Attributes = Audience, Scope, Use \tn
% Row Count 11 (+ 2)
% Row 8
\SetRowColor{LightBackground}
Master & \{\{fa-arrow-right\}\}what data is available \& will that data help address the problem \tn
% Row Count 15 (+ 4)
% Row 9
\SetRowColor{white}
& Need to know about the data: \tn
% Row Count 17 (+ 2)
% Row 10
\SetRowColor{LightBackground}
& how to access \tn
% Row Count 18 (+ 1)
% Row 11
\SetRowColor{white}
& availability \tn
% Row Count 19 (+ 1)
% Row 12
\SetRowColor{LightBackground}
& reliability \tn
% Row Count 20 (+ 1)
% Row 13
\SetRowColor{white}
& frequency of updates \tn
% Row Count 21 (+ 1)
% Row 14
\SetRowColor{LightBackground}
& time line of data coverage \tn
% Row Count 22 (+ 1)
% Row 15
\SetRowColor{white}
Perform Test Plan & \{\{fa-arrow-right\}\}think of the right approach to the data to be able to answer the question \tn
% Row Count 26 (+ 4)
% Row 16
\SetRowColor{LightBackground}
& ID relationship between response/ dependent and predictor/ explanatory/ independent variables \tn
% Row Count 30 (+ 4)
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{2.48 cm} x{5.52 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{IMPACT Model (cont)}} \tn
% Row 17
\SetRowColor{LightBackground}
& {\bf{8 approaches}} \tn
% Row Count 1 (+ 1)
% Row 18
\SetRowColor{white}
& \{\{fa-circle\}\} Classification "sorting into predefined categories" \tn
% Row Count 4 (+ 3)
% Row 19
\SetRowColor{LightBackground}
& \{\{fa-circle\}\} Regression "a number" \tn
% Row Count 6 (+ 2)
% Row 20
\SetRowColor{white}
& \{\{fa-circle\}\} Similarity Matching "similar individuals" \tn
% Row Count 9 (+ 3)
% Row 21
\SetRowColor{LightBackground}
& \{\{fa-circle\}\} Clustering "finding natural groups" \tn
% Row Count 11 (+ 2)
% Row 22
\SetRowColor{white}
& \{\{fa-circle\}\}Co-occurrence grouping "associations based on transactions" \tn
% Row Count 14 (+ 3)
% Row 23
\SetRowColor{LightBackground}
& \{\{fa-circle\}\} Profiling "the typical" \tn
% Row Count 16 (+ 2)
% Row 24
\SetRowColor{white}
& \{\{fa-circle\}\} Link Prediction "relationship between two data" \tn
% Row Count 19 (+ 3)
% Row 25
\SetRowColor{LightBackground}
& \{\{fa-circle\}\} Data Reduction "Reduces to most critical" \tn
% Row Count 22 (+ 3)
% Row 26
\SetRowColor{white}
Address and refine & \{\{fa-arrow-right\}\}Data analysis is iterative \tn
% Row Count 24 (+ 2)
% Row 27
\SetRowColor{LightBackground}
& slice, dice, and manipulate the data \tn
% Row Count 26 (+ 2)
% Row 28
\SetRowColor{white}
Communicate & \{\{fa-arrow-right\}\}insights are formed by decision
makers and are communicated \tn
% The line above finishes the "Communicate" cell of the IMPACT Model table.
% This span closes that table and opens "Business Environment and Big Data";
% one statement or comment per line so no `%` comment can swallow code.
% Row Count 29 (+ 3)
% Row 29
\SetRowColor{LightBackground}
& executive summaries, static reports, digital dashboards, and data visualizations \tn
% Row Count 32 (+ 3)
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{2.48 cm} x{5.52 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{IMPACT Model (cont)}} \tn
% Row 30
\SetRowColor{LightBackground}
Track outcomes & \{\{fa-arrow-right\}\}can we predict future outcomes \tn
% Row Count 2 (+ 2)
% Row 31
\SetRowColor{white}
& then you can test how accurate the predictions were \tn
% Row Count 4 (+ 2)
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\end{tabularx}
\par\addvspace{1.3em}

\begin{tabularx}{8.4cm}{x{2.72 cm} x{5.28 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Business Environment and Big Data}} \tn
% Row 0
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{Big Data} \tn
% Row Count 1 (+ 1)
% Row 1
\SetRowColor{white}
4 V's & Volume (size) \tn
% Row Count 2 (+ 1)
% Row 2
\SetRowColor{LightBackground}
& Velocity (speed) \tn
% Row Count 3 (+ 1)
% Row 3
\SetRowColor{white}
& Variety (types) \tn
% Row Count 4 (+ 1)
% Row 4
\SetRowColor{LightBackground}
& Veracity (quality) \tn
% Row Count 5 (+ 1)
% Row 5
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Impact of data}} \{\{ac\}\} \{\{bb=1\}\} \{\{bt=1\}\}} \tn
% Row Count 6 (+ 1)
% Row 6
\SetRowColor{LightBackground}
Auditing & Audits must embrace technology. \tn
% Row Count 8 (+ 2)
% Row 7
\SetRowColor{white}
& Technology = better quality, transparency, accuracy in audit.
\tn
% The \tn above ends row 7 of "Business Environment and Big Data".
% This span holds the rest of that table, its "(cont)" part and the first rows
% of "Relational Database"; one statement or comment per line.
% Row Count 11 (+ 3)
% Row 8
\SetRowColor{LightBackground}
& gathering data \{\{fa-arrow-right\}\} rationale behind data queries \tn
% Row Count 14 (+ 3)
% Row 9
\SetRowColor{white}
& expands auditors' capabilities in fraud detection \tn
% Row Count 16 (+ 2)
% Row 10
\SetRowColor{LightBackground}
& automating compliance-monitoring activities \tn
% Row Count 18 (+ 2)
% Row 11
\SetRowColor{white}
Management Accounting & (most similar to analytics) \tn
% Row Count 20 (+ 2)
% Row 12
\SetRowColor{LightBackground}
& Job of MA: \tn
% Row Count 21 (+ 1)
% Row 13
\SetRowColor{white}
& are asked questions by management \tn
% Row Count 23 (+ 2)
% Row 14
\SetRowColor{LightBackground}
& find data to address those questions \tn
% Row Count 25 (+ 2)
% Row 15
\SetRowColor{white}
& analyze the data \tn
% Row Count 26 (+ 1)
% Row 16
\SetRowColor{LightBackground}
& report the results to management \tn
% Row Count 28 (+ 2)
% Row 17
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{Financial Reporting} \tn
% Row Count 29 (+ 1)
% Row 18
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{Financial Statement Analysis} \tn
% Row Count 30 (+ 1)
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{2.72 cm} x{5.28 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Business Environment and Big Data (cont)}} \tn
% Row 19
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{Tax} \tn
% Row Count 1 (+ 1)
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\end{tabularx}
\par\addvspace{1.3em}

\begin{tabularx}{8.4cm}{x{3.76 cm} x{4.24 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Relational Database}} \tn
% Row 0
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{Benefits of (3NF) Relational DB} \tn
% Row Count 1 (+ 1)
% Row 1
\SetRowColor{white}
& Completeness \tn
% Row Count 2 (+ 1)
% Row 2
\SetRowColor{LightBackground}
& No redundancy \tn
% Row Count 3 (+ 1)
% Row 3
% "Relational Database" table, rows 3-18, then the start of its "(cont)" part.
% One statement or comment per line so no `%` comment can swallow code.
\SetRowColor{white}
& Business rules enforcement (IC) \tn
% Row Count 5 (+ 2)
% Row 4
\SetRowColor{LightBackground}
\{\{bb=1\}\} & \{\{bb=1\}\} Communication and integration of business processes \tn
% Row Count 8 (+ 3)
% Row 5
\SetRowColor{white}
ETL process & extract, transform, load \tn
% Row Count 10 (+ 2)
% Row 6
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{{\emph{doing what to the data?}} \{\{ac\}\}} \tn
% Row Count 11 (+ 1)
% Row 7
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{Extract} \tn
% Row Count 12 (+ 1)
% Row 8
\SetRowColor{LightBackground}
& 1. Determining the purpose and scope \tn
% Row Count 14 (+ 2)
% Row 9
\SetRowColor{white}
& 2. Obtaining \tn
% Row Count 15 (+ 1)
% Row 10
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{Transform} \tn
% Row Count 16 (+ 1)
% Row 11
\SetRowColor{white}
& 3. Validating for completeness and integrity \tn
% Row Count 19 (+ 3)
% Row 12
\SetRowColor{LightBackground}
& 4. Cleaning \tn
% Row Count 20 (+ 1)
% Row 13
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{Load} \tn
% Row Count 21 (+ 1)
% Row 14
\SetRowColor{LightBackground}
\{\{bb=2\}\} & 5. Loading the data \{\{bb=2\}\} \tn
% Row Count 23 (+ 2)
% Row 15
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{{\bf{ DO a VICy Clean Load}}\{\{ac\}\}} \tn
% Row Count 24 (+ 1)
% Row 16
\SetRowColor{LightBackground}
{\bf{Step 1}} Determining \{\{border=1\}\} & \{\{bb=1\}\} the purpose, to solve, what problem \tn
% Row Count 27 (+ 3)
% Row 17
\SetRowColor{white}
& reliability, usefulness \tn
% Row Count 29 (+ 2)
% Row 18
\SetRowColor{LightBackground}
& nature, timing, and extent \tn
% Row Count 31 (+ 2)
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{3.76 cm} x{4.24 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Relational Database (cont)}} \tn
% Row 19
\SetRowColor{LightBackground}
{\bf{Step 2}} Obtaining \{\{border=1\}\} & \{\{bb=1\}\} How obtain?
\tn
% The \tn above ends row 19 of "Relational Database (cont)"; rows 20-32 follow.
% One statement or comment per line so no `%` comment can swallow code.
% Row Count 2 (+ 2)
% Row 20
\SetRowColor{white}
& standard data request form?? \tn
% Row Count 4 (+ 2)
% Row 21
\SetRowColor{LightBackground}
& Where data? \tn
% Row Count 5 (+ 1)
% Row 22
\SetRowColor{white}
& What specific data? \tn
% Row Count 6 (+ 1)
% Row 23
\SetRowColor{LightBackground}
& what tools needed \tn
% Row Count 7 (+ 1)
% Row 24
\SetRowColor{white}
ID what {\bf{you}} need to Extract & Where is {\bf{your}} info \tn
% Row Count 9 (+ 2)
% Row 25
\SetRowColor{LightBackground}
& tables \tn
% Row Count 10 (+ 1)
% Row 26
\SetRowColor{white}
& attributes \tn
% Row Count 11 (+ 1)
% Row 27
\SetRowColor{LightBackground}
& relations between the 2 \tn
% Row Count 13 (+ 2)
% Row 28
\SetRowColor{white}
{\bf{Step 3}} Validating \{\{border=1\}\} & \{\{bb=1\}\} ensure extracted data = complete \& integrity \tn
% Row Count 16 (+ 3)
% Row 29
\SetRowColor{LightBackground}
4 steps after extraction & 1. Compare number of records in OG and extracted \tn
% Row Count 19 (+ 3)
% Row 30
\SetRowColor{white}
& 2. Compare descriptive statistics \tn
% Row Count 21 (+ 2)
% Row 31
\SetRowColor{LightBackground}
& 3. Validate Date/Time fields \tn
% Row Count 23 (+ 2)
% Row 32
\SetRowColor{white}
& 4.
Compare string limits \tn
% The line above finishes row 32 of "Relational Database (cont)".
% This span holds the remaining Relational Database rows and opens "4 quads";
% one statement or comment per line so no `%` comment can swallow code.
% Row Count 25 (+ 2)
% Row 33
\SetRowColor{LightBackground}
{\bf{Step 4}} \{\{border=1\}\} & \{\{bb=1\}\} Cleaning \tn
% Row Count 27 (+ 2)
% Row 34
\SetRowColor{white}
4 steps to clean & Remove headings or subtotals \tn
% Row Count 29 (+ 2)
% Row 35
\SetRowColor{LightBackground}
& Clean leading zeroes and (NPC's) nonprintable characters \tn
% Row Count 32 (+ 3)
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{3.76 cm} x{4.24 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Relational Database (cont)}} \tn
% Row 36
\SetRowColor{LightBackground}
& Format negative numbers \tn
% Row Count 2 (+ 2)
% Row 37
\SetRowColor{white}
& Correct inconsistencies (US, U.S., United States, States) \tn
% Row Count 5 (+ 3)
% Row 38
\SetRowColor{LightBackground}
Common quality issues & Dates \tn
% Row Count 7 (+ 2)
% Row 39
\SetRowColor{white}
& Numbers \tn
% Row Count 8 (+ 1)
% Row 40
\SetRowColor{LightBackground}
& International characters and encoding \tn
% Row Count 10 (+ 2)
% Row 41
\SetRowColor{white}
& Languages and measures \tn
% Row Count 12 (+ 2)
% Row 42
\SetRowColor{LightBackground}
& Human error \tn
% Row Count 13 (+ 1)
% Row 43
\SetRowColor{white}
{\bf{Step 5}} \{\{border=1\}\} & \{\{bb=1\}\} Loading \tn
% Row Count 15 (+ 2)
% Row 44
\SetRowColor{LightBackground}
& if previous steps were done correctly then no loading necessary \tn
% Row Count 18 (+ 3)
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{Extract = Determining \& Obtaining / 1 \& 2 \newline Transform = Validating \& Cleaning / 3 \& 4 \newline Load = Load / 5} \tn
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\end{tabularx}
\par\addvspace{1.3em}

\begin{tabularx}{8.4cm}{x{2.052 cm} x{2.812 cm} x{2.736 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{3}{x{8.4cm}}{\bf\textcolor{white}{4 quads}} \tn
% Row 0
\SetRowColor{LightBackground}
\{\{bb=3\}\}\{\{br=3\}\} &
Declarative\{\{bb=3\}\}\{\{br=3\}\} & Exploratory\{\{bb=3\}\}\{\{br=3\}\} \tn
% The line above finishes row 0 of the "4 quads" table.
% This span holds the rest of "4 quads", the "Distributions" and
% "Data Governance and Ethics" tables, and the first rows of "7 goals CH1";
% one statement or comment per line so no `%` comment can swallow code.
% Row Count 2 (+ 2)
% Row 1
\SetRowColor{white}
Qual\{\{br=3\}\}\{\{bb=3\}\} & Quad 1\{\{br=1\}\}\{\{bb=1\}\} & Quad 3\{\{bb=1\}\} \tn
% Row Count 4 (+ 2)
% Row 2
\SetRowColor{LightBackground}
Quan\{\{br=3\}\}\{\{bb=3\}\} & Quad 2\{\{br=1\}\} & Quad 4 \tn
% Row Count 6 (+ 2)
\hhline{>{\arrayrulecolor{DarkBackground}}---}
\end{tabularx}
\par\addvspace{1.3em}

\begin{tabularx}{8.4cm}{x{4 cm} x{4 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Distributions}} \tn
% Row 0
\SetRowColor{LightBackground}
Normal Distribution & ANY mean and ANY standard deviation \tn
% Row Count 2 (+ 2)
% Row 1
\SetRowColor{white}
& The mean, median, and mode are all equal \tn
% Row Count 4 (+ 2)
% Row 2
\SetRowColor{LightBackground}
& Half the data falls below the mean, half above \tn
% Row Count 7 (+ 3)
% Row 3
\SetRowColor{white}
& SAT scores, IQ scores, heights and weights of newborn babies \tn
% Row Count 10 (+ 3)
% Row 4
\SetRowColor{LightBackground}
Standard Normal Distribution & special \{\{fa-star-o\}\} \tn
% Row Count 12 (+ 2)
% Row 5
\SetRowColor{white}
not typical for data-driven quantitative data & A mean of exactly 0 \tn
% Row Count 15 (+ 3)
% Row 6
\SetRowColor{LightBackground}
& A standard deviation of exactly 1 \tn
% Row Count 17 (+ 2)
% Row 7
\SetRowColor{white}
& the mean is 0, the median and mode are also 0 \tn
% Row Count 20 (+ 3)
% Row 8
\SetRowColor{LightBackground}
Poisson Distribution \{\{fa-ban\}\} & the probability of a specific number of events happening in a fixed time period \tn
% Row Count 24 (+ 4)
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\end{tabularx}
\par\addvspace{1.3em}

\begin{tabularx}{8.4cm}{x{2.64 cm} x{5.36 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Data Governance and Ethics}} \tn
% Row 0
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{Institute of Business Ethics} \tn
% Row Count 1 (+ 1)
% Row 1
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{6 Questions} \tn
% Row Count 2 (+ 1)
% Row 2
\SetRowColor{LightBackground}
Does the company.... & How does the company use data? \tn
% Row Count 4 (+ 2)
% Row 3
\SetRowColor{white}
& ...send a privacy notice? \tn
% Row Count 5 (+ 1)
% Row 4
\SetRowColor{LightBackground}
& ...assess the risks for the customer? \tn
% Row Count 7 (+ 2)
% Row 5
\SetRowColor{white}
& ...have safeguards for the risks of data misuse? \tn
% Row Count 9 (+ 2)
% Row 6
\SetRowColor{LightBackground}
& ... have the appropriate tools to manage the risks of data misuse? \tn
% Row Count 12 (+ 3)
% Row 7
\SetRowColor{white}
& ...conduct appropriate due diligence when sharing with or acquiring data from third parties? \tn
% Row Count 16 (+ 4)
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{\{\{fa-user-secret\}\} LMAO this is America, we have no data protection \newline \{\{fa-dollar\}\} This country is ruled by the amount of profit that share holders can extract \newline \{\{fa-institution\}\} No data rights for our own data \newline \#bigbrother4profit} \tn
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\end{tabularx}
\par\addvspace{1.3em}

\begin{tabularx}{8.4cm}{x{3.92 cm} x{4.08 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{7 goals CH1}} \tn
% Row 0
\SetRowColor{LightBackground}
Developed Analytics Mindset & Recognize when and how data analytics can address business questions. \tn
% Row Count 4 (+ 4)
% Row 1
\SetRowColor{white}
Data Scrubbing and Data Preparation & Comprehend the process needed to clean and prepare the data before analysis. \tn
% Row Count 8 (+ 4)
% Row 2
\SetRowColor{LightBackground}
Data Quality & Recognize what is meant by data quality, be it completeness, reliability, or validity.
\tn
% The \tn above ends row 2 of "7 goals CH1"; rows 3-5 and the start of the
% "(cont)" part follow. One statement or comment per line.
% Row Count 13 (+ 5)
% Row 3
\SetRowColor{white}
Descriptive Data Analysis & Perform basic analysis to understand the quality of the underlying data and its ability to address the business question. \tn
% Row Count 20 (+ 7)
% Row 4
\SetRowColor{LightBackground}
Data Analysis through Data Manipulation & Demonstrate the ability to sort, rearrange, merge, and reconfigure data in a manner that allows enhanced analysis. \tn
% Row Count 26 (+ 6)
% Row 5
\SetRowColor{white}
Statistical Data Analysis Competency & Identify and implement an approach that will use statistical data analysis to draw conclusions and make recommendations on a timely basis. \tn
% Row Count 33 (+ 7)
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{3.92 cm} x{4.08 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{7 goals CH1 (cont)}} \tn
% Row 6
\SetRowColor{LightBackground}
Data Visualization and Data Reporting & Report results of analysis in an accessible way to each varied decision maker and their specific needs.
\tn
% The \tn above ends row 6 of "7 goals CH1 (cont)". This span closes that table
% and holds rows 0-14 of "Main Types of Data Analytics";
% one statement or comment per line so no `%` comment can swallow code.
% Row Count 6 (+ 6)
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\end{tabularx}
\par\addvspace{1.3em}

\begin{tabularx}{8.4cm}{x{4 cm} x{4 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Main Types of Data Analytics}} \tn
% Row 0
\SetRowColor{LightBackground}
Descriptive (past) & summarize existing data \tn
% Row Count 2 (+ 2)
% Row 1
\SetRowColor{white}
& what has happened \tn
% Row Count 3 (+ 1)
% Row 2
\SetRowColor{LightBackground}
Diagnostic (current) & explore the data \tn
% Row Count 4 (+ 1)
% Row 3
\SetRowColor{white}
& why something has happened the way it has \tn
% Row Count 7 (+ 3)
% Row 4
\SetRowColor{LightBackground}
Predictive (future) & used to generate a model \tn
% Row Count 9 (+ 2)
% Row 5
\SetRowColor{white}
& what is likely to happen \tn
% Row Count 11 (+ 2)
% Row 6
\SetRowColor{LightBackground}
Prescriptive (current/ for future) & identify the best possible options given constraints \tn
% Row Count 14 (+ 3)
% Row 7
\SetRowColor{white}
& more advanced AI \tn
% Row Count 15 (+ 1)
% Row 8
\SetRowColor{LightBackground}
\{\{bb=1\}\} & optimize current processes \{\{bb=1\}\} \tn
% Row Count 17 (+ 2)
% Row 9
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Descriptive}}\{\{border=1\}\}} \tn
% Row Count 18 (+ 1)
% Row 10
\SetRowColor{LightBackground}
Summary statistics & mean, median, standard deviation, etc. \tn
% Row Count 20 (+ 2)
% Row 11
\SetRowColor{white}
Data reduction or filtering & {\emph{IFIF (Identify attribute, Filter, Interpret, Follow up)}} \tn
% Row Count 23 (+ 3)
% Row 12
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Diagnostic}}\{\{border=1\}\}} \tn
% Row Count 24 (+ 1)
% Row 13
\SetRowColor{white}
Benefits of Diagnostic & reduced external audit fees, reduced audit delay, lower material weaknesses, restatements \tn
% Row Count 29 (+ 5)
% Row 14
\SetRowColor{LightBackground}
Profiling\{\{fa-arrow-right\}\} & Characterizes the {\bf{typical}} behavior \tn
% Row Count 31 (+ 2)
% Closes the first part of "Main Types of Data Analytics", then rows 15-26 of
% its "(cont)" part and the header of the next "(cont)" part.
% One statement or comment per line so no `%` comment can swallow code.
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{4 cm} x{4 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Main Types of Data Analytics (cont)}} \tn
% Row 15
\SetRowColor{LightBackground}
& IDSIF (ID, Determine, Set boundaries, Interpret, Follow-up) \tn
% Row Count 3 (+ 3)
% Row 16
\SetRowColor{white}
{\emph{How profile?}} & {\emph{Z-score}} \tn
% Row Count 4 (+ 1)
% Row 17
\SetRowColor{LightBackground}
& {\emph{Box Whisker}} \tn
% Row Count 5 (+ 1)
% Row 18
\SetRowColor{white}
& {\emph{interquartile range (IQR)}} \tn
% Row Count 7 (+ 2)
% Row 19
\SetRowColor{LightBackground}
Clustering (finding natural groups) \{\{fa-arrow-right\}\} & {\bf{Divides}} individuals into groups that share common underlying characteristics \tn
% Row Count 11 (+ 4)
% Row 20
\SetRowColor{white}
Hypothesis Testing & proof if P\&C are meaningful \tn
% Row Count 13 (+ 2)
% Row 21
\SetRowColor{LightBackground}
Similarity matching \{\{fa-arrow-right\}\} & Identifies similar individuals based on data already known about them \tn
% Row Count 17 (+ 4)
% Row 22
\SetRowColor{white}
Cooccurrence grouping & Discovers associations between individuals based on transactions they are both involved in \tn
% Row Count 22 (+ 5)
% Row 23
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Predictive}}\{\{border=1\}\}} \tn
% Row Count 23 (+ 1)
% Row 24
\SetRowColor{white}
& target = attribute or value to evaluate \tn
% Row Count 25 (+ 2)
% Row 25
\SetRowColor{LightBackground}
& class = assigned category (to record for event) \tn
% Row Count 28 (+ 3)
% Row 26
\SetRowColor{white}
Regression (number) & Estimates or predicts a numerical value for a variable using a statistical model \tn
% Row Count 32 (+ 4)
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{4 cm} x{4 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Main Types of Data Analytics (cont)}} \tn
% Row 27
% "Main Types of Data Analytics (cont)", rows 27-33.
% One statement or comment per line so no `%` comment can swallow code.
\SetRowColor{LightBackground}
IV/DFF/IP/EF & Identify the variables, Determine the functional form, Identify parameters, Evaluate fit \tn
% Row Count 5 (+ 5)
% Row 28
\SetRowColor{white}
Classification (sorting into predefined categories) & Assigns each unit into a small set of categories or classes \tn
% Row Count 8 (+ 3)
% Row 29
\SetRowColor{LightBackground}
Link Prediction (relationship) & Predicts a relationship between two data items \tn
% Row Count 11 (+ 3)
% Row 30
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Prescriptive}}\{\{border=1\}\}} \tn
% Row Count 12 (+ 1)
% Row 31
\SetRowColor{LightBackground}
Decision support systems & Rule-based systems that gather data and recommend actions \tn
% Row Count 15 (+ 3)
% Row 32
\SetRowColor{white}
Artificial intelligence & Learning models that adapt to new data over time to make recommendations \tn
% Row Count 19 (+ 4)
% Row 33
\SetRowColor{LightBackground}
{\bf{Benford's law}} & The law states that in many naturally occurring collections of numbers, the significant leading digit is likely to be small.
\tn
% The \tn above ends row 33 of "Main Types of Data Analytics (cont)".
% This span finishes that table and holds "Graphs Charts and Tables OH MY!"
% up to the first cell of row 24; one statement or comment per line.
% Row Count 26 (+ 7)
% Row 34
\SetRowColor{white}
overfitting\{\{bt=1\}\} & complex models\{\{bt=1\}\} \tn
% Row Count 28 (+ 2)
% Row 35
\SetRowColor{LightBackground}
underfitting & simple models \tn
% Row Count 29 (+ 1)
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{significance level = alpha \newline t-test = p-value \textless{} alpha = statistically significant else \{\{fa-thumbs-o-down\}\}} \tn
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\end{tabularx}
\par\addvspace{1.3em}

\begin{tabularx}{8.4cm}{x{4 cm} x{4 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Graphs Charts and Tables OH MY!}} \tn
% Row 0
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Why Pictures?}}\{\{bb=1\}\}} \tn
% Row Count 1 (+ 1)
% Row 1
\SetRowColor{white}
statistics & alone can be misleading \tn
% Row Count 3 (+ 2)
% Row 2
\SetRowColor{LightBackground}
visualizations & visualizations \tn
% Row Count 4 (+ 1)
% Row 3
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Purpose }}\{\{bt=1\}\}} \tn
% Row Count 5 (+ 1)
% Row 4
\SetRowColor{LightBackground}
Declarative & presenting findings \tn
% Row Count 6 (+ 1)
% Row 5
\SetRowColor{white}
Exploratory & discovering insights \tn
% Row Count 7 (+ 1)
% Row 6
\SetRowColor{LightBackground}
Qualitative & categorical \tn
% Row Count 8 (+ 1)
% Row 7
\SetRowColor{white}
Quantitative & numerical \tn
% Row Count 9 (+ 1)
% Row 8
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Data Types}}\{\{bt=1\}\}} \tn
% Row Count 10 (+ 1)
% Row 9
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{Qualitative Data (categorical):} \tn
% Row Count 11 (+ 1)
% Row 10
\SetRowColor{LightBackground}
Nominal & only count and group \tn
% Row Count 12 (+ 1)
% Row 11
\SetRowColor{white}
Ordinal & \{\{fa-angle-down\}\} AND rank \tn
% Row Count 14 (+ 2)
% Row 12
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{Quantitative Data (numerical):} \tn
% Row Count 15 (+ 1)
% Row 13
\SetRowColor{white}
Interval (no 0) & \{\{fa-angle-down\}\}and measure differences \tn
% Row Count 17 (+ 2)
% Row 14
\SetRowColor{LightBackground}
Ratio & \{\{fa-angle-down\}\}has a meaningful zero \tn
% Row Count 19 (+ 2)
% Row 15
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{{\bf{The right chart}}\{\{bt=1\}\}} \tn
% Row Count 20 (+ 1)
% Row 16
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{QUAL} \tn
% Row Count 21 (+ 1)
% Row 17
\SetRowColor{white}
Bar/Column C. & compares proportions of categories \tn
% Row Count 23 (+ 2)
% Row 18
\SetRowColor{LightBackground}
\{\{fa-pie-chart\}\} Pie chart C. & parts of a whole \tn
% Row Count 25 (+ 2)
% Row 19
\SetRowColor{white}
Stacked bar C. & shows proportion AND allows comparison \tn
% Row Count 27 (+ 2)
% Row 20
\SetRowColor{LightBackground}
Word cloud & used for text data \tn
% Row Count 28 (+ 1)
% Row 21
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{QUAN} \tn
% Row Count 29 (+ 1)
% Row 22
\SetRowColor{LightBackground}
\{\{fa-line-chart\}\}Line C. (continuous ) & trends over time \tn
% Row Count 31 (+ 2)
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{4 cm} x{4 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Graphs Charts and Tables OH MY! (cont)}} \tn
% Row 23
\SetRowColor{LightBackground}
Box and whisker P. & quartiles, medians, and outliers \tn
% Row Count 2 (+ 2)
% Row 24
\SetRowColor{white}
Scatter P.
& correlation between two variables or a trend line \tn
% The line above finishes row 24 of "Graphs Charts and Tables OH MY! (cont)".
% Rows 25-37 follow, then the opening of the next "(cont)" part;
% one statement or comment per line so no `%` comment can swallow code.
% Row Count 5 (+ 3)
% Row 25
\SetRowColor{LightBackground}
Filled geographic map & data ranges across geography \tn
% Row Count 7 (+ 2)
% Row 26
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Refining}}\{\{bt=1\}\}} \tn
% Row Count 8 (+ 1)
% Row 27
\SetRowColor{LightBackground}
\textasciitilde{}readability\textasciitilde{} & How much data do you need to show \tn
% Row Count 10 (+ 2)
% Row 28
\SetRowColor{white}
& Should outliers be displayed or removed? \tn
% Row Count 12 (+ 2)
% Row 29
\SetRowColor{LightBackground}
\textasciitilde{}make differences look dramatic\{\{fa-bomb\}\}\textasciitilde{} & What scale should be used? \tn
% Row Count 15 (+ 3)
% Row 30
\SetRowColor{white}
& Do you need reference points to make the scale meaningful? \tn
% Row Count 18 (+ 3)
% Row 31
\SetRowColor{LightBackground}
\textasciitilde{}\{\{fa-ban\}\}distract from data\textasciitilde{} & When should you use multiple colors? \tn
% Row Count 20 (+ 2)
% Row 32
\SetRowColor{white}
\mymulticolumn{2}{x{8.4cm}}{{\bf{Reports}}} \tn
% Row Count 21 (+ 1)
% Row 33
\SetRowColor{LightBackground}
\mymulticolumn{2}{x{8.4cm}}{get to the point} \tn
% Row Count 22 (+ 1)
% Row 34
\SetRowColor{white}
I & Explain what was being researched \tn
% Row Count 24 (+ 2)
% Row 35
\SetRowColor{LightBackground}
M & Overview of the data source and what data was included \tn
% Row Count 27 (+ 3)
% Row 36
\SetRowColor{white}
P & Describe the analytical approach used \tn
% Row Count 29 (+ 2)
% Row 37
\SetRowColor{LightBackground}
A & Present the results of the analysis \tn
% Row Count 31 (+ 2)
\end{tabularx}
\par\addvspace{1.3em}

\vfill
\columnbreak
\begin{tabularx}{8.4cm}{x{4 cm} x{4 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Graphs Charts and Tables OH MY!
(cont)}} \tn
% The line above finishes the header row of the last "Graphs Charts and Tables
% OH MY! (cont)" table. Its rows 38-39, the "Data Types" table and the end of
% the document follow; one statement or comment per line.
% Row 38
\SetRowColor{LightBackground}
C & Communicate the insights and what they mean \tn
% Row Count 3 (+ 3)
% Row 39
\SetRowColor{white}
T & Describe what outcomes will be tracked going forward \tn
% Row Count 6 (+ 3)
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\end{tabularx}
\par\addvspace{1.3em}

\begin{tabularx}{8.4cm}{x{2 cm} x{6 cm} }
\SetRowColor{DarkBackground}
\mymulticolumn{2}{x{8.4cm}}{\bf\textcolor{white}{Data Types}} \tn
% Row 0
\SetRowColor{LightBackground}
Discrete Data & whole numbers \tn
% Row Count 2 (+ 2)
% Row 1
\SetRowColor{white}
& number of students in a class \tn
% Row Count 3 (+ 1)
% Row 2
\SetRowColor{LightBackground}
Interval Data & the differences between values are meaningful and equal \tn
% Row Count 5 (+ 2)
% Row 3
\SetRowColor{white}
& Fahrenheit temperature \tn
% Row Count 6 (+ 1)
% Row 4
\SetRowColor{LightBackground}
& time on a clock \tn
% Row Count 7 (+ 1)
% Row 5
\SetRowColor{white}
Ratio data & requires a true zero \tn
% Row Count 8 (+ 1)
% Row 6
\SetRowColor{LightBackground}
& 0 pounds = no weight \tn
% Row Count 9 (+ 1)
% Row 7
\SetRowColor{white}
& 0 dollars = no money \{\{fa-arrow-right\}\} no problems \tn
% Row Count 11 (+ 2)
\hhline{>{\arrayrulecolor{DarkBackground}}--}
\end{tabularx}
\par\addvspace{1.3em}

% That's all folks
\end{multicols*}

\end{document}