\documentclass[10pt,a4paper]{article} % Packages \usepackage{fancyhdr} % For header and footer \usepackage{multicol} % Allows multicols in tables \usepackage{tabularx} % Intelligent column widths \usepackage{tabulary} % Used in header and footer \usepackage{hhline} % Border under tables \usepackage{graphicx} % For images \usepackage{xcolor} % For hex colours %\usepackage[utf8x]{inputenc} % For unicode character support \usepackage[T1]{fontenc} % Without this we get weird character replacements \usepackage{colortbl} % For coloured tables \usepackage{setspace} % For line height \usepackage{lastpage} % Needed for total page number \usepackage{seqsplit} % Splits long words. %\usepackage{opensans} % Can't make this work so far. Shame. Would be lovely. \usepackage[normalem]{ulem} % For underlining links % Most of the following are not required for the majority % of cheat sheets but are needed for some symbol support. \usepackage{amsmath} % Symbols \usepackage{MnSymbol} % Symbols \usepackage{wasysym} % Symbols %\usepackage[english,german,french,spanish,italian]{babel} % Languages % Document Info \author{Robyn.jll} \pdfinfo{ /Title (psychological-statistics.pdf) /Creator (Cheatography) /Author (Robyn.jll) /Subject (Psychological Statistics Cheat Sheet) } % Lengths and widths \addtolength{\textwidth}{6cm} \addtolength{\textheight}{-1cm} \addtolength{\hoffset}{-3cm} \addtolength{\voffset}{-2cm} \setlength{\tabcolsep}{0.2cm} % Space between columns \setlength{\headsep}{-12pt} % Reduce space between header and content \setlength{\headheight}{85pt} % If less, LaTeX automatically increases it \renewcommand{\footrulewidth}{0pt} % Remove footer line \renewcommand{\headrulewidth}{0pt} % Remove header line \renewcommand{\seqinsert}{\ifmmode\allowbreak\else\-\fi} % Hyphens in seqsplit % This two commands together give roughly % the right line height in the tables \renewcommand{\arraystretch}{1.3} \onehalfspacing % Commands \newcommand{\SetRowColor}[1]{\noalign{\gdef\RowColorName{#1}}\rowcolor{\RowColorName}} % Shortcut for row colour \newcommand{\mymulticolumn}[3]{\multicolumn{#1}{>{\columncolor{\RowColorName}}#2}{#3}} % For coloured multi-cols \newcolumntype{x}[1]{>{\raggedright}p{#1}} % New column types for ragged-right paragraph columns \newcommand{\tn}{\tabularnewline} % Required as custom column type in use % Font and Colours \definecolor{HeadBackground}{HTML}{333333} \definecolor{FootBackground}{HTML}{666666} \definecolor{TextColor}{HTML}{333333} \definecolor{DarkBackground}{HTML}{A3A3A3} \definecolor{LightBackground}{HTML}{F3F3F3} \renewcommand{\familydefault}{\sfdefault} \color{TextColor} % Header and Footer \pagestyle{fancy} \fancyhead{} % Set header to blank \fancyfoot{} % Set footer to blank \fancyhead[L]{ \noindent \begin{multicols}{3} \begin{tabulary}{5.8cm}{C} \SetRowColor{DarkBackground} \vspace{-7pt} {\parbox{\dimexpr\textwidth-2\fboxsep\relax}{\noindent \hspace*{-6pt}\includegraphics[width=5.8cm]{/web/www.cheatography.com/public/images/cheatography_logo.pdf}} } \end{tabulary} \columnbreak \begin{tabulary}{11cm}{L} \vspace{-2pt}\large{\bf{\textcolor{DarkBackground}{\textrm{Psychological Statistics Cheat Sheet}}}} \\ \normalsize{by \textcolor{DarkBackground}{Robyn.jll} via \textcolor{DarkBackground}{\uline{cheatography.com/146401/cs/31664/}}} \end{tabulary} \end{multicols}} \fancyfoot[L]{ \footnotesize \noindent \begin{multicols}{3} \begin{tabulary}{5.8cm}{LL} \SetRowColor{FootBackground} \mymulticolumn{2}{p{5.377cm}}{\bf\textcolor{white}{Cheatographer}} \\ \vspace{-2pt}Robyn.jll \\ \uline{cheatography.com/robyn-jll} \\ \end{tabulary} \vfill \columnbreak \begin{tabulary}{5.8cm}{L} \SetRowColor{FootBackground} \mymulticolumn{1}{p{5.377cm}}{\bf\textcolor{white}{Cheat Sheet}} \\ \vspace{-2pt}Not Yet Published.\\ Updated 13th April, 2022.\\ Page {\thepage} of \pageref{LastPage}. \end{tabulary} \vfill \columnbreak \begin{tabulary}{5.8cm}{L} \SetRowColor{FootBackground} \mymulticolumn{1}{p{5.377cm}}{\bf\textcolor{white}{Sponsor}} \\ \SetRowColor{white} \vspace{-5pt} %\includegraphics[width=48px,height=48px]{dave.jpeg} Measure your website readability!\\ www.readability-score.com \end{tabulary} \end{multicols}} \begin{document} \raggedright \raggedcolumns % Set font size to small. Switch to any value % from this page to resize cheat sheet text: % www.emerson.emory.edu/services/latex/latex_169.html \footnotesize % Small font. \begin{multicols*}{3} \begin{tabularx}{5.377cm}{x{2.04057 cm} x{2.93643 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{First look at the Data}} \tn % Row 0 \SetRowColor{LightBackground} Population & entire group that you want to draw conclusions about. \tn % Row Count 3 (+ 3) % Row 1 \SetRowColor{white} Sample & he specific group that you will collect data from. The size of the sample is always less than the total size of the population \tn % Row Count 9 (+ 6) % Row 2 \SetRowColor{LightBackground} Mean & average (μ mean of population; x̄ mean of sample) \tn % Row Count 12 (+ 3) % Row 3 \SetRowColor{white} Median & separates the sample (Mittelpunkt) \tn % Row Count 14 (+ 2) % Row 4 \SetRowColor{LightBackground} Mode & highest score \tn % Row Count 15 (+ 1) % Row 5 \SetRowColor{white} Variance & measures dispersion around the mean \tn % Row Count 17 (+ 2) % Row 6 \SetRowColor{LightBackground} Standart Deviation (SD) & estimates the SD of the sampling distribution \tn % Row Count 19 (+ 2) % Row 7 \SetRowColor{white} & FORMULA \tn % Row Count 20 (+ 1) % Row 8 \SetRowColor{LightBackground} Standard Error & Square root of the variance (σ SD of population; s SD of sample) \tn % Row Count 23 (+ 3) % Row 9 \SetRowColor{white} & s/√n \tn % Row Count 24 (+ 1) % Row 10 \SetRowColor{LightBackground} Confidence Intervalls (CI) & This is the range of values you expect your estimate to fall between if you redo your test, within a certain level of confidence. Confidence, in statistics, is another way to describe probability \tn % Row Count 33 (+ 9) \end{tabularx} \par\addvspace{1.3em} \vfill \columnbreak \begin{tabularx}{5.377cm}{x{2.04057 cm} x{2.93643 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{First look at the Data (cont)}} \tn % Row 11 \SetRowColor{LightBackground} Quantitative data & s expressed in numbers and graphs and is analyzed through statistical methods. \tn % Row Count 4 (+ 4) % Row 12 \SetRowColor{white} Qualitative data & is expressed in words and analyzed through interpretations and categorizations. \tn % Row Count 8 (+ 4) % Row 13 \SetRowColor{LightBackground} \mymulticolumn{2}{x{5.377cm}}{{\bf{Hypothesis Testing}}} \tn % Row Count 9 (+ 1) % Row 14 \SetRowColor{white} H0 & the null hypothesis of a test always predicts no effect or no relationship between variables \tn % Row Count 13 (+ 4) % Row 15 \SetRowColor{LightBackground} H1 & alternative hypothesis states your research prediction of an effect or relationship \tn % Row Count 17 (+ 4) % Row 16 \SetRowColor{white} \mymulticolumn{2}{x{5.377cm}}{{\bf{Randomisation}}} \tn % Row Count 18 (+ 1) % Row 17 \SetRowColor{LightBackground} completely randomized design & every subject is assigned to a treatment group at random. \tn % Row Count 21 (+ 3) % Row 18 \SetRowColor{white} & Ex. Subjects are all randomly assigned a level of phone use using a random number generator. \tn % Row Count 25 (+ 4) % Row 19 \SetRowColor{LightBackground} randomized block design & subjects are first grouped according to a characteristic they share, and then randomly assigned to treatments within those groups \tn % Row Count 31 (+ 6) \end{tabularx} \par\addvspace{1.3em} \vfill \columnbreak \begin{tabularx}{5.377cm}{x{2.04057 cm} x{2.93643 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{First look at the Data (cont)}} \tn % Row 20 \SetRowColor{LightBackground} & Ex. Subjects are first grouped by age, and then phone use treatments are randomly assigned within these groups. \tn % Row Count 5 (+ 5) % Row 21 \SetRowColor{white} \mymulticolumn{2}{x{5.377cm}}{{\bf{Between-subjects vs. within-subjects}}} \tn % Row Count 6 (+ 1) % Row 22 \SetRowColor{LightBackground} \seqsplit{between-subjects} design & AKA independent measures design or classic ANOVA design \tn % Row Count 9 (+ 3) % Row 23 \SetRowColor{white} & individuals receive only one of the possible levels of an experimental treatment. \tn % Row Count 13 (+ 4) % Row 24 \SetRowColor{LightBackground} & EX. Subjects are randomly assigned a level of phone use (none, low, or high) and follow that level of phone use throughout the experiment. \tn % Row Count 19 (+ 6) % Row 25 \SetRowColor{white} within-subjects design & AKA repeated measures design \tn % Row Count 21 (+ 2) % Row 26 \SetRowColor{LightBackground} & every individual receives each of the experimental treatments consecutively, and their responses to each treatment are measured. \tn % Row Count 27 (+ 6) % Row 27 \SetRowColor{white} & EX. Subjects are assigned consecutively to zero, low, and high levels of phone use throughout the experiment, and the order in which they follow these treatments is randomized. \tn % Row Count 35 (+ 8) \hhline{>{\arrayrulecolor{DarkBackground}}--} \end{tabularx} \par\addvspace{1.3em} \begin{tabularx}{5.377cm}{x{2.04057 cm} x{2.93643 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Different Scales of Measurement}} \tn % Row 0 \SetRowColor{LightBackground} Nominal Categories & do not correspond to numerical value \tn % Row Count 2 (+ 2) % Row 1 \SetRowColor{white} & Ex. British Team, German Team, ... \tn % Row Count 4 (+ 2) % Row 2 \SetRowColor{LightBackground} Ordinal Measurement or Ranks & scores can be ordered from smallest to largest, only a rank order is implied \tn % Row Count 8 (+ 4) % Row 3 \SetRowColor{white} & Ex. 1st, 2nd, 3rd, ... \tn % Row Count 9 (+ 1) % Row 4 \SetRowColor{LightBackground} Interval Measurement & size of the difference between scores is an indication of magnitude \tn % Row Count 12 (+ 3) % Row 5 \SetRowColor{white} & Ex. Bill was 5 seconds behind the winner, ... (equal interval scale of measurement - interval of 1 second) \tn % Row Count 17 (+ 5) % Row 6 \SetRowColor{LightBackground} Ratio Measurement & like Interval Measurement, but allows ratios to be meaningfully calculated between scores \tn % Row Count 21 (+ 4) % Row 7 \SetRowColor{white} & Ex. Tom took 50 seconds and Bill took 100 seconds -\textgreater{} Tom is twice as fast as Bill \tn % Row Count 25 (+ 4) \hhline{>{\arrayrulecolor{DarkBackground}}--} \end{tabularx} \par\addvspace{1.3em} \begin{tabularx}{5.377cm}{x{2.4885 cm} x{2.4885 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Types of Variables}} \tn % Row 0 \SetRowColor{LightBackground} Dependent Variable & Variables that represent the outcome of the experiment. \tn % Row Count 3 (+ 3) % Row 1 \SetRowColor{white} & Ex. Any measurement of plant health and growth: in this case, plant height and wilting. \tn % Row Count 8 (+ 5) % Row 2 \SetRowColor{LightBackground} Independent Variable & Variables you manipulate in order to affect the outcome of an experiment \tn % Row Count 12 (+ 4) % Row 3 \SetRowColor{white} & Ex. The amount of salt added to each plant's water. \tn % Row Count 15 (+ 3) % Row 4 \SetRowColor{LightBackground} Controlled Variable & Variables that are held constant throughout the experiment. \tn % Row Count 18 (+ 3) % Row 5 \SetRowColor{white} & Ex. The temperature and light in the room the plants are kept in, and the volume of water given to each plant. \tn % Row Count 24 (+ 6) % Row 6 \SetRowColor{LightBackground} Confounding Variable & A variable that hides the true effect of another variable in your experiment. This can happen when another variable is closely related to a variable you are interested in, but you haven't controlled it in your experiment. \tn % Row Count 36 (+ 12) \end{tabularx} \par\addvspace{1.3em} \vfill \columnbreak \begin{tabularx}{5.377cm}{x{2.4885 cm} x{2.4885 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Types of Variables (cont)}} \tn % Row 7 \SetRowColor{LightBackground} & Ex. Pot size and soil type might affect plant survival as much or more than salt additions. In an experiment you would control these potential confounders by holding them constant. \tn % Row Count 9 (+ 9) % Row 8 \SetRowColor{white} Latent variables & A variable that can't be directly measured, but that you represent via a proxy. \tn % Row Count 14 (+ 5) % Row 9 \SetRowColor{LightBackground} & Ex. Salt tolerance in plants cannot be measured directly, but can be inferred from measurements of plant health in our salt-addition experiment. \tn % Row Count 22 (+ 8) % Row 10 \SetRowColor{white} Composite variables & A variable that is made by combining multiple variables in an experiment. These variables are created when you analyze data, not when you measure it. \tn % Row Count 30 (+ 8) \end{tabularx} \par\addvspace{1.3em} \vfill \columnbreak \begin{tabularx}{5.377cm}{x{2.4885 cm} x{2.4885 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Types of Variables (cont)}} \tn % Row 11 \SetRowColor{LightBackground} & Ex. The three plant health variables could be combined into a single plant-health score to make it easier to present your findings. \tn % Row Count 7 (+ 7) % Row 12 \SetRowColor{white} \mymulticolumn{2}{x{5.377cm}}{{\bf{Quantitative Variables}}} \tn % Row Count 8 (+ 1) % Row 13 \SetRowColor{LightBackground} Discrete/ integer variables & Counts of individual items or values. \tn % Row Count 10 (+ 2) % Row 14 \SetRowColor{white} & Ex. Number of students in a class; Number of different tree species in a forest \tn % Row Count 14 (+ 4) % Row 15 \SetRowColor{LightBackground} Continuous variables (aka ratio variables) & Measurements of continuous or non-finite values. \tn % Row Count 17 (+ 3) % Row 16 \SetRowColor{white} & Ex. Distance, Volume, Age \tn % Row Count 19 (+ 2) % Row 17 \SetRowColor{LightBackground} \mymulticolumn{2}{x{5.377cm}}{{\bf{Categorial Variables}}} \tn % Row Count 20 (+ 1) % Row 18 \SetRowColor{white} Binary/dichotomous variables & Yes/no outcomes \tn % Row Count 22 (+ 2) % Row 19 \SetRowColor{LightBackground} Nominal variables & Groups with no rank or order between them. \tn % Row Count 25 (+ 3) % Row 20 \SetRowColor{white} & Ex. Species, Names, Colors, Brands \tn % Row Count 27 (+ 2) % Row 21 \SetRowColor{LightBackground} Ordinal variables & Groups that are ranked in a specific order. \tn % Row Count 30 (+ 3) \end{tabularx} \par\addvspace{1.3em} \vfill \columnbreak \begin{tabularx}{5.377cm}{x{2.4885 cm} x{2.4885 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Types of Variables (cont)}} \tn % Row 22 \SetRowColor{LightBackground} & Ex. Finishing place in a race, Rating scale responses in a survey \tn % Row Count 4 (+ 4) \hhline{>{\arrayrulecolor{DarkBackground}}--} \end{tabularx} \par\addvspace{1.3em} \begin{tabularx}{5.377cm}{x{1.9908 cm} x{2.9862 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Sampling}} \tn % Row 0 \SetRowColor{LightBackground} \mymulticolumn{2}{x{5.377cm}}{{\bf{Probability sampling methods}}} \tn % Row Count 1 (+ 1) % Row 1 \SetRowColor{white} \mymulticolumn{2}{x{5.377cm}}{Probability sampling means that every member of the population has a chance of being selected. It is mainly used in quantitative research. If you want to produce results that are representative of the whole population, probability sampling techniques are the most valid choice.} \tn % Row Count 7 (+ 6) % Row 2 \SetRowColor{LightBackground} Simple random sampling & every member of the population has an equal chance of being selected. Your sampling frame should include the whole population. \tn % Row Count 13 (+ 6) % Row 3 \SetRowColor{white} Systematic sampling & is similar to simple random sampling, but it is usually slightly easier to conduct. Every member of the population is listed with a number, but instead of randomly generating numbers, individuals are chosen at regular intervals. \tn % Row Count 23 (+ 10) % Row 4 \SetRowColor{LightBackground} Stratified sampling & involves dividing the population into subpopulations that may differ in important ways. It allows you draw more precise conclusions by ensuring that every subgroup is properly represented in the sample. To use this sampling method, you divide the population into subgroups (called strata) based on the relevant characteristic (e.g. gender, age range, income bracket, job role). \tn % Row Count 39 (+ 16) \end{tabularx} \par\addvspace{1.3em} \vfill \columnbreak \begin{tabularx}{5.377cm}{x{1.9908 cm} x{2.9862 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Sampling (cont)}} \tn % Row 5 \SetRowColor{LightBackground} Cluster sampling & also involves dividing the population into subgroups, but each subgroup should have similar characteristics to the whole sample. Instead of sampling individuals from each subgroup, you randomly select entire subgroups \tn % Row Count 10 (+ 10) % Row 6 \SetRowColor{white} \mymulticolumn{2}{x{5.377cm}}{{\bf{Non-probability sampling methods}}} \tn % Row Count 11 (+ 1) % Row 7 \SetRowColor{LightBackground} \mymulticolumn{2}{x{5.377cm}}{In a non-probability sample, individuals are selected based on non-random criteria, and not every individual has a chance of being included. This type of sample is easier and cheaper to access, but it has a higher risk of sampling bias. That means the inferences you can make about the population are weaker than with probability samples, and your conclusions may be more limited. If you use a non-probability sample, you should still aim to make it as representative of the population as possible. Non-probability sampling techniques are often used in exploratory and qualitative research. In these types of research, the aim is not to test a hypothesis about a broad population, but to develop an initial understanding of a small or under-researched population.} \tn % Row Count 27 (+ 16) % Row 8 \SetRowColor{white} Convenience sampling & A convenience sample simply includes the individuals who happen to be most accessible to the researcher. This is an easy and inexpensive way to gather initial data, but there is no way to tell if the sample is representative of the population, so it can't produce generalizable results. \tn % Row Count 40 (+ 13) \end{tabularx} \par\addvspace{1.3em} \vfill \columnbreak \begin{tabularx}{5.377cm}{x{1.9908 cm} x{2.9862 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Sampling (cont)}} \tn % Row 9 \SetRowColor{LightBackground} Voluntary response sampling & Similar to a convenience sample, a voluntary response sample is mainly based on ease of access. Instead of the researcher choosing participants and directly contacting them, people volunteer themselves (e.g. by responding to a public online survey). Voluntary response samples are always at least somewhat biased, as some people will inherently be more likely to volunteer than others. \tn % Row Count 17 (+ 17) % Row 10 \SetRowColor{white} Purposive sampling & This type of sampling, also known as judgement sampling, involves the researcher using their expertise to select a sample that is most useful to the purposes of the research. It is often used in qualitative research, where the researcher wants to gain detailed knowledge about a specific phenomenon rather than make statistical inferences, or where the population is very small and specific. An effective purposive sample must have clear criteria and rationale for inclusion. \tn % Row Count 37 (+ 20) \end{tabularx} \par\addvspace{1.3em} \vfill \columnbreak \begin{tabularx}{5.377cm}{x{1.9908 cm} x{2.9862 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Sampling (cont)}} \tn % Row 11 \SetRowColor{LightBackground} Snowball sampling & If the population is hard to access, snowball sampling can be used to recruit participants via other participants. The number of people you have access to "snowballs" as you get in contact with more people. \tn % Row Count 9 (+ 9) \hhline{>{\arrayrulecolor{DarkBackground}}--} \end{tabularx} \par\addvspace{1.3em} \begin{tabularx}{5.377cm}{p{0.4977 cm} p{0.4977 cm} } \SetRowColor{DarkBackground} \mymulticolumn{2}{x{5.377cm}}{\bf\textcolor{white}{Data Cleansing}} \tn % Row 0 \SetRowColor{LightBackground} \mymulticolumn{2}{x{5.377cm}}{Data cleansing involves spotting and resolving potential data inconsistencies or errors to improve your data quality.} \tn % Row Count 3 (+ 3) % Row 1 \SetRowColor{white} \mymulticolumn{2}{x{5.377cm}}{{\bf{Type I vs Type II error}}} \tn % Row Count 4 (+ 1) % Row 2 \SetRowColor{LightBackground} \mymulticolumn{2}{x{5.377cm}}{Type I error (false positive)} \tn % Row Count 5 (+ 1) % Row 3 \SetRowColor{white} \mymulticolumn{2}{x{5.377cm}}{Type II error (false negative)} \tn % Row Count 6 (+ 1) \hhline{>{\arrayrulecolor{DarkBackground}}--} \end{tabularx} \par\addvspace{1.3em} % That's all folks \end{multicols*} \end{document}