diff --git a/.gitignore b/.gitignore index b494fbc4faa9a1da0207cd29210d13c923874115..1dfbf9f47ecb51dd4ff87e282d2ca6786bfde63b 100644 --- a/.gitignore +++ b/.gitignore @@ -10,8 +10,10 @@ env/ *.pyc -# Do not track word lock files. +# Do not track auto-generated files. .~lock.* +*.aux +*.synctex.gz # Do not track local environment logs. diff --git a/documents/a1_report.pdf b/documents/a1_report.pdf new file mode 100644 index 0000000000000000000000000000000000000000..b9ced017ce9ccb6324987635bae5d39a0a4afca3 Binary files /dev/null and b/documents/a1_report.pdf differ diff --git a/documents/latex/a1_report.tex b/documents/latex/a1_report.tex new file mode 100644 index 0000000000000000000000000000000000000000..df3b24765a3925097ac339b07e0d450f66e38d25 --- /dev/null +++ b/documents/latex/a1_report.tex @@ -0,0 +1,118 @@ +\documentclass[a4paper,12pt]{article} + + +% For latex basics, see http://www.docs.is.ed.ac.uk/skills/documents/3722/3722-2014.pdf. +% For help on symbols, see https://oeis.org/wiki/List_of_LaTeX_mathematical_symbols. +% For info on state machines, look up youtube "Neso Academy" channel. + + +% Import Packages. +% Multi-column package. Allows formatting in columns. +\usepackage{multicol} + + +% Adjust page margins to not be so excessive. +\addtolength{\oddsidemargin}{-.2in} +\addtolength{\evensidemargin}{-.2in} +\addtolength{\textwidth}{.4in} +\addtolength{\topmargin}{-.8in} +\begin{document} + \title{CS6530 Assignment 1 Report} + \author{Brandon Rodriguez} + \date{\today} + \maketitle + + \vspace{-3ex}~ + All answers are acquired from associated Python program, which was written from scratch for this assignment. See readme.md at project root for documentation on running it. 
+ + \section* {Question 1} + + \subsection{Midterm Score Calculations} + \vspace{-2ex}~ + \textbf{\scriptsize Rounded to nearest 2 decimal places.}\\ + \\ + Max: 100 \\ + Min: 37 \\ + Q1: 77.0 \\ + Median: 77.0 \\ + Q3: 77.0 \\ + Mean: 76.72 \\ + Mode: 77 \\ + Variance: 173.11 \\ + + \subsection{Final Score Calculations} + \vspace{-2ex}~ + \textbf{\scriptsize Rounded to nearest 2 decimal places.}\\ + \\ + Max: 100 \\ + Min: 35 \\ + Q1: 89.0 \\ + Median: 89.0 \\ + Q3: 89.5 \\ + Mean: 87.08 \\ + Mode: 97 \\ + Variance: 119.11 \\ + + + \section* {Question 2} + + \subsection{Compare Variance before and after Normalization} + \vspace{-2ex}~ + \textbf{\scriptsize Rounded to nearest 4 decimal places.}\\ + \\ + Orig Midterm Score Variance: 173.1058 \\ + Z-Score Normalized Midterm Variance: 0.999$\bar{9}$ \\ + \\ + Orig Final Score Variance: 119.1129 \\ + Z-Score Normalized Final Score Variance: 1.0 + + \subsection{Normalized value of an original score of 90} + \vspace{-2ex}~ + \textbf{\scriptsize Rounded to nearest 4 decimal places.}\\ + \\ + Record 223 has both an original midterm score and an original final score of 90.\\ + \\ + Normalized, this comes to:\\ + Midterm: 1.0097 \\ + Final: 0.2672 \\ + + We have two different values because we're using z-score normalization, which normalizes each score around the mean and standard deviation of its own exam, and those differ between the midterm and the final. + + If we used a different normalization, such as ``Min-Max'' normalization, then we'd have much closer normalized values. Note that because the minimum scores of ``midterm'' and ``final'' are different, ``Min-Max'' won't give identical normalized values for 90 either. But the two values will be a lot closer than with z-score. 
+ + \subsection{Pearson's Correlation Coefficient} + Pearson's Correlation Coefficient: 0.544424742312412 + + \subsection{Covariance Value} + Covariance: 78.25419419419427 + + \pagebreak + \section* {Question 3} + + \subsection{Jaccard Coefficient} + Jaccard Coefficient: 0.32222222222222224 + + \subsection{Minkowski Distance} + h of 1: 6152.0\\ + h of 2: 715.3278968417211\\ + h of $\infty$: 170.0\\ + + \subsection{Cosine Similarity} + Cosine Similarity: 0.8414040256623078 + + \subsection{Kullback-Leibler Divergence} + Kullback-Leibler Divergence: 0.19420536448348794 + + \vspace{4ex} + \section* {Question 4} + Expected Table:\\ + \lbrack ~~ 8.94436519, ~ 181.05563481\rbrack\\ + \lbrack 156.05563481, 3158.94436519\rbrack\\ + \\ + Chi Stat: 2450.716326822006\\ + Degrees of Freedom: 1\\ + P-Value: 0.0\\ + \\ + With a chi-square statistic this large at 1 degree of freedom, the p-value is effectively 0, so we reject the hypothesis that the two attributes are independent. This indicates that they are strongly correlated. + +\end{document} \ No newline at end of file