Makefiles for projects done
This commit is contained in:
parent
490c6161f8
commit
4e5361f6d2
16
projects/Makefile
Normal file
16
projects/Makefile
Normal file
@ -0,0 +1,16 @@
|
||||
# all: run the `zip` target in every project_*/ subdirectory, then move the
# resulting archives into this directory.
# $(MAKE) -C is used instead of "cd $$d; $(MAKE) zip" so the loop's working
# directory never changes; with a plain cd the second and later iterations
# would try to enter project_*/ from inside the first project and fail.
all:
|
||||
for d in `ls -d project_*/`; do \
|
||||
echo "Processing $$d" ; \
|
||||
$(MAKE) -C $$d zip ; \
|
||||
done
|
||||
|
||||
mv project_*/*zip .
|
||||
|
||||
# clean: run the `clean` target in every project_*/ subdirectory, then remove
# the zip archives and the `auto` directory from this directory.
# $(MAKE) -C keeps the loop in the parent directory; "cd $$d; $(MAKE) clean"
# would stay inside the first project and break every later iteration.
clean:
|
||||
for d in `ls -d project_*/`; do \
|
||||
echo "Cleaning up $$d" ; \
|
||||
$(MAKE) -C $$d clean ; \
|
||||
done
|
||||
|
||||
rm -f *.zip
|
||||
rm -rf auto
|
15
projects/disclaimer.tex
Normal file
15
projects/disclaimer.tex
Normal file
@ -0,0 +1,15 @@
|
||||
\fbox{\parbox{0.985\linewidth}{ \small Please answer all questions
|
||||
in an electronic file (.txt, .doc are ok, but we prefer .pdf) and
|
||||
submit in ILIAS. If the assignments include programming
|
||||
exercises, hand in a pdf for the questions, the .py files for
|
||||
the programs, and the data in one zip file.
|
||||
|
||||
Use complete and correct sentences unless otherwise
|
||||
noted. Please be succinct. Use your own words. Write down a
|
||||
concise reasoning, not just the result. We expect you to do
|
||||
exercises on your own, but you are encouraged to discuss the
|
||||
exercises with your fellow students. If you blindly copy your
|
||||
results from others, you miss out on a chance to learn something
|
||||
new. Use all resources available to you, but always make sure
|
||||
that you truly understand why you give the answer you give.
|
||||
}}
|
10
projects/project_PCA_natural_images/Makefile
Normal file
10
projects/project_PCA_natural_images/Makefile
Normal file
@ -0,0 +1,10 @@
|
||||
# latex: run pdflatex twice over the .tex file(s) in this directory.
# NOTE(review): the second pass is presumably needed so that page/point totals
# written to the .aux file are picked up — confirm.
latex:
|
||||
pdflatex *.tex
|
||||
pdflatex *.tex
|
||||
|
||||
# clean: delete LaTeX by-products (*.log, *.aux, *.out), any *.zip archive,
# and the PDF named after the .tex file.
# NOTE(review): `basename *.tex .tex` assumes exactly one .tex file in this
# directory — confirm before adding a second one.
clean:
|
||||
rm -f *.log *.aux *.zip *.out
|
||||
rm -f `basename *.tex .tex`.pdf
|
||||
|
||||
# zip: after the `latex` prerequisite has run, pack all *.pdf, *.dat and *.mat
# files into an archive named after the .tex file (<basename>.zip).
# NOTE(review): assumes exactly one .tex file in this directory — confirm.
zip: latex
|
||||
zip `basename *.tex .tex`.zip *.pdf *.dat *.mat
|
217
projects/project_PCA_natural_images/pca_natural_images.tex
Executable file
217
projects/project_PCA_natural_images/pca_natural_images.tex
Executable file
@ -0,0 +1,217 @@
|
||||
\documentclass[addpoints,10pt]{exam}
|
||||
\usepackage{url}
|
||||
\usepackage{color}
|
||||
\usepackage{hyperref}
|
||||
|
||||
\pagestyle{headandfoot}
|
||||
\runningheadrule
|
||||
\firstpageheadrule
|
||||
|
||||
\firstpageheader{Essential Statistics}{Homework 01 due 10/29/2014 23:59}{23. October 2014}
|
||||
\runningheader{Homework 01}{Page \thepage\ of \numpages}{23. October 2014}
|
||||
\firstpagefooter{}{}{}
|
||||
\runningfooter{}{}{}
|
||||
\pointsinmargin
|
||||
\bracketedpoints
|
||||
|
||||
%\printanswers
|
||||
\shadedsolutions
|
||||
|
||||
|
||||
\begin{document}
|
||||
%%%%%%%%%%%%%%%%%%%%% Submission instructions %%%%%%%%%%%%%%%%%%%%%%%%%
|
||||
\sffamily
|
||||
\begin{flushright}
|
||||
\gradetable[h][questions]
|
||||
\end{flushright}
|
||||
|
||||
\begin{center}
|
||||
\fbox{\parbox{0.985\linewidth}{ \small Please answer all questions
|
||||
in an electronic file (.txt, .doc are ok, but we prefer .pdf) and
|
||||
submit in ILIAS.
|
||||
|
||||
Use complete and correct sentences unless otherwise
|
||||
noted. Please be succinct. Use your own words. Write down a
|
||||
concise reasoning, not just the result. We expect you to do
|
||||
exercises on your own, but you are encouraged to discuss the
|
||||
exercises with your fellow students. If you blindly copy your
|
||||
results from others, you miss out on a chance to learn something
|
||||
new. Use all resources available to you, but always make sure
|
||||
that you truly understand why you give the answer you give.
|
||||
}}
|
||||
\end{center}
|
||||
|
||||
%%%%%%%%%%%%%% Questions %%%%%%%%%%%%%%%%%%%%%%%%%
|
||||
|
||||
\begin{questions}
|
||||
\question {\bf Reading assignment: Do not submit answers to this
|
||||
question! }
|
||||
|
||||
Read chapter 1 up to and including 2.4 of Samuels/Wittmer/Schaffner.
|
||||
|
||||
Pay special attention to the following questions.
|
||||
\begin{enumerate}
|
||||
\item What types of scientific evidence do the authors list? How
|
||||
strong is each of these types of evidence?
|
||||
\item What are the different types of data encountered in
|
||||
statistical analysis?
|
||||
\item What is a population? What is a random sample? What are
|
||||
sampling errors? What are nonsampling errors?
|
||||
\item What is a descriptive statistic?
|
||||
\item What property do robust statistics have?
|
||||
\end{enumerate}
|
||||
|
||||
\question Install python and a suitable editor on your computer.
|
||||
\begin{parts}
|
||||
\part For installing python, I recommend the anaconda
|
||||
distribution: \url{http://continuum.io/downloads}. It does not
|
||||
matter whether you install python 2.7 or 3.4. I will use python
|
||||
3.4 syntax.
|
||||
|
||||
\part As editor I recommend either sublime text (for people new to
|
||||
programming) or pycharm (for people with programming
|
||||
experience). I do not recommend using a text editor that comes
|
||||
with your operating system (like word pad). Text processing
|
||||
programs like Microsoft Word or Libre-Office {\bf won't work at
|
||||
all}. Programming needs a little more than just typing text and
|
||||
you will make your life unnecessarily hard by using an editor not
|
||||
suited for it.
|
||||
\part Find out how to run a python program on your operating
|
||||
system and how to install new python packages. Install the
|
||||
packages {\tt pandas} and {\tt seaborn}.
|
||||
\end{parts}
|
||||
|
||||
\question To publish scientific results, you will usually need
|
||||
to use statistical methods. Some journals provide you with a brief
|
||||
description of how they expect you to apply statistical methods. One
|
||||
example can be found in the author guidelines of the journal
|
||||
Nature
|
||||
|
||||
\begin{center}
|
||||
\url{http://www.nature.com/neuro/pdf/sm_checklist.pdf}
|
||||
\end{center}
|
||||
|
||||
Please read the `checklist' and answer the following questions:
|
||||
|
||||
\begin{parts}
|
||||
\part[2] Why is it important that statistical methods are applied
|
||||
correctly?
|
||||
|
||||
\begin{solution}
|
||||
When not applied correctly, the results of statistical methods
|
||||
might not support your hypothesis and can lead to false
|
||||
conclusions.
|
||||
\end{solution}
|
||||
|
||||
\part[2] Name two common descriptive statistics and what you have
|
||||
to specify for them in Nature.
|
||||
|
||||
\begin{solution}
|
||||
\begin{itemize}
|
||||
\item A clearly defined number $n$ of data points should be
|
||||
specified. If the sample is small, plot points instead of
|
||||
using descriptive statistics. Errorbars should be clearly
|
||||
defined.
|
||||
\item measure of center: mean, median
|
||||
\item measure of variability: standard deviation, range
|
||||
\end{itemize}
|
||||
\end{solution}
|
||||
|
||||
\part[3] Name one statistical test that you have heard of or
|
||||
used. If you were to apply any of them, what would you have to
|
||||
specify to follow the Nature guidelines?
|
||||
|
||||
\begin{solution}
|
||||
{\bf Student's T-Test} for testing whether the mean of two
|
||||
populations is the same
|
||||
\begin{itemize}
|
||||
\item a clearly defined $n$ for the test
|
||||
\item a justification for the sample size used
|
||||
\item a clear description of the statistical method: since the
|
||||
t-test is very common, stating that a two independent sample
|
||||
t-test was used should be sufficient.
|
||||
\item Justify that the data meets the definition: the two
|
||||
populations should be normally distributed with the same
|
||||
variance; the data was sampled independently from the two
|
||||
populations being compared.
|
||||
\item Is the variance in the different groups different?
|
||||
\item was it one-sided or two-sided
|
||||
\end{itemize}
|
||||
\end{solution}
|
||||
|
||||
\part[3] Why are you asked to justify each incidence in which
|
||||
you exclude some of the data that you collected? What could be a
|
||||
valid reason to exclude a data point?
|
||||
|
||||
\begin{solution}
|
||||
Excluded data points might make a sample from a population not
|
||||
representative anymore, and can therefore alter the outcome and
|
||||
conclusions of a study. They might be excluded if there is a
|
||||
good reason to believe that they are not part of the population
|
||||
under investigation.
|
||||
\end{solution}
|
||||
|
||||
\end{parts}
|
||||
|
||||
\question {\bf Robust statistics} In 1888, P. Topinard published
|
||||
data on the brain weights of hundreds of French men and women. Here
|
||||
are ten brain weights (in grams) of female brains from the dataset
|
||||
\begin{center} [1125, 1027, 1112, 983, 1090, 1247, 1045, 983, 972, 1045]
|
||||
\end{center}
|
||||
|
||||
Open a new file ``brain\_weight.py'' with your text editor to write
|
||||
the following python program (please hand in the plots and the program).
|
||||
\begin{parts}
|
||||
\part[2] Create a list that contains the above brain weights.
|
||||
\part[2] Create a new list that contains the following ten means:
|
||||
Each mean is computed from the original list after removing one
|
||||
element (hint: use slicing and adding lists for that; we did this
|
||||
in the lecture already). {\bf Warning:} I {\em do not} expect you
|
||||
to use {\tt for}-loops. Only use them if you know them already. If
|
||||
you do use them, be prepared to explain your code to me to get
|
||||
credits for this task.
|
||||
\part[2] Create yet another list that does the same, only for the
|
||||
median.
|
||||
\part[2] Make a boxplot with the different means and medians (like
|
||||
in the lecture). To show the plot at the end of the program
|
||||
you need to put a {\tt plt.show()} at the end of the program. If
|
||||
you want to save the plot, put the command {\tt
|
||||
plt.gcf().savefig('YOUR\_NAME\_homework01.pdf')} before that. Label
|
||||
the y-axis by using the function {\tt plt.ylabel('FILL IN YOUR LABEL')}.
|
||||
\part[2] What can you observe and what does that tell you about
|
||||
the robustness of the statistic?
|
||||
\end{parts}
|
||||
\begin{solution}
|
||||
\begin{verbatim}
|
||||
import matplotlib.pyplot as plt
|
||||
import seaborn as sns
|
||||
import numpy as np
|
||||
|
||||
sns.set_context("paper", font_scale=1.5, rc={"lines.linewidth": 2.5})
|
||||
|
||||
w = [1125, 1027, 1112, 983, 1090, 1247, 1045, 983, 972, 1045]
|
||||
|
||||
brain_means = [ np.mean(w[1:]), np.mean(w[:1] + w[2:]), np.mean(w[:2] + w[3:]), \
|
||||
np.mean(w[:3] + w[4:]), np.mean(w[:4] + w[5:]), np.mean(w[:5] + w[6:]), \
|
||||
np.mean(w[:6] + w[7:]), np.mean(w[:7] + w[8:]), np.mean(w[:8] + w[9:]),\
|
||||
np.mean(w[:9]) ]
|
||||
brain_medians = [ np.median(w[1:]), np.median(w[:1] + w[2:]), np.median(w[:2] + w[3:]), \
|
||||
np.median(w[:3] + w[4:]), np.median(w[:4] + w[5:]), np.median(w[:5] + w[6:]), \
|
||||
np.median(w[:6] + w[7:]), np.median(w[:7] + w[8:]), np.median(w[:8] + w[9:]),\
|
||||
np.median(w[:9]) ]
|
||||
|
||||
sns.boxplot([brain_means, brain_medians], names=['means', 'medians'])
|
||||
plt.ylabel('brain weight [g]')
|
||||
plt.gcf().savefig('fabian_sinz_homework01.pdf')
|
||||
plt.show()
|
||||
\end{verbatim}
|
||||
\end{solution}
|
||||
|
||||
|
||||
\end{questions}
|
||||
|
||||
|
||||
|
||||
|
||||
|
||||
\end{document}
|
Reference in New Issue
Block a user