Jan Grewe 2021-01-25 13:29:10 +01:00
commit ee665dc163
271 changed files with 405641 additions and 6260 deletions

.gitignore vendored
View File

@ -26,4 +26,4 @@
*.vrb
__*
pointprocesses/lecture/pointprocessscetch*.tex
*.DS_Store

View File

@ -3,7 +3,7 @@ BASENAME=scientificcomputing-script
SUBDIRS=programming debugging plotting codestyle statistics bootstrap regression likelihood pointprocesses designpattern
SUBTEXS=$(foreach subd, $(SUBDIRS), $(subd)/lecture/$(subd).tex)
all : script chapters
all : plots chapters index script exercises
chapters :
for sd in $(SUBDIRS); do $(MAKE) -C $$sd/lecture chapter; done
@ -37,6 +37,11 @@ watchpdf :
watchscript :
while true; do ! make -s -q script && make script; sleep 0.5; done
exercises:
for sd in $(SUBDIRS); do if test -d $$sd/exercises; then $(MAKE) -C $$sd/exercises pdf; fi; done
cleanplots:
for sd in $(SUBDIRS); do $(MAKE) -C $$sd/lecture cleanplots; done
@ -46,6 +51,7 @@ cleantex:
clean : cleantex
for sd in $(SUBDIRS); do $(MAKE) -C $$sd/lecture clean; done
for sd in $(SUBDIRS); do if test -d $$sd/exercises; then $(MAKE) -C $$sd/exercises clean; fi; done
cleanall : clean
rm -f $(BASENAME).pdf

View File

@ -1,6 +1,20 @@
Fonts for matplotlib
--------------------
Install the Humor Sans font:
```
sudo apt install fonts-humor-sans
```
Clear matplotlib font cache:
```
cd ~/.cache/matplotlib/
rm -r *
```
Older problems
--------------
Make sure the right fonts are installed:
```
sudo apt-get install ttf-lyx2.0

View File

@ -1,24 +1,25 @@
nsamples = 100;
nresamples = 1000;
% draw a SRS (simple random sample, "Stichprobe") from the population:
x = randn( 1, nsamples );
fprintf('%-30s %-5s %-5s %-5s\n', '', 'mean', 'stdev', 'sem' )
fprintf('%30s %5.2f %5.2f %5.2f\n', 'single SRS', mean( x ), std( x ), std( x )/sqrt(nsamples) )
% draw a simple random sample ("Stichprobe") from the population:
x = randn(1, nsamples);
fprintf('%-30s %-5s %-5s %-5s\n', '', 'mean', 'stdev', 'sem')
fprintf('%30s %5.2f %5.2f %5.2f\n', 'single SRS', mean(x), std(x), std(x)/sqrt(nsamples))
% bootstrap the mean:
mus = zeros(nresamples,1); % vector for storing the means
for i = 1:nresamples % loop for generating the bootstraps
mus = zeros(nresamples,1); % vector for storing the means
for i = 1:nresamples % loop for generating the bootstraps
inx = randi(nsamples, 1, nsamples); % range, 1D-vector, number
xr = x(inx); % resample the original SRS
mus(i) = mean(xr); % compute statistic of the resampled SRS
xr = x(inx); % resample the original SRS
mus(i) = mean(xr); % compute statistic of the resampled SRS
end
fprintf('%30s %5.2f %5.2f -\n', 'bootstrapped distribution', mean( mus ), std( mus ) )
fprintf('%30s %5.2f %5.2f -\n', 'bootstrapped distribution', mean(mus), std(mus))
% many SRS (we can do that with the random number generator, but not in real life!):
musrs = zeros(nresamples,1); % vector for the means of each SRS
% many SRS (we can do that with the random number generator,
% but not in real life!):
musrs = zeros(nresamples,1); % vector for the means of each SRS
for i = 1:nresamples
x = randn( 1, nsamples ); % draw a new SRS
musrs(i) = mean( x ); % compute its mean
x = randn(1, nsamples); % draw a new SRS
musrs(i) = mean(x); % compute its mean
end
fprintf('%30s %5.2f %5.2f -\n', 'sampling distribution', mean( musrs ), std( musrs ) )
fprintf('%30s %5.2f %5.2f -\n', 'sampling distribution', mean(musrs), std(musrs))

View File

@ -1,27 +1,27 @@
% generate correlated data:
n=200;
a=0.2;
n = 200;
a = 0.2;
x = randn(n, 1);
y = randn(n, 1) + a*x;
% correlation coefficient:
rd = corr(x, y);
fprintf('correlation coefficient of data r = %.2f\n', rd );
fprintf('correlation coefficient of data r = %.2f\n', rd);
% distribution of null hypothesis by permutation:
nperm = 1000;
rs = zeros(nperm,1);
for i=1:nperm
xr=x(randperm(length(x))); % shuffle x
yr=y(randperm(length(y))); % shuffle y
for i = 1:nperm
xr = x(randperm(length(x))); % shuffle x
yr = y(randperm(length(y))); % shuffle y
rs(i) = corr(xr, yr);
end
[h,b] = hist(rs, 20 );
h = h/sum(h)/(b(2)-b(1)); % normalization
[h, b] = hist(rs, 20);
h = h/sum(h)/(b(2)-b(1)); % normalization
% significance:
rq = quantile(rs, 0.95);
fprintf('correlation coefficient of null hypothesis at 5%% significance = %.2f\n', rq );
fprintf('correlation coefficient of null hypothesis at 5%% significance = %.2f\n', rq);
if rd >= rq
fprintf('--> correlation r=%.2f is significant\n', rd);
else
@ -32,7 +32,7 @@ end
bar(b, h, 'facecolor', 'b');
hold on;
bar(b(b>=rq), h(b>=rq), 'facecolor', 'r');
plot( [rd rd], [0 4], 'r', 'linewidth', 2 );
plot([rd rd], [0 4], 'r', 'linewidth', 2);
xlabel('Correlation coefficient');
ylabel('Probability density of H0');
hold off;

View File

@ -0,0 +1,40 @@
% generate two data sets:
n = 200;
d = 0.2;
x = randn(n, 1);
y = randn(n, 1) + d;
% difference of sample means:
md = mean(y) - mean(x);
fprintf('difference of means of data d = %.2f\n', md);
% distribution of null hypothesis by permutation:
nperm = 1000;
xy = [x; y]; % x and y data in one column vector
ds = zeros(nperm,1);
for i = 1:nperm
xyr = xy(randperm(length(xy))); % shuffle data
xr = xyr(1:length(x)); % random x-data
yr = xyr(length(x)+1:end); % random y-data
ds(i) = mean(yr) - mean(xr); % difference of means
end
[h, b] = hist(ds, 20);
h = h/sum(h)/(b(2)-b(1)); % normalization
% significance:
dq = quantile(ds, 0.95);
fprintf('difference of means of null hypothesis at 5%% significance = %.2f\n', dq);
if md >= dq
fprintf('--> difference of means d=%.2f is significant\n', md);
else
fprintf('--> d=%.2f is not a significant difference of means\n', md);
end
% plot:
bar(b, h, 'facecolor', 'b');
hold on;
bar(b(b>=dq), h(b>=dq), 'facecolor', 'r');
plot([md md], [0 4], 'r', 'linewidth', 2);
xlabel('Difference of means');
ylabel('Probability density of H0');
hold off;

View File

@ -0,0 +1,4 @@
>> meandiffsignificance
difference of means of data d = 0.18
difference of means of null hypothesis at 5% significance = 0.17
--> difference of means d=0.18 is significant

View File

@ -1,34 +1,3 @@
TEXFILES=$(wildcard exercises??.tex)
EXERCISES=$(TEXFILES:.tex=.pdf)
SOLUTIONS=$(EXERCISES:exercises%=solutions%)
TEXFILES=$(wildcard resampling-?.tex)
.PHONY: pdf exercises solutions watch watchexercises watchsolutions clean
pdf : $(SOLUTIONS) $(EXERCISES)
exercises : $(EXERCISES)
solutions : $(SOLUTIONS)
$(SOLUTIONS) : solutions%.pdf : exercises%.tex instructions.tex
{ echo "\\documentclass[answers,12pt,a4paper,pdftex]{exam}"; sed -e '1d' $<; } > $(patsubst %.pdf,%.tex,$@)
pdflatex -interaction=scrollmode $(patsubst %.pdf,%.tex,$@) | tee /dev/stderr | fgrep -q "Rerun to get cross-references right" && pdflatex -interaction=scrollmode $(patsubst %.pdf,%.tex,$@) || true
rm $(patsubst %.pdf,%,$@).[!p]*
$(EXERCISES) : %.pdf : %.tex instructions.tex
pdflatex -interaction=scrollmode $< | tee /dev/stderr | fgrep -q "Rerun to get cross-references right" && pdflatex -interaction=scrollmode $< || true
watch :
while true; do ! make -q pdf && make pdf; sleep 0.5; done
watchexercises :
while true; do ! make -q exercises && make exercises; sleep 0.5; done
watchsolutions :
while true; do ! make -q solutions && make solutions; sleep 0.5; done
clean :
rm -f *~ *.aux *.log *.out
cleanup : clean
rm -f $(SOLUTIONS) $(EXERCISES)
include ../../exercises.mk

View File

@ -10,7 +10,7 @@ function [bootsem, mu] = bootstrapmean(x, resample)
for i = 1:resample
% resample:
xr = x(randi(nsamples, nsamples, 1));
% compute statistics on sample:
% compute statistics of resampled sample:
mu(i) = mean(xr);
end
bootsem = std(mu);

View File

@ -1,18 +1,18 @@
%% (a) bootstrap:
nperm = 1000;
rb = zeros(nperm,1);
rb = zeros(nperm, 1);
for i=1:nperm
% indices for resampling the data:
inx = randi(length(x), length(x), 1);
% resampled data pairs:
xb=x(inx);
yb=y(inx);
xb = x(inx);
yb = y(inx);
rb(i) = corr(xb, yb);
end
%% (b) pdf of the correlation coefficients:
[hb,bb] = hist(rb, 20);
hb = hb/sum(hb)/(bb(2)-bb(1)); % normalization
[hb, bb] = hist(rb, 20);
hb = hb/sum(hb)/(bb(2)-bb(1)); % normalization
%% (c) significance:
rbq = quantile(rb, 0.05);
@ -25,8 +25,8 @@ end
%% plot:
hold on;
bar(b, h, 'facecolor', [0.5 0.5 0.5]);
bar(bb, hb, 'facecolor', 'b');
bar(b, h, 'facecolor', [0.5 0.5 0.5]); % permutation test
bar(bb, hb, 'facecolor', 'b'); % bootstrap
bar(bb(bb<=rbq), hb(bb<=rbq), 'facecolor', 'r');
plot([rd rd], [0 4], 'r', 'linewidth', 2);
xlim([-0.25 0.75])

View File

@ -1,4 +1,4 @@
%% (a) generate correlated data
%% (a) generate correlated data:
n = 1000;
a = 0.2;
x = randn(n, 1);
@ -8,7 +8,7 @@ y = randn(n, 1) + a*x;
subplot(1, 2, 1);
plot(x, a*x, 'r', 'linewidth', 3);
hold on
%scatter(x, y ); % either scatter ...
%scatter(x, y ); % either scatter ...
plot(x, y, 'o', 'markersize', 2 ); % ... or plot - same plot.
xlim([-4 4])
ylim([-4 4])
@ -20,20 +20,20 @@ hold off
%c = corrcoef(x, y); % returns correlation matrix
%rd = c(1, 2);
rd = corr(x, y);
fprintf('correlation coefficient = %.2f\n', rd );
fprintf('correlation coefficient = %.2f\n', rd);
%% (e) permutation:
nperm = 1000;
rs = zeros(nperm,1);
for i=1:nperm
xr=x(randperm(length(x))); % shuffle x
yr=y(randperm(length(y))); % shuffle y
rs = zeros(nperm, 1);
for i = 1:nperm
xr = x(randperm(length(x))); % shuffle x
yr = y(randperm(length(y))); % shuffle y
rs(i) = corr(xr, yr);
end
%% (g) pdf of the correlation coefficients:
[h,b] = hist(rs, 20);
h = h/sum(h)/(b(2)-b(1)); % normalization
[h, b] = hist(rs, 20);
h = h/sum(h)/(b(2)-b(1)); % normalization
%% (h) significance:
rq = quantile(rs, 0.95);
@ -49,7 +49,7 @@ subplot(1, 2, 2)
hold on;
bar(b, h, 'facecolor', 'b');
bar(b(b>=rq), h(b>=rq), 'facecolor', 'r');
plot( [rd rd], [0 4], 'r', 'linewidth', 2);
plot([rd rd], [0 4], 'r', 'linewidth', 2);
xlim([-0.25 0.25])
xlabel('Correlation coefficient');
ylabel('Probability density of H0');

View File

@ -1,205 +0,0 @@
\documentclass[12pt,a4paper,pdftex]{exam}
\usepackage[english]{babel}
\usepackage{pslatex}
\usepackage[mediumspace,mediumqspace,Gray]{SIunits} % \ohm, \micro
\usepackage{xcolor}
\usepackage{graphicx}
\usepackage[breaklinks=true,bookmarks=true,bookmarksopen=true,pdfpagemode=UseNone,pdfstartview=FitH,colorlinks=true,citecolor=blue]{hyperref}
%%%%% layout %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage[left=20mm,right=20mm,top=25mm,bottom=25mm]{geometry}
\pagestyle{headandfoot}
\ifprintanswers
\newcommand{\stitle}{: Solutions}
\else
\newcommand{\stitle}{}
\fi
\header{{\bfseries\large Exercise 9\stitle}}{{\bfseries\large Bootstrap}}{{\bfseries\large December 9th, 2019}}
\firstpagefooter{Prof. Dr. Jan Benda}{Phone: 29 74573}{Email:
jan.benda@uni-tuebingen.de}
\runningfooter{}{\thepage}{}
\setlength{\baselineskip}{15pt}
\setlength{\parindent}{0.0cm}
\setlength{\parskip}{0.3cm}
\renewcommand{\baselinestretch}{1.15}
%%%%% listings %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{listings}
\lstset{
language=Matlab,
basicstyle=\ttfamily\footnotesize,
numbers=left,
numberstyle=\tiny,
title=\lstname,
showstringspaces=false,
commentstyle=\itshape\color{darkgray},
breaklines=true,
breakautoindent=true,
columns=flexible,
frame=single,
xleftmargin=1em,
xrightmargin=1em,
aboveskip=10pt
}
%%%%% math stuff: %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{amsmath}
\usepackage{amssymb}
\usepackage{bm}
\usepackage{dsfont}
\newcommand{\naZ}{\mathds{N}}
\newcommand{\gaZ}{\mathds{Z}}
\newcommand{\raZ}{\mathds{Q}}
\newcommand{\reZ}{\mathds{R}}
\newcommand{\reZp}{\mathds{R^+}}
\newcommand{\reZpN}{\mathds{R^+_0}}
\newcommand{\koZ}{\mathds{C}}
%%%%% page breaks %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\newcommand{\continue}{\ifprintanswers%
\else
\vfill\hspace*{\fill}$\rightarrow$\newpage%
\fi}
\newcommand{\continuepage}{\ifprintanswers%
\newpage
\else
\vfill\hspace*{\fill}$\rightarrow$\newpage%
\fi}
\newcommand{\newsolutionpage}{\ifprintanswers%
\newpage%
\else
\fi}
%%%%% new commands %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\newcommand{\qt}[1]{\textbf{#1}\\}
\newcommand{\pref}[1]{(\ref{#1})}
\newcommand{\extra}{--- Zusatzaufgabe ---\ \mbox{}}
\newcommand{\code}[1]{\texttt{#1}}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{document}
\input{instructions}
\begin{questions}
\question \qt{Bootstrap the standard error of the mean}
We want to compute the standard error of the mean of a data set by
means of the bootstrap method and compare the result with the formula
``standard deviation divided by the square-root of $n$''.
\begin{parts}
\part Download the file \code{thymusglandweights.dat} from Ilias.
This is a data set of the weights of the thymus glands of 14-day old chicken embryos
measured in milligram.
\part Load the data into Matlab (\code{load} function).
\part Compute histogram, mean, and standard error of the mean of the first 80 data points.
\part Compute the standard error of the mean of the first 80 data
points by bootstrapping the data 500 times. Write a function that
bootstraps the standard error of the mean of a given data set. The
function should also return a vector with the bootstrapped means.
\part Compute the 95\,\% confidence interval for the mean from the
bootstrap distribution (\code{quantile()} function) --- the
interval that contains the true mean with 95\,\% probability.
\part Use the whole data set and the bootstrap method for computing
the dependence of the standard error of the mean from the sample
size $n$.
\part Compare your result with the formula for the standard error
$\sigma/\sqrt{n}$.
\end{parts}
\begin{solution}
\lstinputlisting{bootstrapmean.m}
\lstinputlisting{bootstraptymus.m}
\includegraphics[width=0.5\textwidth]{bootstraptymus-datahist}
\includegraphics[width=0.5\textwidth]{bootstraptymus-meanhist}
\includegraphics[width=0.5\textwidth]{bootstraptymus-samples}
\end{solution}
\question \qt{Student t-distribution}
The distribution of Student's t, $t=\bar x/(\sigma_x/\sqrt{n})$, the
estimated mean $\bar x$ of a data set of size $n$ divided by the
estimated standard error of the mean $\sigma_x/\sqrt{n}$, where
$\sigma_x$ is the estimated standard deviation, is not a normal
distribution but a Student-t distribution. We want to compute the
Student-t distribution and compare it with the normal distribution.
\begin{parts}
\part Generate 100000 normally distributed random numbers.
\part Draw from these data 1000 samples of size $n=3$, 5, 10, and
50. For each sample size $n$ ...
\part ... compute the mean $\bar x$ of the samples and plot the
probability density of these means.
\part ... compare the resulting probability densities with corresponding
normal distributions.
\part ... compute Student's $t=\bar x/(\sigma_x/\sqrt{n})$ and compare its
distribution with the normal distribution with standard deviation of
one. Is $t$ normally distributed? Under which conditions is $t$
normally distributed?
\end{parts}
\newsolutionpage
\begin{solution}
\lstinputlisting{tdistribution.m}
\includegraphics[width=1\textwidth]{tdistribution-n03}\\
\includegraphics[width=1\textwidth]{tdistribution-n05}\\
\includegraphics[width=1\textwidth]{tdistribution-n10}\\
\includegraphics[width=1\textwidth]{tdistribution-n50}
\end{solution}
\continue
\question \qt{Permutation test} \label{permutationtest}
We want to compute the significance of a correlation by means of a permutation test.
\begin{parts}
\part \label{permutationtestdata} Generate 1000 correlated pairs
$x$, $y$ of random numbers according to:
\begin{verbatim}
n = 1000
a = 0.2;
x = randn(n, 1);
y = randn(n, 1) + a*x;
\end{verbatim}
\part Generate a scatter plot of the two variables.
\part Why is $y$ correlated with $x$?
\part Compute the correlation coefficient between $x$ and $y$.
\part What do you need to do in order to destroy the correlations between the $x$-$y$ pairs?
\part Do exactly this 1000 times and compute each time the correlation coefficient.
\part Compute and plot the probability density of these correlation
coefficients.
\part Is the correlation of the original data set significant?
\part What does ``significance of the correlation'' mean?
% \part Vary the sample size \code{n} and compute in the same way the
% significance of the correlation.
\end{parts}
\begin{solution}
\lstinputlisting{correlationsignificance.m}
\includegraphics[width=1\textwidth]{correlationsignificance}
\end{solution}
\question \qt{Bootstrap the correlation coefficient}
The permutation test generates the distribution of the null hypothesis
of uncorrelated data and we check whether the correlation coefficient
of the data differs significantly from this
distribution. Alternatively we can bootstrap the data while keeping
the pairs and determine the confidence interval of the correlation
coefficient of the data. If this differs significantly from a
correlation coefficient of zero we can conclude that the correlation
coefficient of the data indeed quantifies correlated data.
We take the same data set that we have generated in exercise
\ref{permutationtest} (\ref{permutationtestdata}).
\begin{parts}
\part Bootstrap 1000 times the correlation coefficient from the data.
\part Compute and plot the probability density of these correlation
coefficients.
\part Is the correlation of the original data set significant?
\end{parts}
\begin{solution}
\lstinputlisting{correlationbootstrap.m}
\includegraphics[width=1\textwidth]{correlationbootstrap}
\end{solution}
\end{questions}
\end{document}

View File

@ -1,6 +0,0 @@
\vspace*{-7.8ex}
\begin{center}
\textbf{\Large Introduction to Scientific Computing}\\[2.3ex]
{\large Jan Grewe, Jan Benda}\\[-3ex]
Neuroethology Lab \hfill --- \hfill Institute for Neurobiology \hfill --- \hfill \includegraphics[width=0.28\textwidth]{UT_WBMW_Black_RGB} \\
\end{center}

View File

@ -0,0 +1,29 @@
function [md, ds, dq] = meandiffpermutation(x, y, nperm, alpha)
% Permutation test for difference of means of two independent samples.
%
% [md, ds, dq] = meandiffpermutation(x, y, nperm, alpha);
%
% Arguments:
% x: vector with the samples of the x data set.
% y: vector with the samples of the y data set.
% nperm: number of permutations run.
% alpha: significance level.
%
% Returns:
% md: difference of the means
% ds: vector containing the differences of the means of the resampled data sets
% dq: difference of the means at a significance of alpha.
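%
% Example (illustrative sketch only; the numbers are made up):
%   x = randn(200, 1) - 40.0;
%   y = randn(200, 1) - 40.5;
%   [md, ds, dq] = meandiffpermutation(x, y, 1000, 0.05);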
md = mean(x) - mean(y); % measured difference
xy = [x; y]; % merge data sets
% permutations:
ds = zeros(nperm, 1);
for i = 1:nperm
xyr = xy(randperm(length(xy))); % shuffle xy
xr = xyr(1:length(x)); % random x sample
yr = xyr(length(x)+1:end); % random y sample
ds(i) = mean(xr) - mean(yr);
end
% significance:
dq = quantile(ds, 1.0 - alpha);
end

View File

@ -0,0 +1,42 @@
function meandiffplot(x, y, md, ds, dq, k, nrows)
% Plot histogram of data sets and of null hypothesis for differences in mean.
%
% meandiffplot(x, y, md, ds, dq, k, rows);
%
% Arguments:
% x: vector with the samples of the x data set.
% y: vector with the samples of the y data set.
% md: difference of means of the two data sets.
% ds: vector containing the differences of the means of the resampled data sets
% dq: minimum difference of the means considered significant.
% k: current row for the plot panels.
% nrows: number of rows of panels in the figure.
%% (b) plot histograms:
subplot(nrows, 2, k*2-1);
bmin = min([x; y]);
bmax = max([x; y]);
bins = bmin:(bmax-bmin)/20.0:bmax;
[xh, b] = hist(x, bins);
[yh, b] = hist(y, bins);
bar(bins, xh, 'facecolor', 'b')
hold on
bar(bins, yh, 'facecolor', 'r');
xlabel('x and y [mV]')
ylabel('counts')
hold off
%% (f) pdf of the differences:
[h, b] = hist(ds, 20);
h = h/sum(h)/(b(2)-b(1)); % normalization
%% plot:
subplot(nrows, 2, k*2)
bar(b, h, 'facecolor', 'b');
hold on;
bar(b(b>=dq), h(b>=dq), 'facecolor', 'r');
plot([md md], [0 4], 'r', 'linewidth', 2);
xlabel('Difference of means [mV]');
ylabel('pdf of H0');
hold off;
end

View File

@ -0,0 +1,37 @@
n = 200;
mx = -40.0;
nperm = 1000;
alpha = 0.05;
%% (h) repeat for various means of the y-data set:
mys = [-40.1, -40.2, -40.5];
for k=1:length(mys)
%% (a) generate data:
my = mys(k);
x = randn(n, 1) + mx;
y = randn(n, 1) + my;
%% (d), (e) permutation test:
[md, ds, dq] = meandiffpermutation(x, y, nperm, alpha);
%% (c) difference of means:
fprintf('\nmean x = %.1fmV, mean y = %.1fmV\n', mx, my);
fprintf(' difference of means = %.2fmV\n', md);
%% (g) significance:
fprintf(' difference of means at 5%% significance = %.2fmV\n', dq);
if md >= dq
fprintf(' --> measured difference of means is significant\n');
else
fprintf(' --> measured difference of means is not significant\n');
end
%% (b), (f) plot histograms of data and pdf of differences:
meandiffplot(x, y, md, ds, dq, k, length(mys));
subplot(length(mys), 2, k*2-1);
title(sprintf('mx=%.1fmV, my=%.1fmV', mx, my))
end
savefigpdf(gcf, 'meandiffsignificance.pdf', 12, 10);

Binary file not shown.

View File

@ -0,0 +1,116 @@
\documentclass[12pt,a4paper,pdftex]{exam}
\newcommand{\exercisetopic}{Resampling}
\newcommand{\exercisenum}{8}
\newcommand{\exercisedate}{December 14th, 2020}
\input{../../exercisesheader}
\firstpagefooter{Prof. Dr. Jan Benda}{}{jan.benda@uni-tuebingen.de}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{document}
\input{../../exercisestitle}
\begin{questions}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\question \qt{Read chapter 7 of the script on ``resampling methods''!}\vspace{-3ex}
\question \qt{Permutation test of correlations} \label{correlationtest}
We want to compute the significance of a correlation by means of a permutation test.
\begin{parts}
\part \label{correlationtestdata} Generate 1000 correlated pairs
$x$, $y$ of random numbers according to:
\begin{verbatim}
n = 1000;
a = 0.2;
x = randn(n, 1);
y = randn(n, 1) + a*x;
\end{verbatim}
\part Generate a scatter plot of the two variables.
\part Why is $y$ correlated with $x$?
\part Compute the correlation coefficient between $x$ and $y$.
\part What do you need to do in order to destroy the correlations between the $x$-$y$ pairs?
\part Do exactly this 1000 times and compute each time the correlation coefficient.
\part Compute and plot the probability density of these correlation
coefficients.
\part Is the correlation of the original data set significant?
\part What does ``significance of the correlation'' mean?
% \part Vary the sample size \code{n} and compute in the same way the
% significance of the correlation.
\end{parts}
\begin{solution}
\lstinputlisting{correlationsignificance.m}
\includegraphics[width=1\textwidth]{correlationsignificance}
\end{solution}
\newsolutionpage
\question \qt{Bootstrap the correlation coefficient}
The permutation test generates the distribution of the null hypothesis
of uncorrelated data and we check whether the correlation coefficient
of the data differs significantly from this
distribution. Alternatively we can bootstrap the data while keeping
the pairs and determine the confidence interval of the correlation
coefficient of the data. If this differs significantly from a
correlation coefficient of zero we can conclude that the correlation
coefficient of the data indeed quantifies correlated data.
We take the same data set that we have generated in exercise
\ref{correlationtest} (\ref{correlationtestdata}).
\begin{parts}
\part Bootstrap 1000 times the correlation coefficient from the
data, i.e. generate bootstrap data by randomly resampling the
original data pairs with replacement. Use the \code{randi()}
function for generating random indices that you can use to select a
random sample from the original data.
\part Compute and plot the probability density of these correlation
coefficients.
\part Is the correlation of the original data set significant?
\end{parts}
\begin{solution}
\lstinputlisting{correlationbootstrap.m}
\includegraphics[width=1\textwidth]{correlationbootstrap}
\end{solution}
\continue
\question \qt{Permutation test of difference of means}
We want to test whether two data sets come from distributions that
differ in their mean by means of a permutation test.
\begin{parts}
\part Generate two normally distributed data sets $x$ and $y$
containing each $n=200$ samples. Let's assume the $x$ samples are
measurements of the membrane potential of a mammalian photoreceptor
in darkness with a mean of $-40$\,mV and a standard deviation of
1\,mV. The $y$ values are the membrane potentials measured under dim
illumination and come from a distribution with the same standard
deviation and a mean of $-40.5$\,mV. See section 5.2 ``Scaling and
shifting random numbers'' in the script.
\part Plot histograms of the $x$ and $y$ data in a single
plot. Choose appropriate bins.
\part Compute the means of $x$ and $y$ and their difference.
\part The null hypothesis is that the $x$ and $y$ data come from the
same distribution. How can you generate new samples $x_r$ and $y_r$
from the original data that come from the same distribution?
\part Do exactly this 1000 times and compute each time the
difference of the means of the two resampled samples.
\part Compute and plot the probability density of the resulting
distribution of the null hypothesis.
\part Is the difference of the means of the original data sets significant?
\part Repeat this procedure for $y$ samples that are closer to or
further away from the mean of the $x$ data set. For this put the
computations of the permutation test in a function and all the plotting
in another function.
\end{parts}
\begin{solution}
\lstinputlisting{meandiffpermutation.m}
\lstinputlisting{meandiffplot.m}
\lstinputlisting{meandiffsignificance.m}
\includegraphics[width=1\textwidth]{meandiffsignificance}
\end{solution}
\end{questions}
\end{document}

View File

@ -0,0 +1,84 @@
\documentclass[12pt,a4paper,pdftex]{exam}
\newcommand{\exercisetopic}{Resampling}
\newcommand{\exercisenum}{X2}
\newcommand{\exercisedate}{December 14th, 2020}
\input{../../exercisesheader}
\firstpagefooter{Prof. Dr. Jan Benda}{}{jan.benda@uni-tuebingen.de}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{document}
\input{../../exercisestitle}
\begin{questions}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\question \qt{Read chapter 7 of the script on ``resampling methods''!}\vspace{-3ex}
\question \qt{Bootstrap the standard error of the mean}
We want to compute the standard error of the mean of a data set by
means of the bootstrap method and compare the result with the formula
``standard deviation divided by the square-root of $n$''.
\begin{parts}
\part Download the file \code{thymusglandweights.dat} from Ilias.
This is a data set of the weights of the thymus glands of 14-day-old chicken embryos
measured in milligrams.
\part Load the data into Matlab (\code{load} function).
\part Compute histogram, mean, and standard error of the mean of the first 80 data points.
\part Compute the standard error of the mean of the first 80 data
points by bootstrapping the data 500 times. Write a function that
bootstraps the standard error of the mean of a given data set. The
function should also return a vector with the bootstrapped means.
\part Compute the 95\,\% confidence interval for the mean from the
bootstrap distribution (\code{quantile()} function) --- the
interval that contains the true mean with 95\,\% probability.
\part Use the whole data set and the bootstrap method for computing
the dependence of the standard error of the mean on the sample
size $n$.
\part Compare your result with the formula for the standard error
$\sigma/\sqrt{n}$.
\end{parts}
\begin{solution}
\lstinputlisting{bootstrapmean.m}
\lstinputlisting{bootstraptymus.m}
\includegraphics[width=0.5\textwidth]{bootstraptymus-datahist}
\includegraphics[width=0.5\textwidth]{bootstraptymus-meanhist}
\includegraphics[width=0.5\textwidth]{bootstraptymus-samples}
\end{solution}
\question \qt{Student t-distribution}
The distribution of Student's t, $t=\bar x/(\sigma_x/\sqrt{n})$, the
estimated mean $\bar x$ of a data set of size $n$ divided by the
estimated standard error of the mean $\sigma_x/\sqrt{n}$, where
$\sigma_x$ is the estimated standard deviation, is not a normal
distribution but a Student-t distribution. We want to compute the
Student-t distribution and compare it with the normal distribution.
\begin{parts}
\part Generate 100000 normally distributed random numbers.
\part Draw from these data 1000 samples of size $n=3$, 5, 10, and
50. For each sample size $n$ ...
\part ... compute the mean $\bar x$ of the samples and plot the
probability density of these means.
\part ... compare the resulting probability densities with corresponding
normal distributions.
\part ... compute Student's $t=\bar x/(\sigma_x/\sqrt{n})$ and compare its
distribution with the normal distribution with standard deviation of
one. Is $t$ normally distributed? Under which conditions is $t$
normally distributed?
\end{parts}
\newsolutionpage
\begin{solution}
\lstinputlisting{tdistribution.m}
\includegraphics[width=1\textwidth]{tdistribution-n03}\\
\includegraphics[width=1\textwidth]{tdistribution-n05}\\
\includegraphics[width=1\textwidth]{tdistribution-n10}\\
\includegraphics[width=1\textwidth]{tdistribution-n50}
\end{solution}
\end{questions}
\end{document}

View File

@ -1,28 +1,28 @@
function savefigpdf( fig, name, width, height )
function savefigpdf(fig, name, width, height)
% Saves figure fig in pdf file name.pdf with appropriately set page size
% and fonts
% default width:
if nargin < 3
width = 11.7;
end
% default height:
if nargin < 4
height = 9.0;
end
% default width:
if nargin < 3
width = 11.7;
end
% default height:
if nargin < 4
height = 9.0;
end
% paper:
set( fig, 'PaperUnits', 'centimeters' );
set( fig, 'PaperSize', [width height] );
set( fig, 'PaperPosition', [0.0 0.0 width height] );
set( fig, 'Color', 'white')
% paper:
set(fig, 'PaperUnits', 'centimeters');
set(fig, 'PaperSize', [width height]);
set(fig, 'PaperPosition', [0.0 0.0 width height]);
set(fig, 'Color', 'white')
% font:
set( findall( fig, 'type', 'axes' ), 'FontSize', 12 )
set( findall( fig, 'type', 'text' ), 'FontSize', 12 )
% font:
set(findall(fig, 'type', 'axes'), 'FontSize', 12)
set(findall(fig, 'type', 'text'), 'FontSize', 12)
% save:
saveas( fig, name, 'pdf' )
% save:
saveas(fig, name, 'pdf')
end

View File

@ -1,10 +1,10 @@
%% (a) generate random numbers:
n = 100000;
x=randn(n, 1);
x = randn(n, 1);
for nsamples=[3 5 10 50]
for nsamples = [3 5 10 50]
nsamples
%% compute mean, standard deviation and t:
% compute mean, standard deviation and t:
nmeans = 10000;
means = zeros(nmeans, 1);
sdevs = zeros(nmeans, 1);
@ -19,14 +19,14 @@ for nsamples=[3 5 10 50]
% Gaussian pdfs:
msdev = std(means);
tsdev = 1.0;
dxg=0.01;
dxg = 0.01;
xmax = 10.0;
xmin = -xmax;
xg = [xmin:dxg:xmax];
pm = exp(-0.5*(xg/msdev).^2)/sqrt(2.0*pi)/msdev;
pt = exp(-0.5*(xg/tsdev).^2)/sqrt(2.0*pi)/tsdev;
%% plots
% plots:
subplot(1, 2, 1)
bins = xmin:0.2:xmax;
[h,b] = hist(means, bins);
@ -35,7 +35,7 @@ for nsamples=[3 5 10 50]
hold on
plot(xg, pm, 'r', 'linewidth', 2)
title(sprintf('sample size = %d', nsamples));
xlim( [-3, 3] );
xlim([-3, 3]);
xlabel('Mean');
ylabel('pdf');
hold off;
@ -48,11 +48,11 @@ for nsamples=[3 5 10 50]
hold on
plot(xg, pt, 'r', 'linewidth', 2)
title(sprintf('sample size = %d', nsamples));
xlim( [-8, 8] );
xlim([-8, 8]);
xlabel('Student-t');
ylabel('pdf');
hold off;
savefigpdf(gcf, sprintf('tdistribution-n%02d.pdf', nsamples), 14, 5);
pause( 3.0 )
pause(3.0)
end

View File

@ -10,6 +10,8 @@
\setcounter{page}{\pagenumber}
\setcounter{chapter}{\chapternumber}
\renewcommand{\exercisesolutions}{here} % 0: here, 1: chapter, 2: end
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{document}
@ -17,10 +19,20 @@
\include{bootstrap}
\section{TODO}
This chapter easily covers two lectures:
\begin{itemize}
\item 1. Bootstrapping with a proper introduction of confidence intervals
\item 2. Permutation test with a proper introduction of statistical tests (dsitribution of nullhypothesis, significance, power, etc.)
\item 2. Permutation test with a proper introduction of statistical tests (distribution of the null hypothesis, significance, power, etc.)
\end{itemize}
ToDo:
\begin{itemize}
\item Add jackknife methods to bootstrapping
\item Add discussion of confidence intervals to descriptive statistics chapter
\item Have a separate chapter on statistical tests before this one: the
essence of a statistical test (null hypothesis distribution), power
analysis, and a few examples of existing functions for statistical
tests.
\end{itemize}
\end{document}

View File

@ -49,7 +49,6 @@
%%%% graphics %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{graphicx}
\newcommand{\texpicture}[1]{{\sffamily\small\input{#1.tex}}}
%%%%% listings %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{listings}

View File

@ -1,20 +1,28 @@
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\chapter{Bootstrap methods}
\chapter{Resampling methods}
\label{bootstrapchapter}
\exercisechapter{Bootstrap methods}
\exercisechapter{Resampling methods}
Bootstrapping methods are applied to create distributions of
statistical measures via resampling of a sample. Bootstrapping offers several
advantages:
\entermde{Resampling-Methoden}{Resampling methods} are applied to
generate distributions of statistical measures via resampling of
existing samples. Resampling offers several advantages:
\begin{itemize}
\item Fewer assumptions (e.g. a measured sample does not need to be
normally distributed).
\item Increased precision as compared to classical methods. %such as?
\item General applicability: the bootstrapping methods are very
\item General applicability: the resampling methods are very
similar for different statistics and there is no need to specialize
the method to specific statistical measures.
\end{itemize}
Resampling methods can be used for both estimating the precision of
estimated statistics (e.g. standard error of the mean, confidence
intervals) and testing for significance.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\section{Bootstrapping}
\begin{figure}[tp]
\includegraphics[width=0.8\textwidth]{2012-10-29_16-26-05_771}\\[2ex]
@ -72,10 +80,10 @@ distribution of average values around the true mean of the population
Alternatively, we can use \enterm{bootstrapping}
(\determ[Bootstrap!Verfahren]{Bootstrapverfahren}) to generate new
samples from one set of measurements
(\entermde{Resampling}{resampling}). From these bootstrapped samples
we compute the desired statistical measure and estimate their
distribution (\entermde{Bootstrap!Verteilung}{bootstrap distribution},
samples from one set of measurements by means of resampling. From
these bootstrapped samples we compute the desired statistical measure
and estimate its distribution
(\entermde{Bootstrap!Verteilung}{bootstrap distribution},
\subfigref{bootstrapsamplingdistributionfig}{c}). Interestingly, this
distribution is very similar to the sampling distribution regarding
its width. The only difference is that the bootstrapped values are
@ -84,19 +92,20 @@ of the statistical population. We can use the bootstrap distribution
to draw conclusions regarding the precision of our estimation (e.g.
standard errors and confidence intervals).
Bootstrapping methods create bootstrapped samples from a SRS by
Bootstrapping methods generate bootstrapped samples from an SRS by
resampling. The bootstrapped samples are used to estimate the sampling
distribution of a statistical measure. The bootstrapped samples have
the same size as the original sample and are created by randomly
the same size as the original sample and are generated by randomly
drawing with replacement. That is, each value of the original sample
can occur once, multiple time, or not at all in a bootstrapped
can occur once, multiple times, or not at all in a bootstrapped
sample. This can be implemented by generating random indices into the
data set using the \code{randi()} function.
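The following lines sketch this idea (a minimal example, not part of
the exercises; the variable names are chosen only for illustration):
\begin{lstlisting}[caption={Drawing a single bootstrapped sample with \varcode{randi()}.}]
x = randn(100, 1);                     % original sample
inx = randi(length(x), length(x), 1);  % random indices, drawn with replacement
xb = x(inx);                           % bootstrapped sample of the same size
mb = mean(xb);                         % statistic computed on the bootstrapped sample
\end{lstlisting}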
\section{Bootstrap of the standard error}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\subsection{Bootstrap the standard error}
Bootstrapping can be nicely illustrated at the example of the
Bootstrapping can be nicely illustrated with the example of the
\enterm{standard error} of the mean (\determ{Standardfehler}). The
arithmetic mean is calculated for a simple random sample. The standard
error of the mean is the standard deviation of the expected
@ -116,11 +125,10 @@ population.
the standard error of the mean.}
\end{figure}
Via bootstrapping we create a distribution of the mean values
Via bootstrapping we generate a distribution of mean values
(\figref{bootstrapsemfig}) and the standard deviation of this
distribution is the standard error of the mean.
distribution is the standard error of the sample mean.
\pagebreak[4]
\begin{exercise}{bootstrapsem.m}{bootstrapsem.out}
Create the distribution of mean values from bootstrapped samples
resampled from a single SRS. Use this distribution to estimate the
@ -138,68 +146,166 @@ distribution is the standard error of the mean.
\end{exercise}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\section{Permutation tests}
Statistical tests ask for the probability that a measured value
originates from a null hypothesis. If this probability is smaller than the
desired \entermde{Signifikanz}{significance level}, the
\entermde{Nullhypothese}{null hypothesis} may be rejected.
\entermde{Nullhypothese}{null hypothesis} can be rejected.
Traditionally, such probabilities are taken from theoretical
distributions which are based on assumptions about the data. Thus the
applied statistical test has to be appropriate for the type of
data. An alternative approach is to calculate the probability density
of the null hypothesis directly from the data itself. To do this, we
need to resample the data according to the null hypothesis from the
SRS. By such permutation operations we destroy the feature of interest
while we conserve all other statistical properties of the data.
distributions which have been derived based on some assumptions about
the data. For example, the data should be normally distributed. Given
some data one has to find an appropriate test that matches the
properties of the data. An alternative approach is to calculate the
probability density of the null hypothesis directly from the data
themselves. To do so, we need to resample the data according to the
null hypothesis from the SRS. By such permutation operations we
destroy the feature of interest while conserving all other statistical
properties of the data.
\subsection{Significance of a difference in the mean}
Often we would like to know whether two data sets differ in their
mean. Whether the ears of foxes are larger in southern Europe compared
to the ones from Scandinavia, whether a drug decreases blood pressure
in humans, whether a sensory stimulus increases the firing rate of a
neuron, etc. The \entermde{Nullhypothese}{null hypothesis} is that
they do not differ in their means, i.e. that both data sets come from
the same distribution. But even if the two data sets come from the
same distribution, their sample means may nevertheless differ by
chance. We need to figure out how these differences of the means are
distributed. Only if the measured difference between the means is
significantly larger than the ones obtained by chance we can reject
the null hypothesis and consider the two data sets to differ
significantly in their means.
We can easily estimate the distribution of the null hypothesis by
putting the data of both data sets in one big bag. By merging the two
data sets we assume that all the data values come from the same
distribution. We then randomly separate the data values into two new
data sets. These random data sets contain data from both original data
sets and thus come from the same distribution. From these random data
sets we compute the difference of their sample means. This procedure
is repeated many, say one thousand, times and each time we get a value
for a difference of means. The distribution of these values is the
distribution of the null hypothesis. It is the distribution of
differences of mean values that we get by chance although the two data
sets come from the same distribution. For a one-sided test that checks
whether the measured difference of means is significantly larger than
zero at a significance level of 5\,\% we compute the value of the
95\,\% percentile of the null distribution. If the measured value is
larger, we can reject the null hypothesis and consider the two data
sets to differ significantly in their means.
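In code, the core of this procedure takes only a few lines. The
following sketch assumes two column vectors \varcode{x} and \varcode{y}
and is a condensed version of what the exercise below asks for:
\begin{lstlisting}[caption={Sketch of a permutation test for a difference in means.}]
md = mean(x) - mean(y);               % measured difference of the sample means
xy = [x; y];                          % lump both data sets together
nperm = 1000;
ds = zeros(nperm, 1);
for i = 1:nperm
    xyr = xy(randperm(length(xy)));   % shuffle the merged data
    ds(i) = mean(xyr(1:length(x))) - mean(xyr(length(x)+1:end));
end
dq = quantile(ds, 0.95);              % 95% percentile of the null distribution
issignificant = md >= dq;             % one-sided test at the 5% level
\end{lstlisting}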
By using the original data to estimate the null hypothesis, we make no
assumption about the properties of the data. We do not need to worry
about the data being normally distributed. We do not need to memorize
which test to use in which situation. And we better understand what we
are testing, because we design the test ourselves. Nowadays, computers
are powerful enough to iterate even ten thousand times over the data
to compute the distribution of the null hypothesis --- with only a few
lines of code. This is why \entermde{Permutationstest}{permutation
tests} are getting quite popular.
\begin{figure}[tp]
\includegraphics[width=1\textwidth]{permutecorrelation}
\titlecaption{\label{permutecorrelationfig}Permutation test for
correlations.}{Let the correlation coefficient of a dataset with
200 samples be $\rho=0.21$. The distribution of the null
hypothesis (yellow), optained from the correlation coefficients of
permuted and therefore uncorrelated datasets is centered around
zero. The measured correlation coefficient is larger than the
95\,\% percentile of the null hypothesis. The null hypothesis may
thus be rejected and the measured correlation is considered
statistically significant.}
\includegraphics[width=1\textwidth]{permuteaverage}
\titlecaption{\label{permuteaverage}Permutation test for differences
in means.}{We want to test whether two datasets
$\left\{x_i\right\}$ (red) and $\left\{y_i\right\}$ (blue) come
from different distributions by assessing the significance of the
difference in their sample means. The data sets were generated
with a difference in their population means of $d=0.7$. For
generating the distribution of the null hypothesis, i.e. the
distribution of differences in the means if the two data sets come
from the same distribution, we randomly select the same number of
samples from both data sets (top right). This is repeated many
times and results in the desired distribution of differences of
means (bottom). The measured difference is clearly beyond the
95\,\% percentile of this distribution and thus indicates a
significant difference between the distributions of the two
original data sets.}
\end{figure}
A good example for the application of a
\entermde{Permutationstest}{permutaion test} is the statistical
assessment of \entermde[correlation]{Korrelation}{correlations}. Given
are measured pairs of data points $(x_i, y_i)$. By calculating the
\begin{exercise}{meandiffsignificance.m}{meandiffsignificance.out}
Estimate the statistical significance of a difference in the mean of two data sets.
\vspace{-1ex}
\begin{enumerate}
\item Generate two independent data sets, $\left\{x_i\right\}$ and
$\left\{y_i\right\}$, of $n=200$ samples each, by drawing random
numbers from a normal distribution. Add 0.2 to all the $y_i$ samples
so that the population means differ by 0.2.
\item Calculate the difference between the sample means of the two data sets.
\item Estimate the distribution of the null hypothesis of no
difference of the means by generating new data sets with the same
number of samples randomly selected from both data sets. For this
lump the two data sets together into a single vector. Then permute
the order of the elements in this vector using the function
\varcode{randperm()}, split it into two data sets and calculate
the difference of their means. Repeat this 1000 times.
\item Read out the 95\,\% percentile from the resulting distribution
of the differences in the means (the null hypothesis) using the
\varcode{quantile()} function, and compare it with the difference of
means measured from the original data sets.
\end{enumerate}
\end{exercise}
\subsection{Significance of correlations}
Another nice example of the application of a
\entermde{Permutationstest}{permutation test} is testing for
significant \entermde[correlation]{Korrelation}{correlations}
(figure\,\ref{permutecorrelationfig}). Given are measured pairs of
data points $(x_i, y_i)$. By calculating the
\entermde[correlation!correlation
coefficient]{Korrelationskoeffizient}{correlation
coefficient} we can quantify how strongly $y$ depends on $x$. The
correlation coefficient alone, however, does not tell whether the
correlation is significantly different from a random correlation. The
\entermde{Nullhypothese}{null hypothesis} for such a situation is that
$y$ does not depend on $x$. In order to perform a permutation test, we
need to destroy the correlation by permuting the $(x_i, y_i)$ pairs,
i.e. we rearrange the $x_i$ and $y_i$ values in a random
coefficient]{Korrelationskoeffizient}{correlation coefficient} we can
quantify how strongly $y$ depends on $x$. The correlation coefficient
alone, however, does not tell whether the correlation is significantly
different from the non-zero correlations that we might get by chance
although there is no true correlation in the data. The \entermde{Nullhypothese}{null
hypothesis} for such a situation is that $y$ does not depend on
$x$. In order to perform a permutation test, we need to destroy the
correlation between the data pairs by permuting the $(x_i, y_i)$
pairs, i.e. we rearrange the $x_i$ and $y_i$ values in a random
fashion. Generating many sets of random pairs and computing the
resulting correlation coefficients yields a distribution of
correlation coefficients that result randomly from uncorrelated
corresponding correlation coefficients yields a distribution of
correlation coefficients that result randomly from truly uncorrelated
data. By comparing the actually measured correlation coefficient with
this distribution we can directly assess the significance of the
correlation (figure\,\ref{permutecorrelationfig}).
correlation.
\begin{figure}[tp]
\includegraphics[width=1\textwidth]{permutecorrelation}
\titlecaption{\label{permutecorrelationfig}Permutation test for
correlations.}{Let the correlation coefficient of a dataset with
200 samples be $\rho=0.21$ (top left). By shuffling the data pairs
we destroy any true correlation (top right). The resulting
distribution of the null hypothesis (bottom, yellow), obtained from
the correlation coefficients of permuted and therefore
uncorrelated datasets is centered around zero. The measured
correlation coefficient is larger than the 95\,\% percentile of
the null hypothesis. The null hypothesis may thus be rejected and
the measured correlation is considered statistically significant.}
\end{figure}
\begin{exercise}{correlationsignificance.m}{correlationsignificance.out}
Estimate the statistical significance of a correlation coefficient.
\begin{enumerate}
\item Create pairs of $(x_i, y_i)$ values. Randomly choose $x$-values
\item Generate pairs of $(x_i, y_i)$ values. Randomly choose $x$-values
and calculate the respective $y$-values according to $y_i =0.2 \cdot x_i + u_i$
where $u_i$ is a random number drawn from a normal distribution.
\item Calculate the correlation coefficient.
\item Generate the distribution of the null hypothesis by generating
\item Estimate the distribution of the null hypothesis by generating
uncorrelated pairs. For this permute $x$- and $y$-values
\matlabfun{randperm()} 1000 times and calculate for each permutation
the correlation coefficient.
\item Read out the 95\,\% percentile from the resulting distribution
of the null hypothesis and compare it with the correlation
coefficient computed from the original data.
of the null hypothesis using the \varcode{quantile()} function and
compare it with the correlation coefficient computed from the
original data.
\end{enumerate}
\end{exercise}

View File

@ -24,7 +24,7 @@ for i in range(nresamples) :
musrs.append(np.mean(rng.randn(nsamples)))
hmusrs, _ = np.histogram(musrs, bins, density=True)
fig, ax = plt.subplots(figsize=cm_size(figure_width, 1.2*figure_height))
fig, ax = plt.subplots(figsize=cm_size(figure_width, 1.1*figure_height))
fig.subplots_adjust(**adjust_fs(left=4.0, bottom=2.7, right=1.5))
ax.set_xlabel('Mean')
ax.set_xlim(-0.4, 0.4)

View File

@ -0,0 +1,103 @@
import numpy as np
import scipy.stats as st
import matplotlib.pyplot as plt
import matplotlib.gridspec as gridspec
import matplotlib.ticker as ticker
from plotstyle import *
rng = np.random.RandomState(637281)
# generate data that differ in their mean by d:
n = 200
d = 0.7
x = rng.randn(n) + d;
y = rng.randn(n);
#x = rng.exponential(1.0, n);
#y = rng.exponential(1.0, n) + d;
# histogram of data:
db = 0.5
bins = np.arange(-2.5, 2.6, db)
hx, _ = np.histogram(x, bins)
hy, _ = np.histogram(y, bins)
# Difference of means, pooled standard deviation and Cohen's d:
ad = np.mean(x)-np.mean(y)
s = np.sqrt(((len(x)-1)*np.var(x)+(len(y)-1)*np.var(y))/(len(x)+len(y)-2))
cd = ad/s
# permutation:
nperm = 1000
ads = []
xy = np.hstack((x, y))
for i in range(nperm) :
xyp = rng.permutation(xy)
ads.append(np.mean(xyp[:len(x)])-np.mean(xyp[len(x):]))
# histogram of shuffled data:
hxp, _ = np.histogram(xyp[:len(x)], bins)
hyp, _ = np.histogram(xyp[len(x):], bins)
# pdf of the differences of means:
h, b = np.histogram(ads, 20, density=True)
# significance:
dq = np.percentile(ads, 95.0)
print('Measured difference of means = %.2f, difference at 95%% percentile of permutation = %.2f' % (ad, dq))
da = 1.0-0.01*st.percentileofscore(ads, ad)
print('Measured difference of means %.2f is at %.2f%% percentile of permutation' % (ad, 100.0*da))
tt, tp = st.ttest_ind(x, y)  # t statistic and two-sided p-value
print('Measured difference of means %.2f has a t-test p-value of %.4f' % (ad, tp))
fig = plt.figure(figsize=cm_size(figure_width, 1.8*figure_height))
gs = gridspec.GridSpec(nrows=2, ncols=2, wspace=0.35, hspace=0.8,
**adjust_fs(fig, left=5.0, right=1.5, top=1.0, bottom=2.7))
ax = fig.add_subplot(gs[0,0])
ax.bar(bins[:-1]-0.25*db, hy, 0.5*db, **fsA)
ax.bar(bins[:-1]+0.25*db, hx, 0.5*db, **fsB)
ax.annotate('', xy=(0.0, 45.0), xytext=(d, 45.0), arrowprops=dict(arrowstyle='<->'))
ax.text(0.5*d, 50.0, 'd=%.1f' % d, ha='center')
ax.set_xlim(-2.5, 2.5)
ax.set_ylim(0.0, 50)
ax.yaxis.set_major_locator(ticker.MultipleLocator(20.0))
ax.set_xlabel('Original x and y values')
ax.set_ylabel('Counts')
ax = fig.add_subplot(gs[0,1])
ax.bar(bins[:-1]-0.25*db, hyp, 0.5*db, **fsA)
ax.bar(bins[:-1]+0.25*db, hxp, 0.5*db, **fsB)
ax.set_xlim(-2.5, 2.5)
ax.set_ylim(0.0, 50)
ax.yaxis.set_major_locator(ticker.MultipleLocator(20.0))
ax.set_xlabel('Shuffled x and y values')
ax.set_ylabel('Counts')
ax = fig.add_subplot(gs[1,:])
ax.annotate('Measured\ndifference\nis significant!',
xy=(ad, 1.2), xycoords='data',
xytext=(ad-0.1, 2.2), textcoords='data', ha='right',
arrowprops=dict(arrowstyle="->", relpos=(1.0,0.5),
connectionstyle="angle3,angleA=-20,angleB=100") )
ax.annotate('95% percentile',
xy=(0.19, 0.9), xycoords='data',
xytext=(0.3, 5.0), textcoords='data', ha='left',
arrowprops=dict(arrowstyle="->", relpos=(0.1,0.0),
connectionstyle="angle3,angleA=40,angleB=80") )
ax.annotate('Distribution of\nnull hypothesis',
xy=(-0.08, 3.0), xycoords='data',
xytext=(-0.22, 4.5), textcoords='data', ha='left',
arrowprops=dict(arrowstyle="->", relpos=(0.2,0.0),
connectionstyle="angle3,angleA=60,angleB=150") )
ax.bar(b[:-1], h, width=b[1]-b[0], **fsC)
ax.bar(b[:-1][b[:-1]>=dq], h[b[:-1]>=dq], width=b[1]-b[0], **fsB)
ax.plot( [ad, ad], [0, 1], **lsA)
ax.set_xlim(-0.25, 0.85)
ax.set_ylim(0.0, 5.0)
ax.yaxis.set_major_locator(ticker.MultipleLocator(2.0))
ax.set_xlabel('Difference of means')
ax.set_ylabel('PDF of H0')
plt.savefig('permuteaverage.pdf')

View File

@ -1,9 +1,11 @@
import numpy as np
import scipy.stats as st
import matplotlib.pyplot as plt
import matplotlib.gridspec as gridspec
import matplotlib.ticker as ticker
from plotstyle import *
rng = np.random.RandomState(637281)
rng = np.random.RandomState(37281)
# generate correlated data:
n = 200
@ -19,32 +21,56 @@ rd = np.corrcoef(x, y)[0, 1]
nperm = 1000
rs = []
for i in range(nperm) :
xr=rng.permutation(x)
yr=rng.permutation(y)
rs.append( np.corrcoef(xr, yr)[0, 1] )
xr = rng.permutation(x)
yr = rng.permutation(y)
rs.append(np.corrcoef(xr, yr)[0, 1])
rr = np.corrcoef(xr, yr)[0, 1]
# pdf of the correlation coefficients:
h, b = np.histogram(rs, 20, density=True)
# significance:
rq = np.percentile(rs, 95.0)
print('Measured correlation coefficient = %.2f, correlation coefficient at 95%% percentile of bootstrap = %.2f' % (rd, rq))
print('Measured correlation coefficient = %.2f, correlation coefficient at 95%% percentile of permutation = %.2f' % (rd, rq))
ra = 1.0-0.01*st.percentileofscore(rs, rd)
print('Measured correlation coefficient %.2f is at %.4f percentile of bootstrap' % (rd, ra))
print('Measured correlation coefficient %.2f is at %.4f percentile of permutation' % (rd, ra))
rp, ra = st.pearsonr(x, y)
print('Measured correlation coefficient %.2f is at %.4f percentile of test' % (rp, ra))
fig, ax = plt.subplots(figsize=cm_size(figure_width, 1.2*figure_height))
fig.subplots_adjust(**adjust_fs(left=4.0, bottom=2.7, right=0.5, top=1.0))
fig = plt.figure(figsize=cm_size(figure_width, 1.8*figure_height))
gs = gridspec.GridSpec(nrows=2, ncols=2, wspace=0.35, hspace=0.8,
**adjust_fs(fig, left=5.0, right=1.5, top=1.0, bottom=2.7))
ax = fig.add_subplot(gs[0,0])
ax.text(0.0, 4.0, 'r=%.2f' % rd, ha='center')
ax.plot(x, y, **psAm)
ax.set_xlim(-4.0, 4.0)
ax.set_ylim(-4.0, 4.0)
ax.xaxis.set_major_locator(ticker.MultipleLocator(2.0))
ax.yaxis.set_major_locator(ticker.MultipleLocator(2.0))
ax.set_xlabel('x')
ax.set_ylabel('y')
ax = fig.add_subplot(gs[0,1])
ax.text(0.0, 4.0, 'r=%.2f' % rr, ha='center')
ax.plot(xr, yr, **psAm)
ax.set_xlim(-4.0, 4.0)
ax.set_ylim(-4.0, 4.0)
ax.xaxis.set_major_locator(ticker.MultipleLocator(2.0))
ax.yaxis.set_major_locator(ticker.MultipleLocator(2.0))
ax.set_xlabel('Shuffled x')
ax.set_ylabel('Shuffled y')
ax = fig.add_subplot(gs[1,:])
ax.annotate('Measured\ncorrelation\nis significant!',
xy=(rd, 1.1), xycoords='data',
xytext=(rd, 2.2), textcoords='data', ha='left',
arrowprops=dict(arrowstyle="->", relpos=(0.2,0.0),
xytext=(rd-0.01, 3.0), textcoords='data', ha='left',
arrowprops=dict(arrowstyle="->", relpos=(0.3,0.0),
connectionstyle="angle3,angleA=10,angleB=80") )
ax.annotate('95% percentile',
xy=(0.14, 0.9), xycoords='data',
xytext=(0.18, 4.0), textcoords='data', ha='left',
xytext=(0.16, 6.2), textcoords='data', ha='left',
arrowprops=dict(arrowstyle="->", relpos=(0.1,0.0),
connectionstyle="angle3,angleA=30,angleB=80") )
ax.annotate('Distribution of\nuncorrelated\nsamples',
@ -56,7 +82,9 @@ ax.bar(b[:-1], h, width=b[1]-b[0], **fsC)
ax.bar(b[:-1][b[:-1]>=rq], h[b[:-1]>=rq], width=b[1]-b[0], **fsB)
ax.plot( [rd, rd], [0, 1], **lsA)
ax.set_xlim(-0.25, 0.35)
ax.set_ylim(0.0, 6.0)
ax.yaxis.set_major_locator(ticker.MultipleLocator(2.0))
ax.set_xlabel('Correlation coefficient')
ax.set_ylabel('Prob. density of H0')
ax.set_ylabel('PDF of H0')
plt.savefig('permutecorrelation.pdf')

View File

@ -1,5 +1,5 @@
# plots:
plots : pythonplots gnuplots
plots : pythonplots
# python plots:
PYFILES=$(wildcard *.py)
@ -10,25 +10,12 @@ pythonplots : $(PYPDFFILES)
$(PYPDFFILES) : %.pdf: %.py ../../plotstyle.py
PYTHONPATH="../../" python3 $<
#ps2pdf $@ $(@:.pdf=-temp.pdf) # strip fonts, saves only about 1.5MB
#mv $(@:.pdf=-temp.pdf) $@
cleanpythonplots :
rm -f $(PYPDFFILES)
# gnuplot plots:
GPTFILES=$(wildcard *.gpt)
GPTTEXFILES=$(GPTFILES:.gpt=.tex)
gnuplots : $(GPTTEXFILES)
$(GPTTEXFILES) : %.tex: %.gpt whitestyles.gp
gnuplot whitestyles.gp $<
epstopdf $*.eps
cleangnuplots :
rm -f $(GPTTEXFILES)
# script:
chapter : $(BASENAME)-chapter.pdf
@ -42,12 +29,15 @@ $(BASENAME)-chapter.pdf : $(BASENAME)-chapter.tex $(BASENAME).tex $(wildcard $(B
watchchapter :
while true; do ! make -q chapter && make chapter; sleep 0.5; done
watchplots :
while true; do ! make -q plots && make plots; sleep 0.5; done
cleantex:
rm -f *~
rm -f $(BASENAME).aux $(BASENAME).log *.idx
rm -f $(BASENAME)-chapter.aux $(BASENAME)-chapter.log $(BASENAME)-chapter.out $(BASENAME)-chapter.idx $(BASENAME)-chapter-solutions.tex $(BASENAME)-solutions.tex
cleanplots: cleanpythonplots cleangnuplots
cleanplots: cleanpythonplots
cleanchapter : cleanplots cleantex

View File

@ -4,6 +4,7 @@
more months might as well have been written by someone
else.}{Eagleson's law}
\noindent
Cultivating a good code style is not just a matter of good taste but
rather is a key ingredient for readability and maintainability of code
and, in the end, facilitates reproducibility of scientific
@ -204,7 +205,7 @@ random walk\footnote{A random walk is a simple simulation of Brownian
(listing \ref{chaoticcode}) and then in a cleaner way (listing
\ref{cleancode}).
\begin{lstlisting}[label=chaoticcode, caption={Chaotic implementation of the random-walk.}]
\begin{pagelisting}[label=chaoticcode, caption={Chaotic implementation of the random-walk.}]
num_runs = 10; max_steps = 1000;
positions = zeros(max_steps, num_runs);
@ -217,18 +218,15 @@ for step = 2:max_steps
x = randn(1);
if x<0
positions(step, run)= positions(step-1, run)+1;
elseif x>0
positions(step,run)=positions(step-1,run)-1;
end
end
end
\end{lstlisting}
\pagebreak[4]
\end{pagelisting}
\begin{lstlisting}[label=cleancode, caption={Clean implementation of the random-walk.}]
\begin{pagelisting}[label=cleancode, caption={Clean implementation of the random-walk.}]
num_runs = 10;
max_steps = 1000;
positions = zeros(max_steps, num_runs);
@ -243,7 +241,7 @@ for run = 1:num_runs
end
end
end
\end{lstlisting}
\end{pagelisting}
\section{Using comments}
@ -275,7 +273,6 @@ avoided:\\ \varcode{ x = x + 2; \% add two to x}\\
make it even clearer.}{Steve McConnell}
\end{important}
\pagebreak[4]
\section{Documenting functions}
All pre-defined \matlab{} functions begin with a comment block that
describes the purpose of the function, the required and optional
@ -335,8 +332,7 @@ used within the context of another function \matlab{} allows to define
within the same file. Listing \ref{localfunctions} shows an example of
a local function definition.
\pagebreak[3]
\lstinputlisting[label=localfunctions, caption={Example for local
\pageinputlisting[label=localfunctions, caption={Example for local
functions.}]{calculateSines.m}
\emph{Local functions} live in the same \entermde{m-File}{m-file} as

View File

@ -59,14 +59,14 @@ every opening parenthesis must be matched by a closing one or every
respective error messages are clear and the editor will point out and
highlight most syntax errors.
\begin{lstlisting}[label=syntaxerror, caption={Unbalanced parenthesis error.}]
\begin{pagelisting}[label=syntaxerror, caption={Unbalanced parenthesis error.}]
>> mean(random_numbers
|
Error: Expression or statement is incorrect--possibly unbalanced (, {, or [.
Did you mean:
>> mean(random_numbers)
\end{lstlisting}
\end{pagelisting}
\subsection{Indexing error}\label{index_error}
Second on the list of common errors are the
@ -125,7 +125,7 @@ dimensions. The command in line 7 works due to the fact, that matlab
automatically extends the matrix, if you assign values to a range
outside its bounds.
\begin{lstlisting}[label=assignmenterror, caption={Assignment errors.}]
\begin{pagelisting}[label=assignmenterror, caption={Assignment errors.}]
>> a = zeros(1, 100);
>> b = 0:10;
@ -136,7 +136,7 @@ outside its bounds.
>> size(a)
ans =
110 1
\end{lstlisting}
\end{pagelisting}
\subsection{Dimension mismatch error}
Similarly, some arithmetic operations are only valid if the variables
@ -154,7 +154,7 @@ in listing\,\ref{dimensionmismatch} does not throw an error but the
result is something other than the expected elementwise multiplication.
% XXX Some arithmetic operations make size constraints, violating them leads to dimension mismatch errors.
\begin{lstlisting}[label=dimensionmismatch, caption={Dimension mismatch errors.}]
\begin{pagelisting}[label=dimensionmismatch, caption={Dimension mismatch errors.}]
>> a = randn(100, 1);
>> b = randn(10, 1);
>> a + b
@ -171,7 +171,7 @@ result is something else than the expected elementwise multiplication.
>> size(c)
ans =
100 10
\end{lstlisting}
\end{pagelisting}
@ -239,7 +239,7 @@ but it requires a deep understanding of the applied functions and also
the task at hand.
% XXX Converting a series of spike times into the firing rate as a function of time. Many tasks can be solved with a single line of code. But is this readable?
\begin{lstlisting}[label=easyvscomplicated, caption={One-liner versus readable code.}]
\begin{pagelisting}[label=easyvscomplicated, caption={One-liner versus readable code.}]
% the one-liner
rate = conv(full(sparse(1, round(spike_times/dt), 1, 1, length(time))), kernel, 'same');
@ -248,7 +248,7 @@ rate = zeros(size(time));
spike_indices = round(spike_times/dt);
rate(spike_indices) = 1;
rate = conv(rate, kernel, 'same');
\end{lstlisting}
\end{pagelisting}
The preferred way depends on several considerations. (i) How deep is
your personal understanding of the programming language? (ii) What
@ -291,7 +291,7 @@ example given in the \matlab{} help and assume that there is a
function \varcode{rightTriangle()} (listing\,\ref{trianglelisting}).
% XXX Slightly more readable version of the example given in the \matlab{} help system. Note: The variable name for the angles have been capitalized in order to not override the matlab defined functions \code{alpha, beta,} and \code{gamma}.
\begin{lstlisting}[label=trianglelisting, caption={Example function for unit testing.}]
\begin{pagelisting}[label=trianglelisting, caption={Example function for unit testing.}]
function angles = rightTriangle(length_a, length_b)
ALPHA = atand(length_a / length_b);
BETA = atand(length_a / length_b);
@ -300,7 +300,7 @@ function angles = rightTriangle(length_a, length_b)
angles = [ALPHA BETA GAMMA];
end
\end{lstlisting}
\end{pagelisting}
This function expects two input arguments that are the length of the
sides $a$ and $b$ and assumes a right angle between them. From this
@ -337,7 +337,7 @@ The test script for the \varcode{rightTriangle()} function
(listing\,\ref{trianglelisting}) may look like in
listing\,\ref{testscript}.
\begin{lstlisting}[label=testscript, caption={Unit test for the \varcode{rightTriangle()} function stored in an m-file testRightTriangle.m}]
\begin{pagelisting}[label=testscript, caption={Unit test for the \varcode{rightTriangle()} function stored in an m-file testRightTriangle.m}]
tolerance = 1e-10;
% preconditions
@ -373,7 +373,7 @@ angles = rightTriangle(1, 1500);
smallAngle = (pi / 180) * angles(1); % radians
approx = sin(smallAngle);
assert(abs(approx - smallAngle) <= tolerance, 'Problem with small angle approximation')
\end{lstlisting}
\end{pagelisting}
In a test script we can execute any code. The actual test whether or
not the results match our predictions is done using the
@ -390,16 +390,16 @@ executed. We further define a \varcode{tolerance} variable that is
used when comparing double values (Why might the test on equality of
double values be tricky?).
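As a hint to the question above: most decimal fractions cannot be
represented exactly as floating point numbers, so computed results may
deviate from the mathematically exact value by tiny rounding
errors. The following minimal sketch (not part of the test script)
illustrates why doubles should never be compared for exact equality:
\begin{pagelisting}[caption={Comparing double values requires a tolerance.}]
>> x = 0.1 + 0.2;         % mathematically this is exactly 0.3
>> x == 0.3               % returns false (0) because of rounding errors
>> abs(x - 0.3) < 1e-10   % a comparison with tolerance returns true (1)
\end{pagelisting}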
\begin{lstlisting}[label=runtestlisting, caption={Run the test!}]
\begin{pagelisting}[label=runtestlisting, caption={Run the test!}]
result = runtests('testRightTriangle')
\end{lstlisting}
\end{pagelisting}
During the run, \matlab{} will print error messages to the command
line, and a summary of the test results is stored in the
\varcode{result} variable. These can be displayed using the function
\code[table()]{table(result)}.
\begin{lstlisting}[label=testresults, caption={The test results.}, basicstyle=\ttfamily\scriptsize]
\begin{pagelisting}[label=testresults, caption={The test results.}, basicstyle=\ttfamily\scriptsize]
table(result)
ans =
4x6 table
@ -411,7 +411,7 @@ _________________________________ ______ ______ ___________ ________ _____
'testR.../Test_IsoscelesTriangles' true false false 0.004893 [1x1 struct]
'testR.../Test_30_60_90Triangle' true false false 0.005057 [1x1 struct]
'testR.../Test_SmallAngleApprox' true false false 0.0049 [1x1 struct]
\end{lstlisting}
\end{pagelisting}
So far so good: all tests pass and our function appears to do what it
is supposed to do. But tests are only as good as the programmer who
@ -479,11 +479,11 @@ stopped in debug mode (listing\,\ref{debuggerlisting}).
\end{figure}
\begin{lstlisting}[label=debuggerlisting, caption={Command line when the program execution was stopped in the debugger.}]
\begin{pagelisting}[label=debuggerlisting, caption={Command line when the program execution was stopped in the debugger.}]
>> simplerandomwalk
6 for run = 1:num_runs
K>>
\end{lstlisting}
\end{pagelisting}
When stopped in the debugger we can view and change the state of the
program at this point. We can also issue commands to try the next

View File

@ -10,7 +10,8 @@ pattern]{design pattern}.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\section{Looping over vector elements}
Iterating over vector elements by means of a \mcode{for}-loop is a very common pattern:
\begin{lstlisting}[caption={\varcode{for}-loop for accessing vector elements by indices}]
\begin{pagelisting}[caption={\varcode{for}-loop for accessing vector elements by indices}]
x = [2:3:20]; % Some vector.
for i=1:length(x) % For loop over the indices of the vector.
i % This is the index (an integer number)
@ -22,12 +23,14 @@ for i=1:length(x) % For loop over the indices of the vector.
% as an argument to a function:
do_something(x(i));
end
\end{lstlisting}
\end{pagelisting}
\noindent
If the results of the computations within the loop are single numbers
that are to be stored in a vector, you should create this vector with
the right size before the loop:
\begin{lstlisting}[caption={\varcode{for}-loop for writing a vector}]
\begin{pagelisting}[caption={\varcode{for}-loop for writing a vector}]
x = [1.2 2.3 2.6 3.1]; % Some vector.
% Create a vector for the results, as long as the number of loops:
y = zeros(length(x),1);
@ -38,13 +41,15 @@ for i=1:length(x)
end
% Now the result vector can be further processed:
mean(y);
\end{lstlisting}
\end{pagelisting}
\noindent
The computation within the loop could also result in a vector of some
length and not just a single number. If the length of this vector
(here 10) is known beforehand, then you should create a matrix of
appropriate size for storing the results:
\begin{lstlisting}[caption={\varcode{for}-loop for writing rows of a matrix}]
\begin{pagelisting}[caption={\varcode{for}-loop for writing rows of a matrix}]
x = [2:3:20]; % Some vector.
% Create space for results -
% as many rows as loops, as many columns as needed:
@ -56,30 +61,33 @@ for i=1:length(x)
end
% Process the results stored in matrix y:
mean(y, 1)
\end{lstlisting}
\end{pagelisting}
\noindent
Another possibility is that the result vectors (here of unknown size)
need to be combined into a single large vector:
\begin{lstlisting}[caption={\varcode{for}-loop for appending vectors}]
\begin{pagelisting}[caption={\varcode{for}-loop for appending vectors}]
x = [2:3:20]; % Some vector.
y = []; % Empty vector for storing the results.
for i=1:length(x)
% The function get_something() returns a vector of unspecified size:
z = get_somehow_more(x(i));
z = get_something(x(i));
% The content of z is appended to the result vector y:
y = [y; z(:)];
y = [y, z(:)];
% The z(:) syntax ensures that we append column-vectors.
end
% Process the results stored in the vector z:
mean(y)
\end{lstlisting}
% Process the results stored in the vector y:
mean(y, 1)
\end{pagelisting}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\section{Scaling and shifting random numbers, zeros, and ones}
Random number generators usually return random numbers of a given mean
and standard deviation. Multiply those numbers by a factor to change their standard deviation and add a number to shift the mean.
\begin{lstlisting}[caption={Scaling and shifting of random numbers}]
\begin{pagelisting}[caption={Scaling and shifting of random numbers}]
% 100 random numbers drawn from a normal distribution
% with mean 0 and standard deviation 1:
x = randn(100, 1);
@ -89,18 +97,20 @@ x = randn(100, 1);
mu = 4.8;
sigma = 2.3;
y = randn(100, 1)*sigma + mu;
\end{lstlisting}
\end{pagelisting}
\noindent
The same principle is useful in the context of the functions
\mcode{zeros()} and \mcode{ones()}:
\begin{lstlisting}[caption={Scaling and shifting of \varcode{zeros()} and \varcode{ones()}}]
\begin{pagelisting}[caption={Scaling and shifting of \varcode{zeros()} and \varcode{ones()}}]
x = -1:0.01:2; % Vector of x-values for plotting
plot(x, exp(-x.*x));
% Plot for the same x-values a horizontal line with y=0.8:
plot(x, zeros(size(x))+0.8);
% ... or a line with y=0.5:
plot(x, ones(size(x))*0.5);
\end{lstlisting}
\end{pagelisting}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
@ -119,25 +129,26 @@ can plot the values of the $y$ vector against the ones of the $x$
vector.
The following scripts compute and plot the function $f(x)=e^{-x^2}$:
\begin{lstlisting}[caption={Plotting a mathematical function --- very detailed}]
\begin{pagelisting}[caption={Plotting a mathematical function --- very detailed}]
xmin = -1.0;
xmax = 2.0;
dx = 0.01; % Step size
x = xmin:dx:xmax; % Vector with x-values.
y = exp(-x.*x); % No for loop! '.*' for multiplying the vector elements.
plot(x, y);
\end{lstlisting}
\end{pagelisting}
\begin{lstlisting}[caption={Plotting a mathematical function --- shorter}]
\begin{pagelisting}[caption={Plotting a mathematical function --- shorter}]
x = -1:0.01:2;
y = exp(-x.*x);
plot(x, y);
\end{lstlisting}
\end{pagelisting}
\begin{lstlisting}[caption={Plotting a mathematical function --- compact}]
\begin{pagelisting}[caption={Plotting a mathematical function --- compact}]
x = -1:0.01:2;
plot(x, exp(-x.*x));
\end{lstlisting}
\end{pagelisting}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
@ -146,28 +157,34 @@ For estimating probabilities or probability densities from histograms
we need to normalize them appropriately.
The \mcode{histogram()} function does this automatically with the appropriate arguments:
\begin{lstlisting}[caption={Probability density with the \varcode{histogram()}-function}]
\begin{pagelisting}[caption={Probability density with the \varcode{histogram()}-function}]
x = randn(100, 1); % Some real-valued data.
histogram(x, 'Normalization', 'pdf');
\end{lstlisting}
\begin{lstlisting}[caption={Probability with the \varcode{histogram()}-function}]
\end{pagelisting}
\begin{pagelisting}[caption={Probability with the \varcode{histogram()}-function}]
x = randi(6, 100, 1); % Some integer-valued data.
histogram(x, 'Normalization', 'probability');
\end{lstlisting}
\end{pagelisting}
\noindent
Alternatively one can normalize the histogram data as returned by the
\code{hist()}-function manually:
\begin{lstlisting}[caption={Probability density with the \varcode{hist()}- and \varcode{bar()}-function}]
\begin{pagelisting}[caption={Probability density with the \varcode{hist()}- and \varcode{bar()}-function}]
x = randn(100, 1); % Some real-valued data.
[h, b] = hist(x); % Compute histogram.
h = h/sum(h)/(b(2)-b(1)); % Normalization to a probability density.
bar(b, h); % Plot the probability density.
\end{lstlisting}
\begin{lstlisting}[caption={Probability with the \varcode{hist()}- and \varcode{bar()}-function}]
\end{pagelisting}
\begin{pagelisting}[caption={Probability with the \varcode{hist()}- and \varcode{bar()}-function}]
x = randi(6, 100, 1); % Some integer-valued data.
[h, b] = hist(x); % Compute histogram.
h = h/sum(h); % Normalize to probability.
bar(b, h); % Plot the probabilities.
\end{lstlisting}
\end{pagelisting}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

33
exercises.mk Normal file
View File

@ -0,0 +1,33 @@
EXERCISES=$(TEXFILES:.tex=.pdf)
SOLUTIONS=$(EXERCISES:%.pdf=%-solutions.pdf)
.PHONY: pdf exercises solutions watch watchexercises watchsolutions clean
pdf : $(SOLUTIONS) $(EXERCISES)
exercises : $(EXERCISES)
solutions : $(SOLUTIONS)
$(SOLUTIONS) : %-solutions.pdf : %.tex ../../exercisesheader.tex ../../exercisestitle.tex
{ echo "\\documentclass[answers,12pt,a4paper,pdftex]{exam}"; sed -e '1d' $<; } > $(patsubst %.pdf,%.tex,$@)
pdflatex -interaction=scrollmode $(patsubst %.pdf,%.tex,$@) | tee /dev/stderr | fgrep -q "Rerun to get cross-references right" && pdflatex -interaction=scrollmode $(patsubst %.pdf,%.tex,$@) || true
rm $(patsubst %.pdf,%,$@).[!p]*
$(EXERCISES) : %.pdf : %.tex ../../exercisesheader.tex ../../exercisestitle.tex
pdflatex -interaction=scrollmode $< | tee /dev/stderr | fgrep -q "Rerun to get cross-references right" && pdflatex -interaction=scrollmode $< || true
watch :
while true; do ! make -q pdf && make pdf; sleep 0.5; done
watchexercises :
while true; do ! make -q exercises && make exercises; sleep 0.5; done
watchsolutions :
while true; do ! make -q solutions && make solutions; sleep 0.5; done
clean :
rm -f *~ *.aux *.log $(EXERCISES:.pdf=.out) $(SOLUTIONS:.pdf=.out)
cleanup : clean
rm -f $(SOLUTIONS) $(EXERCISES)

110
exercisesheader.tex Normal file
View File

@ -0,0 +1,110 @@
\usepackage[english]{babel}
\usepackage{pslatex}
\usepackage{graphicx}
\usepackage{tikz}
\usepackage{xcolor}
\usepackage{amsmath}
\usepackage{amssymb}
%%%%% listings %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{listings}
\lstset{
language=Matlab,
basicstyle=\ttfamily\footnotesize,
numbers=left,
numberstyle=\tiny,
title=\lstname,
showstringspaces=false,
commentstyle=\itshape\color{darkgray},
breaklines=true,
breakautoindent=true,
% columns=flexible,
frame=single,
xleftmargin=1.5em,
xrightmargin=1em,
aboveskip=10pt
}
%%%%% page style %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage[left=20mm,right=20mm,top=25mm,bottom=19mm,headsep=2ex,headheight=3ex,footskip=3.5ex]{geometry}
\pagestyle{headandfoot}
\ifprintanswers
\newcommand{\stitle}{Solutions}
\else
\newcommand{\stitle}{}
\fi
\header{{\bfseries\large \exercisenum. \exercisetopic}}{{\bfseries\large\stitle}}{{\bfseries\large\exercisedate}}
\firstpagefooter{Prof. Dr. Jan Benda}{}{jan.benda@uni-tuebingen.de}
\runningfooter{}{\thepage}{}
\shadedsolutions
\definecolor{SolutionColor}{gray}{0.9}
\setlength{\baselineskip}{15pt}
\setlength{\parindent}{0.0cm}
\setlength{\parskip}{0.3cm}
\usepackage{multicol}
%%%%% units %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage[mediumspace,mediumqspace,Gray,squaren]{SIunits} % \ohm, \micro
%%%%% new commands %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\newcommand{\cin}[1]{[{\rm #1}]_{\text{in}}}
\newcommand{\cout}[1]{[{\rm #1}]_{\text{out}}}
\newcommand{\units}[1]{\text{#1}}
\newcommand{\K}{\text{K$^+$}}
\newcommand{\Na}{\text{Na$^+$}}
\newcommand{\Cl}{\text{Cl$^-$}}
\newcommand{\Ca}{\text{Ca$^{2+}$}}
\newcommand{\water}{$\text{H}_2\text{O}$}
\usepackage{dsfont}
\newcommand{\naZ}{\mathds{N}}
\newcommand{\gaZ}{\mathds{Z}}
\newcommand{\raZ}{\mathds{Q}}
\newcommand{\reZ}{\mathds{R}}
\newcommand{\reZp}{\mathds{R^+}}
\newcommand{\reZpN}{\mathds{R^+_0}}
\newcommand{\koZ}{\mathds{C}}
\newcommand{\RT}{{\rm Re\!\ }}
\newcommand{\IT}{{\rm Im\!\ }}
\newcommand{\arccot}{{\rm arccot}}
\newcommand{\sgn}{{\rm sgn}}
\newcommand{\im}{{\rm i}}
\newcommand{\drv}{\mathrm{d}}
\newcommand{\divis}[2]{$^{#1}\!\!/\!_{#2}$}
\newcommand{\vect}[2]{\left( \!\! \begin{array}{c} #1 \\ #2 \end{array} \!\! \right)}
\newcommand{\matt}[2]{\left( \!\! \begin{array}{cc} #1 \\ #2 \end{array} \!\! \right)}
\renewcommand{\Re}{\mathrm{Re}}
\renewcommand{\Im}{\mathrm{Im}}
\newcommand{\av}[1]{\left\langle #1 \right\rangle}
\newcommand{\pref}[1]{(\ref{#1})}
\newcommand{\eqnref}[1]{(\ref{#1})}
\newcommand{\hr}{\par\vspace{-5ex}\noindent\rule{\textwidth}{1pt}\par\vspace{-1ex}}
\newcommand{\qt}[1]{\textbf{#1}\\}
\newcommand{\extra}{--- Optional ---\ \mbox{}}
\newcommand{\code}[1]{\texttt{#1}}
%%%%% page breaks %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\newcommand{\continue}{\ifprintanswers%
\else
\vfill\hspace*{\fill}$\rightarrow$\newpage%
\fi}
\newcommand{\continuepage}{\ifprintanswers%
\newpage
\else
\vfill\hspace*{\fill}$\rightarrow$\newpage%
\fi}
\newcommand{\newsolutionpage}{\ifprintanswers%
\newpage%
\else
\fi}
%%%%% hyperref %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage[breaklinks=true,bookmarks=true,bookmarksopen=true,pdfpagemode=UseNone,pdfstartview=FitH,colorlinks=true,citecolor=blue!50!black,linkcolor=blue!50!black,urlcolor=blue!50!black]{hyperref}

View File

@ -4,3 +4,4 @@
{\large Jan Grewe, Jan Benda}\\[-3ex]
Neuroethology Lab \hfill --- \hfill Institute for Neurobiology \hfill --- \hfill \includegraphics[width=0.28\textwidth]{UT_WBMW_Black_RGB} \\
\end{center}
\hr

View File

@ -1,8 +1,10 @@
%%%%% title %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\title{\textbf{\huge\sffamily\tr{Introduction to\\[1ex] Scientific Computing}%
{Einf\"uhrung in die\\[1ex] wissenschaftliche Datenverarbeitung}}}
%\title{\textbf{\huge\sffamily\tr{Scientific Computing for Neurobiologists}%
% {Wissenschaftliche Datenverarbeitung f\"ur Neurobiologen}}}
\author{{\LARGE Jan Grewe \& Jan Benda}\\[5ex]Abteilung Neuroethologie\\[2ex]%
\author{{\LARGE Jan Grewe \& Jan Benda}\\[5ex]Neuroethology Lab\\[2ex]%
\includegraphics[width=0.3\textwidth]{UT_WBMW_Rot_RGB}\vspace{3ex}}
\date{WS 2020/2021\\\vfill%
@ -66,20 +68,16 @@
\pagecolor{white}
%%%%% figures %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% gnuplot figures:
\newcommand{\texinputpath}{}
\newcommand{\texpicture}[1]{{\sffamily\footnotesize\input{\texinputpath#1.tex}}}
\newcommand{\figlabel}[1]{\textsf{\textbf{\large \uppercase{#1}}}}
% maximum number of floats:
\setcounter{topnumber}{2}
\setcounter{bottomnumber}{0}
\setcounter{topnumber}{1}
\setcounter{bottomnumber}{1}
\setcounter{totalnumber}{2}
% float placement fractions:
\renewcommand{\textfraction}{0.2}
\renewcommand{\textfraction}{0.1}
\renewcommand{\topfraction}{0.9}
\renewcommand{\bottomfraction}{0.0}
\renewcommand{\bottomfraction}{0.9}
\renewcommand{\floatpagefraction}{0.7}
% spacing for floats:
@ -209,11 +207,41 @@
\let\l@lstlisting\l@figure
\makeatother
%%%%% english, german, code and file terms: %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% \lstinputlisting wrapped in a minipage to avoid page breaks:
\newcommand{\pageinputlisting}[2][]{\vspace{-2ex}\noindent\begin{minipage}[t]{1\linewidth}\lstinputlisting[#1]{#2}\end{minipage}}
%%%%% listing environment: %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% usage:
%
% \begin{pagelisting}[label=listing1, caption={A script.}]
% >> x = 6
% \end{pagelisting}
%
% This is the lstlisting environment but wrapped in a minipage to avoid page breaks.
\lstnewenvironment{pagelisting}[1][]%
{\vspace{-2ex}\lstset{#1}\noindent\minipage[t]{1\linewidth}}%
{\endminipage}
%%%%% english and german terms: %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{ifthen}
% \enterm[en-index]{term}: Typeset term and add it to the index of english terms
%
% \determ[de-index]{term}: Typeset term and add it to the index of german terms
%
% \entermde[en-index]{de-index}{term}: Typeset term and add it to the index of english terms
% and de-index to the index of german terms
%
% how to specificy an index:
% \enterm{term} - just put term into the index
% \enterm[en-index]{term} - typeset term and put en-index into the index
% \enterm[statistics!mean]{term} - mean is a subentry of statistics
% \enterm[statistics!average|see{statistics!mean}]{term} - cross reference to statistics mean
% \enterm[statistics@\textbf{statistics}]{term} - put index at statistics but use
% \textbf{statistics} for typesetting in the index
% \enterm[english index entry]{<english term>}
% typeset the term in italics and add it (or the optional argument) to
% typeset the term in italics and add it (or rather the optional argument) to
% the english index.
\newcommand{\enterm}[2][]{\textit{#2}\ifthenelse{\equal{#1}{}}{\protect\sindex[enterm]{#2}}{\protect\sindex[enterm]{#1}}}
@ -349,11 +377,12 @@
}{%
\immediate\write\solutions{\unexpanded{\subsection}{Exercise \thechapter.\arabic{exercisef}}}%
\immediate\write\solutions{\unexpanded{\label}{solution\arabic{chapter}-\arabic{exercisef}}}%
\immediate\write\solutions{\unexpanded{\lstinputlisting[belowskip=0ex,aboveskip=0ex,%
nolol=true, title={\textbf{Source code:} \protect\StrSubstitute{#1}{_}{\_}}]}{\codepath#1}}%
\immediate\write\solutions{\unexpanded{\begin{minipage}{1\linewidth}\lstinputlisting[belowskip=0ex,aboveskip=0ex,%
nolol=true, title={\textbf{Source code:} \protect\StrSubstitute{#1}{_}{\_}}]}{\codepath#1}\unexpanded{\end{minipage}}}%
\ifthenelse{\equal{#2}{}}{}%
{\immediate\write\solutions{\unexpanded{\lstinputlisting[language={},%
nolol=true, title={\textbf{Output:}}, belowskip=0ex, aboveskip=1ex]}{\codepath#2}}}%
{\immediate\write\solutions{\unexpanded{\begin{minipage}{1\linewidth}\lstinputlisting[language={},%
nolol=true, title={\textbf{Output:}}, belowskip=0ex, aboveskip=1ex]}{\codepath#2}\unexpanded{\end{minipage}}}}%
\immediate\write\solutions{\unexpanded{\vspace*{\fill}}}%
\immediate\write\solutions{}%
}%
}%
@ -362,14 +391,18 @@
{ \hypersetup{hypertexnames=false}%
\ifthenelse{\equal{\exercisesource}{}}{}%
{ \addtocounter{lstlisting}{-1}%
\lstinputlisting[belowskip=0pt,aboveskip=1ex,nolol=true,%
\par\noindent\begin{minipage}[t]{1\linewidth}%
\lstinputlisting[belowskip=1ex,aboveskip=-1ex,nolol=true,%
title={\textbf{Solution:} \exercisefile}]%
{\exercisesource}%
\end{minipage}%
\ifthenelse{\equal{\exerciseoutput}{}}{}%
{ \addtocounter{lstlisting}{-1}%
\par\noindent\begin{minipage}[t]{1\linewidth}%
\lstinputlisting[language={},title={\textbf{Output:}},%
nolol=true,belowskip=0pt]%
nolol=true,belowskip=0pt,aboveskip=-0.5ex]%
{\exerciseoutput}%
\end{minipage}%
}%
}%
\hypersetup{hypertexnames=true}%
@ -452,12 +485,12 @@
{ \captionsetup{singlelinecheck=off,hypcap=false,labelformat={empty},%
labelfont={large,sf,it,bf},font={large,sf,it,bf}}
\ifthenelse{\equal{#1}{}}%
{ \begin{mdframed}[linecolor=importantline,linewidth=1ex,%
{ \begin{mdframed}[nobreak=true,linecolor=importantline,linewidth=1ex,%
backgroundcolor=importantback,font={\sffamily}]%
\setlength{\parindent}{0pt}%
\setlength{\parskip}{1ex}%
}%
{ \begin{mdframed}[linecolor=importantline,linewidth=1ex,%
{ \begin{mdframed}[nobreak=true,linecolor=importantline,linewidth=1ex,%
backgroundcolor=importantback,font={\sffamily},%
frametitle={\captionof{iboxf}{#1}},frametitleaboveskip=-1ex,%
frametitlebackgroundcolor=importantline]%

View File

@ -1,34 +1,3 @@
TEXFILES=$(wildcard exercises??.tex)
EXERCISES=$(TEXFILES:.tex=.pdf)
SOLUTIONS=$(EXERCISES:exercises%=solutions%)
TEXFILES=$(wildcard likelihood-?.tex)
.PHONY: pdf exercises solutions watch watchexercises watchsolutions clean
pdf : $(SOLUTIONS) $(EXERCISES)
exercises : $(EXERCISES)
solutions : $(SOLUTIONS)
$(SOLUTIONS) : solutions%.pdf : exercises%.tex instructions.tex
{ echo "\\documentclass[answers,12pt,a4paper,pdftex]{exam}"; sed -e '1d' $<; } > $(patsubst %.pdf,%.tex,$@)
pdflatex -interaction=scrollmode $(patsubst %.pdf,%.tex,$@) | tee /dev/stderr | fgrep -q "Rerun to get cross-references right" && pdflatex -interaction=scrollmode $(patsubst %.pdf,%.tex,$@) || true
rm $(patsubst %.pdf,%,$@).[!p]*
$(EXERCISES) : %.pdf : %.tex instructions.tex
pdflatex -interaction=scrollmode $< | tee /dev/stderr | fgrep -q "Rerun to get cross-references right" && pdflatex -interaction=scrollmode $< || true
watch :
while true; do ! make -q pdf && make pdf; sleep 0.5; done
watchexercises :
while true; do ! make -q exercises && make exercises; sleep 0.5; done
watchsolutions :
while true; do ! make -q solutions && make solutions; sleep 0.5; done
clean :
rm -f *~ *.aux *.log *.out
cleanup : clean
rm -f $(SOLUTIONS) $(EXERCISES)
include ../../exercises.mk

View File

@ -1,41 +0,0 @@
\vspace*{-8ex}
\begin{center}
\textbf{\Large Introduction to scientific computing}\\[1ex]
{\large Jan Grewe, Jan Benda}\\[-3ex]
Neuroethology lab \hfill --- \hfill Institute for Neurobiology \hfill --- \hfill \includegraphics[width=0.28\textwidth]{UT_WBMW_Black_RGB} \\
\end{center}
% \ifprintanswers%
% \else
% % Die folgenden Aufgaben dienen der Wiederholung, \"Ubung und
% % Selbstkontrolle und sollten eigenst\"andig bearbeitet und gel\"ost
% % werden. Die L\"osung soll in Form eines einzelnen Skriptes (m-files)
% % im ILIAS hochgeladen werden. Jede Aufgabe sollte in einer eigenen
% % ``Zelle'' gel\"ost sein. Die Zellen \textbf{m\"ussen} unabh\"angig
% % voneinander ausf\"uhrbar sein. Das Skript sollte nach dem Muster:
% % ``variablen\_datentypen\_\{nachname\}.m'' benannt werden
% % (z.B. variablen\_datentypen\_mueller.m).
% \begin{itemize}
% \item \"Uberzeuge dich von jeder einzelnen Zeile deines Codes, dass
% sie auch wirklich das macht, was sie machen soll! Teste dies mit
% kleinen Beispielen direkt in der Kommandozeile.
% \item Versuche die L\"osungen der Aufgaben m\"oglichst in
% sinnvolle kleine Funktionen herunterzubrechen.
% Sobald etwas \"ahnliches mehr als einmal berechnet werden soll,
% lohnt es sich eine Funktion daraus zu schreiben!
% \item Teste rechenintensive \code{for} Schleifen, Vektoren, Matrizen
% zuerst mit einer kleinen Anzahl von Wiederholungen oder kleiner
% Gr\"o{\ss}e, und benutze erst am Ende, wenn alles \"uberpr\"uft
% ist, eine gro{\ss}e Anzahl von Wiederholungen oder Elementen, um eine gute
% Statistik zu bekommen.
% \item Benutze die Hilfsfunktion von \code{matlab} (\code{help
% commando} oder \code{doc commando}) und das Internet, um
% herauszufinden, wie bestimmte \code{matlab} Funktionen zu verwenden
% sind und was f\"ur M\"oglichkeiten sie bieten.
% Auch zu inhaltlichen Konzepten bietet das Internet oft viele
% Antworten!
% \end{itemize}
% \fi

View File

@ -1,93 +1,23 @@
\documentclass[12pt,a4paper,pdftex]{exam}
\usepackage[german]{babel}
\usepackage{pslatex}
\usepackage[mediumspace,mediumqspace,Gray]{SIunits} % \ohm, \micro
\usepackage{xcolor}
\usepackage{graphicx}
\usepackage[breaklinks=true,bookmarks=true,bookmarksopen=true,pdfpagemode=UseNone,pdfstartview=FitH,colorlinks=true,citecolor=blue]{hyperref}
%%%%% layout %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage[left=20mm,right=20mm,top=25mm,bottom=25mm]{geometry}
\pagestyle{headandfoot}
\ifprintanswers
\newcommand{\stitle}{: Solutions}
\else
\newcommand{\stitle}{}
\fi
\header{{\bfseries\large Exercise 11\stitle}}{{\bfseries\large Maximum likelihood}}{{\bfseries\large January 7th, 2020}}
\firstpagefooter{Prof. Dr. Jan Benda}{Phone: 29 74573}{Email:
jan.benda@uni-tuebingen.de}
\runningfooter{}{\thepage}{}
\setlength{\baselineskip}{15pt}
\setlength{\parindent}{0.0cm}
\setlength{\parskip}{0.3cm}
\renewcommand{\baselinestretch}{1.15}
%%%%% listings %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{listings}
\lstset{
language=Matlab,
basicstyle=\ttfamily\footnotesize,
numbers=left,
numberstyle=\tiny,
title=\lstname,
showstringspaces=false,
commentstyle=\itshape\color{darkgray},
breaklines=true,
breakautoindent=true,
columns=flexible,
frame=single,
xleftmargin=1em,
xrightmargin=1em,
aboveskip=10pt
}
%%%%% math stuff: %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{amsmath}
\usepackage{amssymb}
\usepackage{bm}
\usepackage{dsfont}
\newcommand{\naZ}{\mathds{N}}
\newcommand{\gaZ}{\mathds{Z}}
\newcommand{\raZ}{\mathds{Q}}
\newcommand{\reZ}{\mathds{R}}
\newcommand{\reZp}{\mathds{R^+}}
\newcommand{\reZpN}{\mathds{R^+_0}}
\newcommand{\koZ}{\mathds{C}}
%%%%% page breaks %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\newcommand{\continue}{\ifprintanswers%
\else
\vfill\hspace*{\fill}$\rightarrow$\newpage%
\fi}
\newcommand{\continuepage}{\ifprintanswers%
\newpage
\else
\vfill\hspace*{\fill}$\rightarrow$\newpage%
\fi}
\newcommand{\newsolutionpage}{\ifprintanswers%
\newpage%
\else
\fi}
%%%%% new commands %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\newcommand{\qt}[1]{\textbf{#1}\\}
\newcommand{\pref}[1]{(\ref{#1})}
\newcommand{\extra}{--- Zusatzaufgabe ---\ \mbox{}}
\newcommand{\code}[1]{\texttt{#1}}
\newcommand{\exercisetopic}{Maximum Likelihood}
\newcommand{\exercisenum}{10}
\newcommand{\exercisedate}{January 12th, 2021}
\input{../../exercisesheader}
\firstpagefooter{Prof. Dr. Jan Benda}{}{jan.benda@uni-tuebingen.de}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{document}
\input{instructions}
\input{../../exercisestitle}
\begin{questions}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\question \qt{Read chapter 9 on ``Maximum likelihood estimation''!}\vspace{-3ex}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\question \qt{Maximum likelihood of the standard deviation}
Let's compute the likelihood and the log-likelihood for the estimation
@ -107,10 +37,11 @@ of the standard deviation.
\end{parts}
\begin{solution}
\lstinputlisting{mlestd.m}
\lstinputlisting[language={}]{mlestd.out}
\includegraphics[width=1\textwidth]{mlestd}\\
The more data the smaller the product of the probabilities ($\approx
p^n$ with $0 \le p < 1$) and the smaller the sum of the logarithms
p^n$ if $0 \le p < 1$) and the smaller the sum of the logarithms
of the probabilities ($\approx n\log p$, note that $\log p < 0$).
The product eventually gets smaller than the precision of the
@ -121,10 +52,10 @@ of the standard deviation.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\question \qt{Maximum-likelihood estimator of a line through the origin}
In the lecture we derived the following equation for an
maximum-likelihood estimate of the slope $\theta$ of a straight line
maximum-likelihood estimate of the slope $m$ of a straight line
through the origin fitted to $n$ pairs of data values $(x_i|y_i)$ with
standard deviation $\sigma_i$:
\[\theta = \frac{\sum_{i=1}^n \frac{x_i y_i}{\sigma_i^2}}{ \sum_{i=1}^n
\[ m = \frac{\sum_{i=1}^n \frac{x_i y_i}{\sigma_i^2}}{ \sum_{i=1}^n
\frac{x_i^2}{\sigma_i^2}} \]
\begin{parts}
\part \label{mleslopefunc} Write a function that takes two vectors
@ -175,7 +106,7 @@ normally-distributed data. Such parameter need to be estimated
numerically by means of maximum-likelihood from the data.
Let us demonstrate this approach by means of data that are drawn from a
gamma distribution,
gamma distribution.
\begin{parts}
\part Find out which \code{matlab} function computes the
probability-density function of the gamma distribution.
@ -193,7 +124,7 @@ gamma distribution,
\part Compute and plot a properly normalized histogram of these
random numbers.
\part Find out which \code{matlab} function fit a distribution to a
\part Find out which \code{matlab} function fits a distribution to a
vector of random numbers according to the maximum-likelihood method.
How do you need to use this function in order to fit a gamma
distribution to the data?

View File

@ -6,16 +6,19 @@ for k = 1:length(ns)
fprintf('\nn=%d\n', n);
% draw random numbers:
x = randn(n,1)*sigma+mu;
fprintf(' mean of the data is %.2f\n', mean(x))
fprintf(' standard deviation of the data is %.2f\n', std(x))
datamean = mean(x);
fprintf(' mean %.3f\n', datamean)
% we assume the mean to be given, therefore dof=n:
fprintf(' standard deviation %.3f\n', std(x, 1))
% standard deviation as parameter:
psigs = 1.0:0.01:3.0;
psigs = 1.0:0.001:3.0;
% matrix with the probabilities for each x and psigs:
lms = zeros(length(x), length(psigs));
for i=1:length(psigs)
psig = psigs(i);
p = exp(-0.5*((x-mu)/psig).^2.0)/sqrt(2.0*pi)/psig;
% same mean as for the standard deviation of the data:
p = exp(-0.5*((x-datamean)/psig).^2.0)/sqrt(2.0*pi)/psig;
lms(:,i) = p;
end
lm = prod(lms, 1); % likelihood
@ -24,8 +27,9 @@ for k = 1:length(ns)
if length(maxlm) > 1
maxlm = maxlm(1);
end
fprintf(' likelihood: standard deviation of the data is %.2f\n', maxlm)
fprintf(' log-likelihood: standard deviation of the data is %.2f\n', psigs(loglm==max(loglm)))
maxloglm = psigs(loglm==max(loglm));
fprintf(' likelihood: standard deviation %.3f\n', maxlm)
fprintf(' log-likelihood: standard deviation %.3f\n', maxloglm)
% plot likelihood of standard deviation:
subplot(2, 2, 2*k-1);

View File

@ -0,0 +1,11 @@
n=50
mean 3.468
standard deviation 1.833
likelihood: standard deviation 1.833
log-likelihood: standard deviation 1.833
n=1000
mean 2.993
standard deviation 2.077
likelihood: standard deviation 1.000
log-likelihood: standard deviation 2.077

View File

@ -20,12 +20,11 @@
\section{TODO}
\begin{itemize}
\item Fitting psychometric functions:
\item Fitting psychometric functions, logistic regression:
Variable $x_i$, responses $r_i$ either 0 or 1.
$p(x_i, \theta)$ is Weibull or Boltzmann function.
$p(x_i, \theta)$ is Weibull or Boltzmann or logistic function.
Likelihood is $L = \prod p(x_i, \theta)^{r_i} (1-p(x_i, \theta))^{1-r_i}$.
Use fminsearch for fitting.
\item GLM model fitting?
Use fminsearch for fitting? (see the sketch below)
\end{itemize}
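A minimal sketch of this idea (the logistic function, all names, and
the simulated data are only illustrative assumptions, not part of the
script collection):
\begin{pagelisting}[caption={Sketch: maximum-likelihood fit of a psychometric function.}]
% logistic psychometric function with threshold theta(1) and width theta(2):
psycho = @(x, theta) 1./(1 + exp(-(x - theta(1))/theta(2)));
% negative log-likelihood of binary responses r at stimulus values x:
negloglik = @(theta, x, r) -sum(r.*log(psycho(x, theta)) + ...
                                (1 - r).*log(1 - psycho(x, theta)));
x = repmat(linspace(-3.0, 3.0, 9)', 20, 1);  % stimulus values
r = rand(size(x)) < psycho(x, [0.5, 0.8]);   % simulated 0/1 responses
theta = fminsearch(@(theta) negloglik(theta, x, r), [0.0, 1.0])
\end{pagelisting}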
\end{document}

View File

@ -4,111 +4,132 @@
\label{maximumlikelihoodchapter}
\exercisechapter{Maximum likelihood estimation}
A common problem in statistics is to estimate from a probability
distribution one or more parameters $\theta$ that best describe the
data $x_1, x_2, \ldots x_n$. \enterm[maximum likelihood
estimator]{Maximum likelihood estimators} (\enterm[mle|see{maximum
The core task of statistics is to infer from measured data some
parameters describing the data. These parameters can be simply a mean,
a standard deviation, or any other parameter needed to describe the
distribution the data originate from, a correlation coefficient,
or some parameters of a function describing a particular dependence
between the data. The brain faces exactly the same problem. Given the
activity pattern of some neurons (the data) it needs to infer some
aspects (parameters) of the environment and the internal state of the
body in order to generate some useful behavior. One possible approach
to estimate parameters from data are \enterm[maximum likelihood
estimator]{maximum likelihood estimators} (\enterm[mle|see{maximum
likelihood estimator}]{mle},
\determ{Maximum-Likelihood-Sch\"atzer}) choose the parameters such
that they maximize the likelihood of the data $x_1, x_2, \ldots x_n$
to originate from the distribution.
\determ{Maximum-Likelihood-Sch\"atzer}). They choose the parameters
such that they maximize the likelihood of the specific data values to
originate from a specific distribution.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\section{Maximum Likelihood}
\section{Maximum likelihood}
Let $p(x|\theta)$ (to be read as ``probability(density) of $x$ given
$\theta$.'') be the probability (density) distribution of $x$ given the
parameters $\theta$. This could be the normal distribution
$\theta$.'') be the probability (density) distribution of data value $x$
given parameter values $\theta$. This could be the normal distribution
\begin{equation}
\label{normpdfmean}
p(x|\mu, \sigma) = \frac{1}{\sqrt{2\pi \sigma^2}}e^{-\frac{(x-\mu)^2}{2\sigma^2}}
\end{equation}
defined by the mean $\mu$ and the standard deviation $\sigma$ as
parameters $\theta$. If the $n$ independent observations of $x_1,
x_2, \ldots x_n$ originate from the same probability density
distribution (they are \enterm[i.i.d.|see{independent and identically
distributed}]{i.i.d.}, \enterm{independent and identically
distributed}) then the conditional probability $p(x_1,x_2, \ldots
x_n|\theta)$ of observing $x_1, x_2, \ldots x_n$ given some specific
parameter values $\theta$ is given by
parameters $\theta$. If the $n$ observations $x_1, x_2, \ldots, x_n$
are independent of each other and originate from the same probability
density distribution (they are \enterm[i.i.d.|see{independent and
identically distributed}]{i.i.d.}, \enterm{independent and
identically distributed}), then the conditional probability
$p(x_1,x_2, \ldots, x_n|\theta)$ of observing the particular data
values $x_1, x_2, \ldots, x_n$ given some specific parameter values
$\theta$ of the probability density is given by the product of the
probability densities of each data value:
\begin{equation}
p(x_1,x_2, \ldots x_n|\theta) = p(x_1|\theta) \cdot p(x_2|\theta)
\ldots p(x_n|\theta) = \prod_{i=1}^n p(x_i|\theta) \; .
\label{probdata}
p(x_1,x_2, \ldots, x_n|\theta) = p(x_1|\theta) \cdot p(x_2|\theta)
\ldots, p(x_n|\theta) = \prod_{i=1}^n p(x_i|\theta) \; .
\end{equation}
Vice versa, the \entermde{Likelihood}{likelihood} of the parameters $\theta$
given the observed data $x_1, x_2, \ldots x_n$ is
given the observed data $x_1, x_2, \ldots, x_n$ is
\begin{equation}
{\cal L}(\theta|x_1,x_2, \ldots x_n) = p(x_1,x_2, \ldots x_n|\theta) \; .
\label{likelihood}
{\cal L}(\theta|x_1,x_2, \ldots, x_n) = p(x_1,x_2, \ldots, x_n|\theta) \; .
\end{equation}
Note: the likelihood ${\cal L}$ is not a probability in the
Note that the likelihood ${\cal L}$ is not a probability in the
classic sense since it does not integrate to unity ($\int {\cal
L}(\theta|x_1,x_2, \ldots x_n) \, d\theta \ne 1$).
When applying maximum likelihood estimations we are interested in the
parameter values
L}(\theta|x_1,x_2, \ldots, x_n) \, d\theta \ne 1$). For given
observations $x_1, x_2, \ldots, x_n$, the likelihood
\eqref{likelihood} is a function of the parameters $\theta$. This
function has a global maximum for some specific parameter values. At
this maximum the probability \eqref{probdata} of observing the measured
data values is largest.
Maximum likelihood estimators just find the parameter values
\begin{equation}
\theta_{mle} = \text{argmax}_{\theta} {\cal L}(\theta|x_1,x_2, \ldots x_n)
\theta_{mle} = \text{argmax}_{\theta} {\cal L}(\theta|x_1,x_2, \ldots, x_n)
\end{equation}
that maximize the likelihood. $\text{argmax}_xf(x)$ is the value of
the argument $x$ for which the function $f(x)$ assumes its global
maximum. Thus, we search for the parameter values $\theta$ at which
the likelihood ${\cal L}(\theta)$ reaches its maximum. For these
paraemter values the measured data most likely originated from the
corresponding distribution.
that maximize the likelihood \eqref{likelihood}.
$\text{argmax}_xf(x)$ is the value of the argument $x$ for which the
function $f(x)$ assumes its global maximum. Thus, we search for the
parameter values $\theta$ at which the likelihood ${\cal L}(\theta)$
reaches its maximum. For these parameter values the measured data most
likely originated from the corresponding distribution.
The position of a function's maximum does not change when the values
of the function are transformed by a strictly monotonically increasing
function such as the logarithm. For numerical reasons and reasons that
we will discuss below, we search for the maximum of the logarithm of
the likelihood
(\entermde[likelihood!log-]{Likelihood!Log-}{log-likelihood}):
we discuss below, we instead search for the maximum of the logarithm
of the likelihood
(\entermde[likelihood!log-]{Likelihood!Log-}{log-likelihood})
\begin{eqnarray}
\theta_{mle} & = & \text{argmax}_{\theta}\; {\cal L}(\theta|x_1,x_2, \ldots x_n) \nonumber \\
& = & \text{argmax}_{\theta}\; \log {\cal L}(\theta|x_1,x_2, \ldots x_n) \nonumber \\
\theta_{mle} & = & \text{argmax}_{\theta}\; {\cal L}(\theta|x_1,x_2, \ldots, x_n) \nonumber \\
& = & \text{argmax}_{\theta}\; \log {\cal L}(\theta|x_1,x_2, \ldots, x_n) \nonumber \\
& = & \text{argmax}_{\theta}\; \log \prod_{i=1}^n p(x_i|\theta) \nonumber \\
& = & \text{argmax}_{\theta}\; \sum_{i=1}^n \log p(x_i|\theta) \label{loglikelihood}
\end{eqnarray}
which is the sum of the logarithms of the probabilities of each
observation. Let's illustrate the concept of maximum likelihood
estimation on the arithmetic mean.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\subsection{Example: the arithmetic mean}
Suppose that the measurements $x_1, x_2, \ldots x_n$ originate from a
normal distribution \eqnref{normpdfmean} and we consider the mean
$\mu$ as the only parameter $\theta$. Which value of $\theta$
maximizes the likelihood of the data?
\subsection{Arithmetic mean}
Suppose that the measurements $x_1, x_2, \ldots, x_n$ originate from a
normal distribution \eqref{normpdfmean} and we do not know the
population mean $\mu$ of the normal distribution
(\figrefb{mlemeanfig}). In this setting $\mu$ is the only parameter
$\theta$. Which value of $\mu$ maximizes the likelihood of the data?
\begin{figure}[t]
\includegraphics[width=1\textwidth]{mlemean}
\titlecaption{\label{mlemeanfig} Maximum likelihood estimation of
the mean.}{Top: The measured data (blue dots) together with three
different possible normal distributions with different means
(arrows) the data could have originated from. Bottom left: the
likelihood as a function of $\theta$ i.e. the mean. It is maximal
at a value of $\theta = 2$. Bottom right: the
log-likelihood. Taking the logarithm does not change the position
of the maximum.}
normal distributions differing in their means (arrows) from which
the data could have originated. Bottom left: the likelihood
as a function of the parameter $\mu$. For the data it is maximal
at a value of $\mu = 2$. Bottom right: the log-likelihood. Taking
the logarithm does not change the position of the maximum.}
\end{figure}
The log-likelihood \eqnref{loglikelihood}
With the normal distribution \eqref{normpdfmean} and applying
logarithmic identities, the log-likelihood \eqref{loglikelihood} reads
\begin{eqnarray}
\log {\cal L}(\theta|x_1,x_2, \ldots x_n)
& = & \sum_{i=1}^n \log \frac{1}{\sqrt{2\pi \sigma^2}}e^{-\frac{(x_i-\theta)^2}{2\sigma^2}} \nonumber \\
& = & \sum_{i=1}^n - \log \sqrt{2\pi \sigma^2} -\frac{(x_i-\theta)^2}{2\sigma^2} \; .
\log {\cal L}(\mu|x_1,x_2, \ldots, x_n)
& = & \sum_{i=1}^n \log \frac{1}{\sqrt{2\pi \sigma^2}}e^{-\frac{(x_i-\mu)^2}{2\sigma^2}} \nonumber \\
& = & \sum_{i=1}^n - \log \sqrt{2\pi \sigma^2} -\frac{(x_i-\mu)^2}{2\sigma^2} \; .
\end{eqnarray}
Since the logarithm is the inverse function of the exponential
($\log(e^x)=x$), taking the logarithm removes the exponential from the
normal distribution. To calculate the maximum of the log-likelihood,
we need to take the derivative with respect to $\theta$ and set it to
zero:
normal distribution. This is the second reason why it is useful to
maximize the log-likelihood. To calculate the maximum of the
log-likelihood, we need to take the derivative with respect to $\mu$
and set it to zero:
\begin{eqnarray}
\frac{\text{d}}{\text{d}\theta} \log {\cal L}(\theta|x_1,x_2, \ldots x_n) & = & \sum_{i=1}^n - \frac{2(x_i-\theta)}{2\sigma^2} \;\; = \;\; 0 \nonumber \\
\Leftrightarrow \quad \sum_{i=1}^n x_i - \sum_{i=1}^n \theta & = & 0 \nonumber \\
\Leftrightarrow \quad n \theta & = & \sum_{i=1}^n x_i \nonumber \\
\Leftrightarrow \quad \theta & = & \frac{1}{n} \sum_{i=1}^n x_i \;\; = \;\; \bar x
\frac{\text{d}}{\text{d}\mu} \log {\cal L}(\mu|x_1,x_2, \ldots, x_n) & = & \sum_{i=1}^n - \frac{\text{d}}{\text{d}\mu} \log \sqrt{2\pi \sigma^2} - \frac{\text{d}}{\text{d}\mu} \frac{(x_i-\mu)^2}{2\sigma^2} \;\; = \;\; 0 \nonumber \\
\Leftrightarrow \quad \sum_{i=1}^n - \frac{2(x_i-\mu)}{2\sigma^2} & = & 0 \nonumber \\
\Leftrightarrow \quad \sum_{i=1}^n x_i - \sum_{i=1}^n \mu & = & 0 \nonumber \\
\Leftrightarrow \quad n \mu & = & \sum_{i=1}^n x_i \nonumber \\
\Leftrightarrow \quad \mu & = & \frac{1}{n} \sum_{i=1}^n x_i \;\; = \;\; \bar x \label{arithmeticmean}
\end{eqnarray}
Thus, the maximum likelihood estimator is the arithmetic mean. That
is, the arithmetic mean maximizes the likelihood that the data
originate from a normal distribution centered at the arithmetic mean
Thus, the maximum likelihood estimator of the population mean of
normally distributed data is the arithmetic mean. That is, the
arithmetic mean maximizes the likelihood that the data originate from
a normal distribution centered at the arithmetic mean
(\figref{mlemeanfig}). Equivalently, the standard deviation computed
from the data maximizes the likelihood that the data were generated
from a normal distribution with this standard deviation.
@ -123,6 +144,17 @@ from a normal distribution with this standard deviation.
the maxima with the mean calculated from the data.
\end{exercise}
Comparing the values of the likelihood with those of the
log-likelihood shown in \figref{mlemeanfig} reveals the numerical
reason for taking the logarithm of the likelihood. The likelihood
values can get very small, because we multiply many, potentially small
probability densities with each other. The likelihood quickly gets
smaller than the smallest number a floating point variable of a
computer can represent. Try it by increasing the number of data values
in the exercise. Taking the logarithm avoids this problem. The
log-likelihood results in well-behaved numbers that the computer can
handle.
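The underflow can be checked directly on the command line. A minimal
sketch (the variable names are only for illustration):
\begin{pagelisting}[caption={Underflow of the likelihood.}]
x = randn(10000, 1);            % many standard-normal data values
p = exp(-0.5*x.^2)/sqrt(2*pi);  % probability density of each data value
prod(p)                         % likelihood: underflows to zero
sum(log(p))                     % log-likelihood: a perfectly ordinary number
\end{pagelisting}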
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\section{Fitting probability distributions}
@ -130,32 +162,39 @@ Consider normally distributed data with unknown mean and standard
deviation. From the considerations above we just have seen that a
Gaussian distribution with mean at the arithmetic mean and standard
deviation equal to the standard deviation computed from the data is
the best Gaussian distribution that fits the data best in a maximum
likelihood sense, i.e. the likelihood that the data were generated
from this distribution is the largest. Fitting a Gaussian distribution
to data is very simple: just compute the two parameter of the Gaussian
distribution as the arithmetic mean and a standard deviation directly
from the data.
For non-Gaussian distributions (e.g. a Gamma-distribution), however,
such simple analytical expressions for the parameters of the
distribution do not exist, e.g. the shape parameter of a
\entermde[distribution!Gamma-]{Verteilung!Gamma-}{Gamma-distribution}. How
do we fit such a distribution to some data? That is, how should we
compute the values of the parameters of the distribution, given the
data?
A first guess could be to fit the probability density function by
minimization of the squared difference to a histogram of the measured
data. For several reasons this is, however, not the method of choice:
(i) Probability densities can only be positive which leads, for small
values in particular, to asymmetric distributions. (ii) The values of
a histogram estimating the density are not independent because the
integral over a density is unity. The two basic assumptions of
normally distributed and independent samples, which are a prerequisite
make the minimization of the squared difference \eqnref{chisqmin} to a
maximum likelihood estimation, are violated. (iii) The histogram
strongly depends on the chosen bin size \figref{mlepdffig}).
the Gaussian that fits the data best in a maximum likelihood sense,
i.e. the likelihood that the data were generated from this
distribution is the largest. Fitting a Gaussian distribution to data
is very simple: just compute the two parameters of the Gaussian
distribution, $\mu$ and $\sigma$, as the arithmetic mean and the
standard deviation, respectively, directly from the data.
For non-Gaussian distributions, for example a
\entermde[distribution!Gamma-]{Verteilung!Gamma-}{Gamma-distribution}
\begin{equation}
\label{gammapdf}
p(x|\alpha,\beta) \sim x^{\alpha-1}e^{-\beta x}
\end{equation}
with a shape parameter $\alpha$ and a rate parameter $\beta$
(\figrefb{mlepdffig}), such simple analytical expressions for
estimating the parameters directly from the data do in general not
exist. How do we fit such a distribution to the data? That is,
how should we compute the values of the parameters of the
distribution, given the data?
A first guess could be to fit the probability density function by a
\enterm{least squares} fit to a normalized histogram of the measured data in
the same way as we fit a function to some data. For several reasons
this is, however, not the method of choice: (i) Probability densities
can only be positive which leads, in particular for small values, to
asymmetric distributions of the estimated histogram around the true
density. (ii) The values of a histogram estimating the density are not
independent because the integral over a density is unity. The two
basic assumptions of normally distributed and independent samples,
which are a prerequisite for making the minimization of the squared
difference a maximum likelihood estimation (see next section), are
violated. (iii) The estimation of the probability density by means of
a histogram strongly depends on the chosen bin size.
\begin{figure}[t]
\includegraphics[width=1\textwidth]{mlepdf}
@ -164,20 +203,19 @@ strongly depends on the chosen bin size \figref{mlepdffig}).
order Gamma-distribution. The maximum likelihood estimation of the
probability density function is shown in orange, the true pdf is
shown in red. Right: normalized histogram of the data together
with the real (red) and the fitted probability density
functions. The fit was done by minimizing the squared difference
to the histogram.}
with the true probability density (red) and the probability
density function obtained by a least squares fit to the
histogram.}
\end{figure}
Instead we should stay with maximum-likelihood estimation. Exactly in
the same way as we estimated the mean value of a Gaussian distribution
above, we can numerically fit the parameters of any type of
distribution directly from the data by means of maximizing the
likelihood. We simply search for the parameter $\theta$ of the
desired probability density function that maximizes the
log-likelihood. In general this is a non-linear optimization problem
that is solved with numerical methods such as the gradient descent
\matlabfun{mle()}.
likelihood. We simply search for the parameter values of the desired
probability density function that maximize the log-likelihood. In
general this is a non-linear optimization problem that is solved with
numerical methods such as the gradient descent \matlabfun{mle()}.
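Fitting a gamma distribution, for example, then takes only a few
lines of code. This is just a sketch assuming the Statistics Toolbox
and arbitrary parameter values; the details are the topic of the
following exercise:
\begin{pagelisting}[caption={Sketch of a maximum-likelihood fit of a gamma distribution.}]
x = gamrnd(2.0, 1.0, 1000, 1);          % gamma-distributed data (shape 2, scale 1)
phat = mle(x, 'distribution', 'gamma')  % ML estimates of shape and scale
\end{pagelisting}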
\begin{exercise}{mlegammafit.m}{mlegammafit.out}
Generate a sample of gamma-distributed random numbers and apply the
@ -190,46 +228,63 @@ that is solved with numerical methods such as the gradient descent
\section{Curve fitting}
When fitting a function of the form $f(x;\theta)$ to data pairs
$(x_i|y_i)$ one tries to adapt the parameter $\theta$ such that the
function best describes the data. With maximum likelihood we search
for the parameter value $\theta$ for which the likelihood that the data
were drawn from the corresponding function is maximal. If we assume
that the $y_i$ values are normally distributed around the function
values $f(x_i;\theta)$ with a standard deviation $\sigma_i$, the
log-likelihood is
$(x_i|y_i)$ one tries to adapt the parameters $\theta$ such that the
function best describes the data. In
chapter~\ref{gradientdescentchapter} we simply assumed that ``best''
means minimizing the squared distance between the data and the
function. With maximum likelihood we search for those parameter
values $\theta$ that maximize the likelihood of the data to be drawn
from the corresponding function.
If we assume that the $y_i$ values are normally distributed around the
function values $f(x_i;\theta)$ with a standard deviation $\sigma_i$,
the log-likelihood is
\begin{eqnarray}
\log {\cal L}(\theta|(x_1,y_1,\sigma_1), \ldots, (x_n,y_n,\sigma_n))
& = & \sum_{i=1}^n \log \frac{1}{\sqrt{2\pi \sigma_i^2}}e^{-\frac{(y_i-f(x_i;\theta))^2}{2\sigma_i^2}} \nonumber \\
& = & \sum_{i=1}^n - \log \sqrt{2\pi \sigma_i^2} -\frac{(y_i-f(x_i;\theta))^2}{2\sigma_i^2} \\
& = & \sum_{i=1}^n - \log \sqrt{2\pi \sigma_i^2} -\frac{(y_i-f(x_i;\theta))^2}{2\sigma_i^2}
\end{eqnarray}
The only difference to the previous example is that the averages in
the equations above are now given as the function values
$f(x_i;\theta)$. The parameter $\theta$ should be the one that
maximizes the log-likelihood. The first part of the sum is independent
of $\theta$ and can thus be ignored when computing the maximum:
The only difference to the previous example of the arithmetic mean is
that the means $\mu$ in the equations above are given by the function
values $f(x_i;\theta)$. The parameters $\theta$ should maximize the
log-likelihood. The first term in the sum is independent of $\theta$
and can be ignored when computing the maximum. From the second
term we pull out the constant factor $-\frac{1}{2}$:
\begin{eqnarray}
& = & - \frac{1}{2} \sum_{i=1}^n \left( \frac{y_i-f(x_i;\theta)}{\sigma_i} \right)^2
\end{eqnarray}
We can simplify further by inverting the sign and then searching for the
minimum. Also the factor $1/2$ can be ignored since it does not affect
the position of the minimum:
minimum. Also the factor $\frac{1}{2}$ can be ignored since it does
not affect the position of the minimum:
\begin{equation}
\label{chisqmin}
\theta_{mle} = \text{argmin}_{\theta} \; \sum_{i=1}^n \left( \frac{y_i-f(x_i;\theta)}{\sigma_i} \right)^2 \;\; = \;\; \text{argmin}_{\theta} \; \chi^2
\end{equation}
The sum of the squared differences normalized by the standard
deviation is also called $\chi^2$. The parameter $\theta$ which
minimizes the squared differences is thus the one that maximizes the
likelihood that the data actually originate from the given
function. Minimizing $\chi^2$ therefore is a maximum likelihood
estimation.
The sum of the squared differences between the $y$-data values and the
function values, normalized by the standard deviation of the data
around the function, is called $\chi^2$ (chi squared). The parameter
$\theta$ which minimizes the squared differences is thus the one that
maximizes the likelihood of the data to actually originate from the
given function.
Whether we minimize $\chi^2$ or the \enterm{mean squared error}
\eqref{meansquarederror} introduced in
chapter~\ref{gradientdescentchapter} does not matter. The latter is
the mean of the squared differences, $\chi^2$ is their sum. They
simply differ by the constant factor $n$, the number of data pairs,
which does not affect the position of the minimum. $\chi^2$ is more
general in that it allows for different standard deviations for each
data pair. If they are all the same ($\sigma_i = \sigma$), the common
standard deviation can be pulled out of the sum and also does not
influence the position of the minimum. Both \enterm{least squares} and
minimizing $\chi^2$ are maximum likelihood estimators of the
parameters $\theta$ of a function.
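This equivalence can be checked numerically. The following lines are a
minimal sketch (with made-up data and a common standard deviation
$\sigma$, not taken from the exercises) that evaluate both $\chi^2$ and
the mean squared error on a grid of candidate slopes and show that both
are minimal at the same slope:
\begin{lstlisting}
n = 100;                             % number of data pairs
sigma = 0.5;                         % same standard deviation for all pairs
x = 2.0*rand(1, n);                  % positions
y = 1.5*x + sigma*randn(1, n);       % data scattered around a line with slope 1.5
slopes = 0.0:0.01:3.0;               % candidate slopes
chisq = zeros(size(slopes));
msqerror = zeros(size(slopes));
for k = 1:length(slopes)
    chisq(k) = sum(((y - slopes(k)*x)/sigma).^2);   % chi squared
    msqerror(k) = mean((y - slopes(k)*x).^2);       % mean squared error
end
[~, kc] = min(chisq);
[~, km] = min(msqerror);
fprintf('chi^2 minimum at %.2f, mse minimum at %.2f\n', slopes(kc), slopes(km))
\end{lstlisting}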
From the mathematical considerations above we can see that the
minimization of the squared difference is a maximum-likelihood
estimation only if the data are normally distributed around the
function. In case of other distributions, the log-likelihood
\eqnref{loglikelihood} needs to be adapted accordingly and be
maximized respectively.
\eqref{loglikelihood} needs to be adapted accordingly.
\begin{figure}[t]
\includegraphics[width=1\textwidth]{mlepropline}
@ -242,26 +297,32 @@ maximized respectively.
the normal distribution of the data around the line (right histogram).}
\end{figure}
Let's go on and calculate the minimum \eqref{chisqmin} of $\chi^2$
analytically for a simple function.
\subsection{Example: simple proportionality}
The function of a line with slope $\theta$ through the origin is
\[ f(x) = \theta x \; . \]
The $\chi^2$-sum is thus
\[ \chi^2 = \sum_{i=1}^n \left( \frac{y_i-\theta x_i}{\sigma_i} \right)^2 \; . \]
To estimate the minimum we again take the first derivative with
respect to $\theta$ and equate it to zero:
\begin{eqnarray}
\frac{\text{d}}{\text{d}\theta}\chi^2 & = & \frac{\text{d}}{\text{d}\theta} \sum_{i=1}^n \left( \frac{y_i-\theta x_i}{\sigma_i} \right)^2 \nonumber \\
& = & \sum_{i=1}^n \frac{\text{d}}{\text{d}\theta} \left( \frac{y_i-\theta x_i}{\sigma_i} \right)^2 \nonumber \\
& = & -2 \sum_{i=1}^n \frac{x_i}{\sigma_i} \left( \frac{y_i-\theta x_i}{\sigma_i} \right) \nonumber \\
& = & -2 \sum_{i=1}^n \left( \frac{x_i y_i}{\sigma_i^2} - \theta \frac{x_i^2}{\sigma_i^2} \right) \;\; = \;\; 0 \nonumber \\
\Leftrightarrow \quad \theta \sum_{i=1}^n \frac{x_i^2}{\sigma_i^2} & = & \sum_{i=1}^n \frac{x_i y_i}{\sigma_i^2} \nonumber
\end{eqnarray}
\subsection{Straight line through the origin}
The function of a straight line with slope $m$ through the origin
is
\[ f(x) = m x \; . \]
With this specific function, $\chi^2$ reads
\[ \chi^2 = \sum_{i=1}^n \left( \frac{y_i-m x_i}{\sigma_i} \right)^2
\; . \] To calculate the minimum we take the first derivative with
respect to $m$ and equate it to zero:
\begin{eqnarray}
\Leftrightarrow \quad \theta & = & \frac{\sum_{i=1}^n \frac{x_i y_i}{\sigma_i^2}}{ \sum_{i=1}^n \frac{x_i^2}{\sigma_i^2}} \label{mleslope}
\frac{\text{d}}{\text{d}m}\chi^2 & = & \sum_{i=1}^n \frac{\text{d}}{\text{d}m} \left( \frac{y_i-m x_i}{\sigma_i} \right)^2 \nonumber \\
& = & -2 \sum_{i=1}^n \frac{x_i}{\sigma_i} \left( \frac{y_i-m x_i}{\sigma_i} \right) \nonumber \\
& = & -2 \sum_{i=1}^n \left( \frac{x_i y_i}{\sigma_i^2} - m \frac{x_i^2}{\sigma_i^2} \right) \;\; = \;\; 0 \nonumber \\
\Leftrightarrow \quad m \sum_{i=1}^n \frac{x_i^2}{\sigma_i^2} & = & \sum_{i=1}^n \frac{x_i y_i}{\sigma_i^2} \nonumber \\
\Leftrightarrow \quad m & = & \frac{\sum_{i=1}^n \frac{x_i y_i}{\sigma_i^2}}{ \sum_{i=1}^n \frac{x_i^2}{\sigma_i^2}} \label{mleslope}
\end{eqnarray}
This is an analytical expression for the estimation of the slope
$\theta$ of the regression line (\figref{mleproplinefig}).
This is an analytical expression for the estimation of the slope $m$
of the regression line (\figref{mleproplinefig}). We do not need to
apply numerical methods like the gradient descent to find the slope
that minimizes the squared differences. Instead, we can compute the
slope directly from the data by means of \eqnref{mleslope}, very much
like we calculate the mean of some data by means of the arithmetic
mean \eqref{arithmeticmean}.
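As a minimal sketch (on simulated data pairs with made-up individual
standard deviations), the slope follows from two sums over the data:
\begin{lstlisting}
n = 50;
x = 5.0*rand(1, n);                      % positions
sigmas = 0.2 + 0.3*rand(1, n);           % individual standard deviations
y = 0.8*x + sigmas.*randn(1, n);         % data around a line with slope 0.8
m = sum(x.*y./sigmas.^2)/sum(x.^2./sigmas.^2);   % slope from eq. (mleslope)
fprintf('estimated slope m = %.3f\n', m)
\end{lstlisting}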
\subsection{Linear and non-linear fits}
A gradient descent, as we have done in the previous chapter, is not
@ -276,47 +337,68 @@ or the coefficients $a_k$ of a polynomial
\matlabfun{polyfit()}.
Parameters that are non-linearly combined cannot be calculated
analytically. Consider for example the rate $\lambda$ of the
exponential decay
analytically. Consider, for example, the factor $c$ and the rate
$\lambda$ of the exponential decay
\[ y = c \cdot e^{\lambda x} \quad , \quad c, \lambda \in \reZ \; . \]
Such cases require numerical solutions for the optimization of the
cost function, e.g. the gradient descent \matlabfun{lsqcurvefit()}.
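A minimal sketch of such a numerical fit of the exponential decay,
assuming \matlabfun{lsqcurvefit()} from the Optimization Toolbox is
available, could look like this (data and initial values are made up
for illustration):
\begin{lstlisting}
xdata = 0:0.1:5.0;
ydata = 2.0*exp(-1.5*xdata) + 0.05*randn(size(xdata));  % noisy decay, c=2, lambda=-1.5
fdecay = @(p, x) p(1)*exp(p(2)*x);       % p(1) is c, p(2) is lambda
p0 = [1.0, -1.0];                        % initial guess for c and lambda
pest = lsqcurvefit(fdecay, p0, xdata, ydata);
fprintf('c = %.2f, lambda = %.2f\n', pest(1), pest(2))
\end{lstlisting}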
\subsection{Relation between slope and correlation coefficient}
Let us have a closer look on \eqnref{mleslope}. If the standard
deviation of the data $\sigma_i$ is the same for each data point,
i.e. $\sigma_i = \sigma_j \; \forall \; i, j$, the standard deviation drops
out of \eqnref{mleslope} and we get
Let us have a closer look on \eqnref{mleslope} for the slope of a line
through the origin. If the standard deviation of the data $\sigma_i$
is the same for each data point, i.e. $\sigma_i = \sigma_j \; \forall
\; i, j$, the standard deviation drops out and \eqnref{mleslope}
simplifies to
\begin{equation}
\label{whitemleslope}
\theta = \frac{\sum_{i=1}^n x_i y_i}{\sum_{i=1}^n x_i^2}
m = \frac{\sum_{i=1}^n x_i y_i}{\sum_{i=1}^n x_i^2}
\end{equation}
To see what this expression is, we need to standardize the data. We
make the data mean free and normalize them to their standard
deviation, i.e. $x \mapsto (x - \bar x)/\sigma_x$. The resulting
numbers are also called \entermde[z-values]{z-Wert}{$z$-values} or
$z$-scores and they have the property $\bar x = 0$ and $\sigma_x =
1$. $z$-scores are often used in Biology to make quantities that
differ in their units comparable. For standardized data the variance
To see what the numerator and the denominator of this expression
describe, we need to subtract from the data their mean value. We make
the data mean free, i.e. $x \mapsto x - \bar x$ and $y \mapsto y -
\bar y$. For mean-free data the variance
\begin{equation}
\sigma_x^2 = \frac{1}{n} \sum_{i=1}^n (x_i - \bar x)^2 = \frac{1}{n} \sum_{i=1}^n x_i^2 = 1
\sigma_x^2 = \frac{1}{n} \sum_{i=1}^n (x_i - \bar x)^2 = \frac{1}{n} \sum_{i=1}^n x_i^2
\end{equation}
is given by the mean squared data and equals one.
The covariance between $x$ and $y$ also simplifies to
is given by the mean squared data. In the same way, the covariance
between $x$ and $y$ simplifies to
\begin{equation}
\text{cov}(x, y) = \frac{1}{n} \sum_{i=1}^n (x_i - \bar x)(y_i -
\bar y) =\frac{1}{n} \sum_{i=1}^n x_i y_i
\bar y) =\frac{1}{n} \sum_{i=1}^n x_i y_i \; ,
\end{equation}
the averaged product between pairs of $x$ and $y$ values. Multiplying
both the numerator and the denominator of \eqnref{whitemleslope} by $\frac{1}{n}$ we get
\begin{equation}
\label{meanfreeslope}
m = \frac{\frac{1}{n}\sum_{i=1}^n x_i y_i}{\frac{1}{n}\sum_{i=1}^n x_i^2}
= \frac{\text{cov}(x, y)}{\sigma_x^2}
\end{equation}
the averaged product between pairs of $x$ and $y$ values. Recall that
the correlation coefficient $r_{x,y}$,
\eqnref{correlationcoefficient}, is the covariance normalized by the
product of the standard deviations of $x$ and $y$,
respectively. Therefore, in case the standard deviations equal one,
the correlation coefficient is identical to the covariance.
Consequently, for standardized data the slope of the regression line
\eqnref{whitemleslope} simplifies to
Recall that the correlation coefficient $r_{x,y}$ is the covariance
normalized by the product of the standard deviations of $x$ and $y$:
\begin{equation}
\theta = \frac{1}{n} \sum_{i=1}^n x_i y_i = \text{cov}(x,y) = r_{x,y}
\label{meanfreecorrcoef}
r_{x,y} = \frac{\text{cov}(x, y)}{\sigma_x\sigma_y}
\end{equation}
If furthermore the standard deviations of $x$ and $y$ are the same,
i.e. $\sigma_x = \sigma_y$, the slope of a line through the origin is
identical to the correlation coefficient.
This relation between slope and correlation coefficient in particular
holds for standardized data that have been made mean free and have
been normalized by their standard deviation, i.e. $x \mapsto (x - \bar
x)/\sigma_x$ and $y \mapsto (y - \bar y)/\sigma_y$. The resulting
numbers are called \entermde[z-value]{z-Wert}{$z$-values} or
\enterm[z-score]{$z$-scores}. Their mean equals zero and their
standard deviation one. $z$-scores are often used to make quantities
that differ in their units comparable. For standardized data the
denominators for both the slope \eqref{meanfreeslope} and the
correlation coefficient \eqref{meanfreecorrcoef} equal one. For
standardized data, both the slope of the regression line and the
correlation coefficient reduce to the covariance between the $x$ and
$y$ data:
\begin{equation}
m = \frac{1}{n} \sum_{i=1}^n x_i y_i = \text{cov}(x,y) = r_{x,y}
\end{equation}
For standardized data the slope of the regression line is the same as the
correlation coefficient!
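This can be checked with a few lines of code on simulated data (a
sketch, not part of the exercises):
\begin{lstlisting}
n = 200;
x = randn(1, n);
y = 0.5*x + randn(1, n);                 % correlated data
zx = (x - mean(x))/std(x);               % z-scores of x
zy = (y - mean(y))/std(y);               % z-scores of y
m = sum(zx.*zy)/sum(zx.^2);              % slope of a line through the origin
r = corrcoef(x, y);                      % correlation coefficient matrix
fprintf('slope m = %.3f, r = %.3f\n', m, r(1, 2))
\end{lstlisting}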
@ -324,63 +406,100 @@ correlation coefficient!
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\section{Neural coding}
In sensory systems certain aspects of the environment are encoded in
the neuronal activity of populations of neurons. One example of such a
population code is the tuning of neurons in the primary visual cortex
(V1) to the orientation of an edge or bar in the visual
stimulus. Different neurons respond best to different edge
orientations. Traditionally, such a tuning is measured by analyzing
the neuronal response strength (e.g. the firing rate) as a function of
the orientation of a black bar and is illustrated and summarized
with the so called \enterm{tuning-curve} (\determ{Abstimmkurve},
figure~\ref{mlecodingfig}, top).
Maximum likelihood estimators are not only a central concept for data
analysis. Neural systems face the very same problem. They also need to
estimate parameters of the internal and external environment based on
the activity of neurons.
\begin{figure}[tp]
\includegraphics[width=1\textwidth]{mlecoding}
\titlecaption{\label{mlecodingfig} Maximum likelihood estimation of
a stimulus parameter from neuronal activity.}{Top: Tuning curve of
an individual neuron as a function of the stimulus orientation (a
dark bar in front of a white background). The stimulus that evokes
the strongest activity in that neuron is the bar with the vertical
orientation (arrow, $\phi_i=90$\,\degree). The red area indicates
the variability of the neuronal activity $p(r|\phi)$ around the
tuning curve. Center: In a population of neurons, each neuron may
have a different tuning curve (colors). A specific stimulus (the
vertical bar) activates the individual neurons of the population
in a specific way (dots). Bottom: The log-likelihood of the
activity pattern will be maximized close to the real stimulus
a stimulus parameter from neuronal activity.}{Top: Tuning curve
$r_i(\phi;c,\phi_i)$ of a specific neuron $i$ as a function of the
orientation $\phi$ of a stimulus, a dark bar in front of a white
background. The preferred stimulus $\phi_i$ of that neuron, the
one that evokes the strongest firing rate response, is a bar with
vertical orientation (arrow, $\phi_i=90$\,\degree). The width of
the red area indicates the variability of the neuronal activity
$\sigma_i$ around the tuning curve. Center: In a population of
neurons, each neuron may have a different tuning curve (colors). A
specific stimulus activates the individual neurons of the
population in a specific way (dots). Bottom: The log-likelihood of
the activity pattern has a maximum close to the real stimulus
orientation.}
\end{figure}
In sensory systems certain aspects of the environment are encoded in
the neuronal activity of populations of neurons. One example of such a
population code is the tuning of neurons in the primary visual cortex
(V1) to the orientation of a bar in the visual stimulus. Different
neurons respond best to different bar orientations. Traditionally,
such a tuning is measured by analyzing the neuronal response strength
(e.g. the firing rate) as a function of the orientation of a black bar
and is illustrated and summarized with the so-called
\enterm{tuning-curve} (\determ{Abstimmkurve},
figure~\ref{mlecodingfig}, top).
The brain, however, is confronted with the inverse problem: given a
certain activity pattern in the neuronal population, what is the
stimulus (here the orientation of an edge)? In the sense of maximum
likelihood, a possible answer to this question would be: the stimulus
for which the particular activity pattern is most likely given the
tuning of the neurons.
stimulus? In our example, what is the orientation of the bar? In the
sense of maximum likelihood, a possible answer to this question would
be: the stimulus for which the particular activity pattern is most
likely given the tuning of the neurons and the noise (standard
deviation) of the responses.
Let's stay with the example of the orientation tuning in V1. The
tuning $\Omega_i(\phi)$ of the neurons $i$ to the preferred edge
orientation $\phi_i$ can be well described using a van-Mises function
(the Gaussian function on a cyclic x-axis) (\figref{mlecodingfig}):
tuning of the firing rate $r_i(\phi)$ of neuron $i$ to the preferred
bar orientation $\phi_i$ can be well described using a von Mises
function (the Gaussian function on a cyclic x-axis)
(\figref{mlecodingfig}):
\begin{equation}
\Omega_i(\phi) = c \cdot e^{\cos(2(\phi-\phi_i))} \quad , \quad c \in \reZ
\label{bartuningcurve}
r_i(\phi; c, \phi_i) = c \cdot e^{\cos(2(\phi-\phi_i))} \quad , \quad c > 0
\end{equation}
Note the factor two in the cosine, because the response of the neuron
is the same for a bar turned by 180\,\degree.
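A few lines of code illustrate this periodicity (a sketch with an
arbitrarily chosen preferred orientation and $c=1$):
\begin{lstlisting}
phi = 0.0:0.01:2.0*pi;                   % bar orientations in radian
phii = 0.5*pi;                           % preferred orientation (90 degree)
r = exp(cos(2.0*(phi - phii)));          % tuning curve with c = 1
rshifted = exp(cos(2.0*(phi - pi - phii)));   % bar rotated by 180 degree
fprintf('maximum difference: %g\n', max(abs(r - rshifted)))
\end{lstlisting}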
If we approximate the neuronal activity by a normal distribution
around the tuning curve with a standard deviation $\sigma=\Omega/4$,
which is proportional to $\Omega$, then the probability $p_i(r|\phi)$
of the $i$-th neuron showing the activity $r$ given a certain
orientation $\phi$ of an edge is given by
around the tuning curve with a standard deviation $\sigma_i$, then the
probability $p_i(r|\phi)$ of the $i$-th neuron having the observed
activity $r$, given a certain orientation $\phi$ of a bar is
\begin{equation}
p_i(r|\phi) = \frac{1}{\sqrt{2\pi}\Omega_i(\phi)/4} e^{-\frac{1}{2}\left(\frac{r-\Omega_i(\phi)}{\Omega_i(\phi)/4}\right)^2} \; .
p_i(r|\phi) = \frac{1}{\sqrt{2\pi\sigma_i^2}} e^{-\frac{1}{2}\left(\frac{r-r_i(\phi; c, \phi_i)}{\sigma_i}\right)^2} \; .
\end{equation}
The log-likelihood of the edge orientation $\phi$ given the
The log-likelihood of the bar orientation $\phi$ given the
activity pattern in the population $r_1$, $r_2$, ... $r_n$ is thus
\begin{equation}
{\cal L}(\phi|r_1, r_2, \ldots r_n) = \sum_{i=1}^n \log p_i(r_i|\phi)
{\cal L}(\phi|r_1, r_2, \ldots, r_n) = \sum_{i=1}^n \log p_i(r_i|\phi)
\end{equation}
The angle $\phi$ that maximizes this likelihood is then an estimate of
the orientation of the edge.
The angle $\phi_{mle}$ that maximizes this likelihood is an estimate
of the true orientation of the bar (\figref{mlecodingfig}).
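The following sketch illustrates this estimation on simulated
responses. The number of neurons, their preferred orientations, and the
common noise level are made up for the example and do not correspond to
the values used for \figref{mlecodingfig}:
\begin{lstlisting}
phis = pi*(1:8)/9;                       % preferred orientations of 8 neurons
c = 1.0;                                 % amplitude of the tuning curves
sigma = 0.2;                             % common response variability
phitrue = 0.4*pi;                        % true orientation of the bar
r = c*exp(cos(2.0*(phitrue - phis))) + sigma*randn(size(phis));  % observed rates
phigrid = linspace(0.0, pi, 200);        % candidate orientations
logl = zeros(size(phigrid));
for k = 1:length(phigrid)
    ri = c*exp(cos(2.0*(phigrid(k) - phis)));    % expected rates
    logl(k) = sum(-0.5*log(2.0*pi*sigma^2) - 0.5*((r - ri)/sigma).^2);
end
[~, kmax] = max(logl);
fprintf('true: %.1f degree, estimated: %.1f degree\n', ...
        180.0*phitrue/pi, 180.0*phigrid(kmax)/pi)
\end{lstlisting}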
The noisiness of the neuron's responses as quantified by $\sigma_i$
usually is a function of the neuron's mean firing rate $r_i$:
$\sigma_i = \sigma_i(r_i)$. This dependence has a major impact on the
maximum likelihood estimation. Usually, the stronger the response of a
neuron, i.e. the higher its firing rate, the lower the noise. In this case,
strong responses have a stronger influence on the position of the
maximum of the log-likelihood.
Whether neural systems really implement maximum likelihood estimators
is another question. There are many ways in which a stimulus property can
be read out from the activity of a population of neurons. The simplest
one is a ``winner-takes-all'' rule. The preferred stimulus
parameter of the neuron with the strongest response is the
estimate. Another possibility is to compute a population vector. The
estimated stimulus parameter is the sum of the preferred stimulus
parameters of all neurons in the population weighted by the activity
of the neurons. In case of angular stimulus parameters, like the
orientation of the bar in our example, a vector pointing in the
direction of the angle is used instead of the angle to incorporate the
cyclic nature of the parameter.
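Both readouts can be sketched in a few lines of code. The snippet
reuses the simulated responses \varcode{r} and preferred orientations
\varcode{phis} from the previous sketch and doubles the angles to
account for the 180\,\degree{} periodicity of the orientation:
\begin{lstlisting}
% winner-takes-all: preferred orientation of the most active neuron
[~, kwin] = max(r);
phiwta = phis(kwin);
% population vector: activity-weighted sum of unit vectors at doubled angles
pv = sum(r.*exp(2.0i*phis));
phipv = 0.5*mod(angle(pv), 2.0*pi);      % back to an orientation in [0, pi)
fprintf('winner takes all: %.1f degree, population vector: %.1f degree\n', ...
        180.0*phiwta/pi, 180.0*phipv/pi)
\end{lstlisting}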
Using maximum likelihood estimators for analyzing neural population
activity gives us an upper bound on how well a stimulus parameter is
encoded in the activity of the neurons. The brain would not be able to
do better.
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

View File

@ -5,11 +5,9 @@ import matplotlib.gridspec as gridspec
from plotstyle import *
rng = np.random.RandomState(4637281)
lmarg=0.1
rmarg=0.1
fig = plt.figure(figsize=cm_size(figure_width, 2.8*figure_height))
spec = gridspec.GridSpec(nrows=4, ncols=1, height_ratios=[4, 4, 1, 3], hspace=0.2,
spec = gridspec.GridSpec(nrows=4, ncols=1, height_ratios=[4, 5, 1, 3], hspace=0.2,
**adjust_fs(fig, left=4.0))
ax = fig.add_subplot(spec[0, 0])
ax.set_xlim(0.0, np.pi)
@ -17,7 +15,7 @@ ax.set_xticks(np.arange(0.125*np.pi, 1.*np.pi, 0.125*np.pi))
ax.set_xticklabels([])
ax.set_ylim(0.0, 3.5)
ax.yaxis.set_major_locator(plt.NullLocator())
ax.text(-0.2, 0.5*3.5, 'Activity', rotation='vertical', va='center')
ax.text(-0.2, 0.5*3.5, 'Firing rate', rotation='vertical', va='center')
ax.annotate('Tuning curve',
xy=(0.42*np.pi, 2.5), xycoords='data',
xytext=(0.3*np.pi, 3.2), textcoords='data', ha='right',
@ -32,27 +30,34 @@ ax.text(0.52*np.pi, 0.7, 'preferred\norientation')
xx = np.arange(0.0, 2.0*np.pi, 0.01)
pp = 0.5*np.pi
yy = np.exp(np.cos(2.0*(xx+pp)))
ax.fill_between(xx, yy+0.25*yy, yy-0.25*yy, **fsBa)
ss = 1.0/(0.75+2.0*yy)
ax.fill_between(xx, yy+ss, yy-ss, **fsBa)
ax.plot(xx, yy, **lsB)
ax = fig.add_subplot(spec[1, 0])
ax.set_xlim(0.0, np.pi)
ax.set_xticks(np.arange(0.125*np.pi, 1.*np.pi, 0.125*np.pi))
ax.set_xticklabels([])
ax.set_ylim(0.0, 3.0)
ax.set_ylim(-0.1, 3.5)
ax.yaxis.set_major_locator(plt.NullLocator())
ax.text(-0.2, 0.5*3.5, 'Activity', rotation='vertical', va='center')
ax.text(-0.2, 0.5*3.5, 'Firing rate', rotation='vertical', va='center')
xx = np.arange(0.0, 1.0*np.pi, 0.01)
prefphases = np.arange(0.125*np.pi, 1.*np.pi, 0.125*np.pi)
responses = []
xresponse = 0.475*np.pi
sigmas = []
xresponse = 0.41*np.pi
ax.annotate('Orientation of bar',
xy=(xresponse, -0.1), xycoords='data',
xytext=(xresponse, 3.1), textcoords='data', ha='left', zorder=-10,
arrowprops=dict(arrowstyle="->", relpos=(0.0,0.0)) )
for pp, ls, ps in zip(prefphases, [lsE, lsC, lsD, lsB, lsD, lsC, lsE],
[psE, psC, psD, psB, psD, psC, psE]) :
yy = np.exp(np.cos(2.0*(xx+pp)))
#ax.plot(xx, yy, color=cm.autumn(2.0*np.abs(pp/np.pi-0.5), 1))
ax.plot(xx, yy, **ls)
y = np.exp(np.cos(2.0*(xresponse+pp)))
responses.append(y + rng.randn()*0.25*y)
s = 1.0/(0.75+2.0*y)
responses.append(y + rng.randn()*s)
sigmas.append(s)
ax.plot(xresponse, y, **ps)
responses = np.array(responses)
@ -68,25 +73,23 @@ ax = fig.add_subplot(spec[3, 0])
ax.set_xlim(0.0, np.pi)
ax.set_xticks(np.arange(0.125*np.pi, 1.*np.pi, 0.125*np.pi))
ax.set_xticklabels([])
ax.set_ylim(-1600, 0)
ax.set_ylim(-210, 0)
ax.yaxis.set_major_locator(plt.NullLocator())
ax.set_xlabel('Orientation')
ax.text(-0.2, -800, 'Log-Likelihood', rotation='vertical', va='center')
ax.text(-0.2, -100, 'Log-Likelihood', rotation='vertical', va='center')
phases = np.linspace(0.0, 1.1*np.pi, 100)
probs = np.zeros((len(responses), len(phases)))
for k, (pp, r) in enumerate(zip(prefphases, responses)) :
for k, (pp, r, sigma) in enumerate(zip(prefphases, responses, sigmas)) :
y = np.exp(np.cos(2.0*(phases+pp)))
sigma = 0.1*y
probs[k,:] = np.exp(-0.5*((r-y)/sigma)**2.0)/np.sqrt(2.0*np.pi)/sigma
probs[k,:] = np.exp(-0.5*((r-y)/sigma)**2.0)/np.sqrt(2.0*np.pi*sigma**2)
loglikelihood = np.sum(np.log(probs), 0)
maxl = np.max(loglikelihood)
maxp = phases[np.argmax(loglikelihood)]
ax.annotate('',
xy=(maxp, -1600), xycoords='data',
xytext=(maxp, -30), textcoords='data',
xy=(maxp, -210), xycoords='data',
xytext=(maxp, -10), textcoords='data',
arrowprops=dict(arrowstyle="->", relpos=(0.5,0.5),
connectionstyle="angle3,angleA=80,angleB=90") )
ax.text(maxp+0.05, -1100, 'most likely\norientation\ngiven the responses')
ax.plot(phases, loglikelihood, **lsA)
ax.text(maxp+0.05, -150, 'most likely\norientation\ngiven the responses')
ax.plot(phases, loglikelihood, clip_on=False, **lsA)
plt.savefig('mlecoding.pdf')

View File

@ -52,7 +52,7 @@ for i, theta in enumerate(thetas) :
p=np.prod(ps,axis=0)
# plot it:
ax = fig.add_subplot(spec[1, 0])
ax.set_xlabel(r'Parameter $\theta$')
ax.set_xlabel(r'Parameter $\mu$')
ax.set_ylabel('Likelihood')
ax.set_xticks(np.arange(1.6, 2.5, 0.4))
ax.annotate('Maximum',
@ -68,7 +68,7 @@ ax.annotate('',
ax.plot(thetas, p, **lsAm)
ax = fig.add_subplot(spec[1, 1])
ax.set_xlabel(r'Parameter $\theta$')
ax.set_xlabel(r'Parameter $\mu$')
ax.set_ylabel('Log-Likelihood')
ax.set_ylim(-50,-20)
ax.set_xticks(np.arange(1.6, 2.5, 0.4))

156
logistic/code/logistic.py Normal file
View File

@ -0,0 +1,156 @@
import numpy as np
import matplotlib.pyplot as plt
from scipy.stats import ttest_ind, mannwhitneyu
def auc(n, dx, uniform=False, plot=False):
# loser:
if uniform:
x0 = np.random.rand(n)
else:
x0 = np.random.randn(n)*0.3
y0 = np.zeros(len(x0))
# winner:
if uniform:
x1 = np.random.rand(n) + dx
else:
x1 = np.random.randn(n)*0.3 + dx
y1 = np.ones(len(x1))
# combine into a single table:
data = np.zeros((len(x0) + len(y0), 2))
data[:len(x0),0] = x0
data[:len(x0),1] = y0
data[len(x0):,0] = x1
data[len(x0):,1] = y1
# fraction of overlapping data values:
si = np.argsort(data[:,0])
i0 = np.argmax(data[si,1] != data[si[0],1])
i1 = len(data) - 1 - np.argmax(data[si[::-1],1] != data[si[-1],1])
overlap = (i1-i0+1)/len(data)
# Cohen's d:
m0 = np.mean(data[data[:,1] < 0.5,0])
v0 = np.var(data[data[:,1] < 0.5,0])
m1 = np.mean(data[data[:,1] > 0.5,0])
v1 = np.var(data[data[:,1] > 0.5,0])
cohensd = (m1 - m0)/np.sqrt(0.5*(v0+v1))
# t-test:
ttest, p = ttest_ind(data[data[:,1] > 0.5,0], data[data[:,1] < 0.5,0])
# Mann-Whitney U:
mannu, p = mannwhitneyu(data[data[:,1] < 0.5,0], data[data[:,1] > 0.5,0])
# ROC:
thresh = np.arange(np.min(data[:,0])-0.1, np.max(data[:,0])+0.2, 0.01)
true_pos = np.zeros(len(thresh))
false_pos = np.zeros(len(thresh))
for k in range(len(thresh)):
true_pos[k] = np.sum(data[data[:,0] > thresh[k],1] > 0.5)/np.sum(data[:,1] > 0.5)
false_pos[k] = np.sum(data[data[:,0] > thresh[k],1] < 0.5)/np.sum(data[:,1] < 0.5)
# AUC:
droc = 0.001
xroc = np.arange(0.0, 1.0+droc, droc)
yroc = np.interp(xroc, false_pos[::-1], true_pos[::-1])
auc = np.sum(yroc)*droc
if plot:
fig = plt.figure()
ax = fig.add_subplot(211)
ax.axvline(data[si[i0],0], color='k')
ax.axvline(data[si[i1],0], color='k', lw=2)
ax.plot(data[:,0], data[:,1], 'o')
ax.plot(data[data[:,1] < 0.5,0], np.zeros(len(data[data[:,1] < 0.5,0]))-0.5, 'or')
ax.plot(data[data[:,1] > 0.5,0], np.zeros(len(data[data[:,1] > 0.5,0]))-0.5, 'og')
ax.text(0.5*(data[si[i0],0]+data[si[i1],0]), 0.65, 'overlap=%.0f%%' % (100.0*overlap), ha='center')
ax.text(0.5*(data[si[i0],0]+data[si[i1],0]), 0.35, "Cohen's d=%.2f" % cohensd, ha='center')
ax.set_xlabel('x')
ax.set_yticks([0, 1])
ax.set_yticklabels(['Lose', 'Win'])
if uniform:
ax.set_title('Uniformly distributed data')
else:
ax.set_title('Normally distributed data')
ax = fig.add_subplot(223)
ax.plot(thresh, true_pos, '-og', label='TP')
ax.plot(thresh, false_pos, '-or', label='FP')
ax.legend()
ax.set_xlabel('threshold')
ax = fig.add_subplot(224)
ax.plot(false_pos, true_pos, '-o')
ax.fill_between(xroc, yroc)
ax.text(0.5, 0.5, 'AUC=%.0f%%' % (100.0*auc))
ax.set_xlabel('FP')
ax.set_ylabel('TP')
fig.tight_layout()
plt.show()
return auc, overlap, cohensd, ttest, mannu
# demo:
auc(20, 0.5, True, True)
auc(20, 0.5, False, True)
# AUC versus overlap:
n = 100
aucs_uni = []
overlaps_uni = []
cohensd_uni = []
ttest_uni = []
mannu_uni = []
aucs_norm = []
overlaps_norm = []
cohensd_norm = []
ttest_norm = []
mannu_norm = []
for frac in np.arange(-1.5, 1.5, 0.02):
a, o, d, t, u = auc(n, frac, True, False)
aucs_uni.append(a)
overlaps_uni.append(o)
cohensd_uni.append(d)
ttest_uni.append(t)
mannu_uni.append(u)
a, o, d, t, u = auc(n, frac, False, False)
aucs_norm.append(a)
overlaps_norm.append(o)
cohensd_norm.append(d)
ttest_norm.append(t)
mannu_norm.append(u)
fig, axs = plt.subplots(2, 2)
ax = axs[0, 0]
ax.plot([0.0, 1.0, 0.0], [0.0, 0.5, 1.0], 'k')
ax.plot(overlaps_uni, aucs_uni, 'o', label='uniform pdfs')
ax.plot(overlaps_norm, aucs_norm, 'o', label='normal pdfs')
ax.set_ylim(0, 1)
ax.set_xlabel('fraction of overlapping data')
ax.set_ylabel('AUC')
ax.legend(loc='center left')
ax = axs[0, 1]
ax.plot(cohensd_uni, aucs_uni, 'o', label='uniform pdfs')
ax.plot(cohensd_norm, aucs_norm, 'o', label='normal pdfs')
ax.set_ylim(0, 1)
ax.set_xlabel("Cohen's d")
ax.set_ylabel('AUC')
#ax.legend(loc='center left')
ax = axs[1, 1]
ax.plot(ttest_uni, aucs_uni, 'o', label='uniform pdfs')
ax.plot(ttest_norm, aucs_norm, 'o', label='normal pdfs')
ax.set_ylim(0, 1)
ax.set_xlabel("Student t")
ax.set_ylabel('AUC')
ax = axs[1, 0]
ax.plot(mannu_uni, aucs_uni, 'o', label='uniform pdfs')
ax.plot(mannu_norm, aucs_norm, 'o', label='normal pdfs')
ax.set_ylim(0, 1)
ax.set_xlabel("Mann-Whitney U")
ax.set_ylabel('AUC')
fig.savefig('aucoverlap.pdf')
plt.show()

View File

@ -22,7 +22,7 @@ colors['orange'] = '#FF9900'
colors['lightorange'] = '#FFCC00'
colors['yellow'] = '#FFF720'
colors['green'] = '#99FF00'
colors['blue'] = '#0010CC'
colors['blue'] = '#0020BB'
colors['gray'] = '#A7A7A7'
colors['black'] = '#000000'
colors['white'] = '#FFFFFF'
@ -33,17 +33,19 @@ colors['white'] = '#FFFFFF'
# general settings for plot styles:
lwthick = 3.0
lwthin = 1.8
edgewidth = 0.0 if xkcd_style else 1.0
mainline = {'linestyle': '-', 'linewidth': lwthick}
minorline = {'linestyle': '-', 'linewidth': lwthin}
largemarker = {'marker': 'o', 'markersize': 9, 'markeredgecolor': colors['white'], 'markeredgewidth': 1}
smallmarker = {'marker': 'o', 'markersize': 6, 'markeredgecolor': colors['white'], 'markeredgewidth': 1}
largemarker = {'marker': 'o', 'markersize': 9, 'markeredgecolor': colors['white'], 'markeredgewidth': edgewidth}
largeopenmarker = {'marker': 'o', 'markersize': 7, 'markerfacecolor': colors['white'], 'markeredgewidth': 2}
smallmarker = {'marker': 'o', 'markersize': 6, 'markeredgecolor': colors['white'], 'markeredgewidth': edgewidth}
largelinepoints = {'linestyle': '-', 'linewidth': lwthick, 'marker': 'o', 'markersize': 10, 'markeredgecolor': colors['white'], 'markeredgewidth': 1}
smalllinepoints = {'linestyle': '-', 'linewidth': 1.4, 'marker': 'o', 'markersize': 7, 'markeredgecolor': colors['white'], 'markeredgewidth': 1}
filllw = 1.0
filllw = edgewidth
fillec = colors['white']
fillalpha = 0.4
filledge = {'linewidth': filllw, 'joinstyle': 'round'}
if int(mpl.__version__.split('.')[0]) < 2:
if mpl_major < 2:
del filledge['joinstyle']
# helper lines:
@ -51,6 +53,8 @@ lsSpine = {'c': colors['black'], 'linestyle': '-', 'linewidth': 1, 'clip_on': Fa
lsGrid = {'c': colors['gray'], 'linestyle': '--', 'linewidth': 1}
lsMarker = {'c': colors['black'], 'linestyle': '-', 'linewidth': 2}
psMarker = dict({'color': colors['black'], 'linestyle': 'none'}, **largemarker)
# line (ls), point (ps), and fill styles (fs).
# Each style is derived from a main color as indicated by the capital letter.
@ -85,6 +89,7 @@ fsAa = {'facecolor': colors['blue'], 'edgecolor': 'none', 'alpha': fillalpha}
lsB = dict({'color': colors['red']}, **mainline)
lsBm = dict({'color': colors['red']}, **minorline)
psB = dict({'color': colors['red'], 'linestyle': 'none'}, **largemarker)
psBo = dict({'markeredgecolor': colors['red'], 'linestyle': 'none'}, **largeopenmarker)
psBm = dict({'color': colors['red'], 'linestyle': 'none'}, **smallmarker)
lpsB = dict({'color': colors['red']}, **largelinepoints)
lpsBm = dict({'color': colors['red']}, **smalllinepoints)

View File

@ -0,0 +1,3 @@
TEXFILES=$(wildcard plotting-?.tex)
include ../../exercises.mk

View File

@ -1,17 +1,11 @@
\vspace*{-8ex}
\begin{center}
\textbf{\Large Introduction to scientific computing}\\[1ex]
{\large Jan Grewe, Jan Benda}\\[-3ex]
Neuroethology lab \hfill --- \hfill Institute for Neurobiology \hfill --- \hfill \includegraphics[width=0.28\textwidth]{UT_WBMW_Black_RGB} \\
\end{center}
\ifprintanswers%
\else
The exercises are meant for self-monitoring and revision of the
lecture. You should try to solve them on your own. In contrast
to previous exercises, the solutions cannot be saved in a single file. Combine the files into a
single zip archive and submit it via ILIAS. Name the archive according
to the pattern: ``plotting\_\{surname\}.zip''.
% \ifprintanswers%
% \else
% % Die folgenden Aufgaben dienen der Wiederholung, \"Ubung und
% % Selbstkontrolle und sollten eigenst\"andig bearbeitet und gel\"ost
@ -43,4 +37,4 @@ to the pattern: ``plotting\_\{surname\}.zip''.
% Antworten!
% \end{itemize}
% \fi
\fi

View File

@ -1,88 +1,18 @@
\documentclass[12pt,a4paper,pdftex]{exam}
\usepackage[german]{babel}
\usepackage{pslatex}
\usepackage[mediumspace,mediumqspace]{SIunits} % \ohm, \micro
\usepackage{xcolor}
\usepackage{graphicx}
\usepackage[breaklinks=true,bookmarks=true,bookmarksopen=true,pdfpagemode=UseNone,pdfstartview=FitH,colorlinks=true,citecolor=blue]{hyperref}
\newcommand{\exercisetopic}{Plotting}
\newcommand{\exercisenum}{X}
\newcommand{\exercisedate}{December 14th, 2020}
%%%%% layout %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage[left=20mm,right=20mm,top=25mm,bottom=25mm]{geometry}
\pagestyle{headandfoot}
\ifprintanswers
\newcommand{\stitle}{: Solutions}
\else
\newcommand{\stitle}{}
\fi
\header{{\bfseries\large Exercise 7\stitle}}{{\bfseries\large Plotting}}{{\bfseries\large November 20, 2019}}
\firstpagefooter{Dr. Jan Grewe}{Phone: 29 74588}{Email:
jan.grewe@uni-tuebingen.de}
\runningfooter{}{\thepage}{}
\input{../../exercisesheader}
\setlength{\baselineskip}{15pt}
\setlength{\parindent}{0.0cm}
\setlength{\parskip}{0.3cm}
\renewcommand{\baselinestretch}{1.15}
\firstpagefooter{Dr. Jan Grewe}{}{jan.grewe@uni-tuebingen.de}
%%%%% listings %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{listings}
\lstset{
language=Matlab,
basicstyle=\ttfamily\footnotesize,
numbers=left,
numberstyle=\tiny,
title=\lstname,
showstringspaces=false,
commentstyle=\itshape\color{darkgray},
breaklines=true,
breakautoindent=true,
columns=flexible,
frame=single,
xleftmargin=1em,
xrightmargin=1em,
aboveskip=10pt
}
%%%%% math stuff: %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\usepackage{amsmath}
\usepackage{amssymb}
\usepackage{bm}
\usepackage{dsfont}
\newcommand{\naZ}{\mathds{N}}
\newcommand{\gaZ}{\mathds{Z}}
\newcommand{\raZ}{\mathds{Q}}
\newcommand{\reZ}{\mathds{R}}
\newcommand{\reZp}{\mathds{R^+}}
\newcommand{\reZpN}{\mathds{R^+_0}}
\newcommand{\koZ}{\mathds{C}}
%%%%% page breaks %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\newcommand{\continue}{\ifprintanswers%
\else
\vfill\hspace*{\fill}$\rightarrow$\newpage%
\fi}
\newcommand{\continuepage}{\ifprintanswers%
\newpage
\else
\vfill\hspace*{\fill}$\rightarrow$\newpage%
\fi}
\newcommand{\newsolutionpage}{\ifprintanswers%
\newpage%
\else
\fi}
%%%%% new commands %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\newcommand{\qt}[1]{\textbf{#1}\\}
\newcommand{\pref}[1]{(\ref{#1})}
\newcommand{\extra}{--- Zusatzaufgabe ---\ \mbox{}}
\newcommand{\code}[1]{\texttt{#1}}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{document}
\input{../../exercisestitle}
\input{instructions}
\begin{questions}

View File

@ -3,7 +3,7 @@
\input{../../header}
\lstset{inputpath=../code}
\graphicspath{{images/}}
\graphicspath{{figures/}}
\typein[\pagenumber]{Number of first page}
\typein[\chapternumber]{Chapter number}

View File

@ -74,20 +74,20 @@ the data was changed or the same kind of plot has to be created for a
number of datasets.
\begin{important}[Why manual editing should be avoided.]
On first glance the manual editing of a figure using tools such as
Corel draw, Illustrator, etc.\,appears much more convenient and less
complex than coding everything into the analysis scripts. This,
however, is not entirely true. What if the figure has to be re-drawn
or updated? Then the editing work starts all over again. Rather,
there is a great risk associated with the manual editing
approach. Axes may be shifted, fonts have not been embedded into the
final document, annotations have been copy pasted between figures
and are not valid. All of these mistakes can be found in
publications and then require an erratum, which is not
desirable. Even if it appears more cumbersome in the beginning one
should always try to create publication-ready figures directly from
the data analysis tool using scripts or functions to properly layout
the plot.
At first glance, manual editing of a figure using tools such as
Inkscape, CorelDRAW, Illustrator, etc.\,appears much more
convenient and less complex than coding everything into the analysis
scripts. This, however, is not entirely true. What if the figure has
to be re-drawn or updated, because, for example, you got more data?
Then the editing work starts all over again. In addition, there is a
great risk associated with the manual editing approach. Axes may be
shifted, fonts have not been embedded into the final document,
annotations have been copy-pasted between figures and are not
valid. All of these mistakes can be found in publications and then
require an erratum, which is not desirable. Even if it appears more
cumbersome in the beginning, one should always try to generate
publication-ready figures directly from the data analysis tool using
scripts or functions to properly layout and annotate the plot.
\end{important}
\subsection{Simple plotting}
@ -148,7 +148,7 @@ or the color. For additional options consult the help.
The following listing shows a simple line plot with axis labeling and a title
\lstinputlisting[caption={A simple plot showing a sinewave.},
\pageinputlisting[caption={A simple plot showing a sinewave.},
label=simpleplotlisting]{simple_plot.m}
@ -162,10 +162,10 @@ chosen, and star marker symbols is used. Finally, the name of the
curve is set to \emph{plot 1} which will be displayed in a legend, if
chosen.
\begin{lstlisting}[label=settinglineprops, caption={Setting line properties when calling \varcode{plot}.}]
\begin{pagelisting}[label=settinglineprops, caption={Setting line properties when calling \varcode{plot}.}]
x = 0:0.1:2*pi;
y = sin(x);
plot(x, y, 'color', 'r', 'linestyle', ':', 'marker', '*', ...
     'linewidth', 1.5, 'displayname', 'plot 1')
\end{lstlisting}
\end{pagelisting}
\begin{important}[Choosing the right color.]
Choosing the perfect color goes a little bit beyond personal
@ -277,7 +277,7 @@ the last one defines the output format (box\,\ref{graphicsformatbox}).
listing\,\ref{niceplotlisting}.}\label{spikedetectionfig}
\end{figure}
\begin{ibox}[t]{\label{graphicsformatbox}File formats for digital artwork.}
\begin{ibox}[tp]{\label{graphicsformatbox}File formats for digital artwork.}
There are two fundamentally different types of formats for digital artwork:
\begin{enumerate}
\item \enterm[bitmap]{Bitmaps} (\determ{Rastergrafik})
@ -322,7 +322,7 @@ the last one defines the output format (box\,\ref{graphicsformatbox}).
efficient.
\end{ibox}
\lstinputlisting[caption={Script for creating the plot shown in
\pageinputlisting[caption={Script for creating the plot shown in
\figref{spikedetectionfig}.},
label=niceplotlisting]{automatic_plot.m}
@ -380,7 +380,7 @@ draw the data. In the example we also provide further arguments to set
the size, color of the dots and specify that they are filled
(listing\,\ref{scatterlisting1}).
\lstinputlisting[caption={Creating a scatter plot with red filled dots.},
\pageinputlisting[caption={Creating a scatter plot with red filled dots.},
label=scatterlisting1, firstline=9, lastline=9]{scatterplot.m}
We could have used plot for this purpose and set the marker to
@ -395,8 +395,7 @@ manipulate the color we need to specify a length(x)-by-3 matrix. For
each dot we provide an individual color (i.e. the RGB triplet in each
row of the color matrix, lines 2-4 in listing\,\ref{scatterlisting2})
\lstinputlisting[caption={Creating a scatter plot with size and color
\pageinputlisting[caption={Creating a scatter plot with size and color
variations. The RGB triplets define the respective color intensity
in a range 0:1. Here, we modify only the red color channel.},
label=scatterlisting2, linerange={15-15, 21-23}]{scatterplot.m}
@ -431,7 +430,7 @@ figures\,\ref{regularsubplotsfig}, \ref{irregularsubplotsfig}).
also below).}\label{regularsubplotsfig}
\end{figure}
\lstinputlisting[caption={Script for creating subplots in a regular
\pageinputlisting[caption={Script for creating subplots in a regular
grid \figref{regularsubplotsfig}.}, label=regularsubplotlisting,
basicstyle=\ttfamily\scriptsize]{regular_subplot.m}
@ -458,7 +457,7 @@ create a grid with larger numbers of columns and rows, and specify the
used cells of the grid by passing a vector as the third argument to
\code{subplot()}.
\lstinputlisting[caption={Script for creating subplots of different
\pageinputlisting[caption={Script for creating subplots of different
sizes \figref{irregularsubplotsfig}.},
label=irregularsubplotslisting,
basicstyle=\ttfamily\scriptsize]{irregular_subplot.m}
@ -516,7 +515,7 @@ its properties. See the \matlab{} help for more information.
listing\,\ref{errorbarlisting} for A and C and listing\,\ref{errorbarlisting2} }\label{errorbarplot}
\end{figure}
\lstinputlisting[caption={Illustrating estimation errors using error bars. Script that
\pageinputlisting[caption={Illustrating estimation errors using error bars. Script that
creates \figref{errorbarplot}. A, B},
label=errorbarlisting, firstline=13, lastline=31,
basicstyle=\ttfamily\scriptsize]{errorbarplot.m}
@ -550,7 +549,7 @@ leading to invisibility and a value of one to complete
opaqueness. Finally, we use the normal plot command to draw a line
connecting the average values (line 12).
\lstinputlisting[caption={Illustrating estimation errors using a shaded area. Script that
\pageinputlisting[caption={Illustrating estimation errors using a shaded area. Script that
creates \figref{errorbarplot} C.}, label=errorbarlisting2,
firstline=33,
basicstyle=\ttfamily\scriptsize]{errorbarplot.m}
@ -575,7 +574,7 @@ listing\,\ref{annotationsplotlisting}. For more options consult the
listing\,\ref{annotationsplotlisting}}\label{annotationsplot}
\end{figure}
\lstinputlisting[caption={Adding annotations to figures. Script that
\pageinputlisting[caption={Adding annotations to figures. Script that
creates \figref{annotationsplot}.},
label=annotationsplotlisting,
basicstyle=\ttfamily\scriptsize]{annotations.m}
@ -632,7 +631,7 @@ Lissajous figure. The basic steps are:
\item Finally, close the file (line 31).
\end{enumerate}
\lstinputlisting[caption={Making animations and saving them as a
\pageinputlisting[caption={Making animations and saving them as a
movie.}, label=animationlisting, firstline=16, lastline=36,
basicstyle=\ttfamily\scriptsize]{movie_example.m}

View File

@ -18,7 +18,7 @@ function [time, rate] = binned_rate(spikes, bin_width, dt, t_max)
rate = zeros(size(time));
h = hist(spikes, bins) ./ bin_width;
for i = 2:length(bins)
rate(round(bins(i - 1) / dt) + 1:round(bins(i) / dt)) = h(i);
rate(round(bins(i-1)/dt) + 1:round(bins(i)/dt)) = h(i);
end
end

View File

@ -1,10 +0,0 @@
function pcn = colorednoisepdf( x, misi, epsilon, tau )
% returns the ISI pdf for PIF with colored noise drive
% x: the input ISI
% misis: the mean isi
% epsilon: a parameter
% tau: the correlation time of the noise
gamma1 = x/tau+exp(-x/tau)-1.0;
gamma2 = 1.0-exp(-x/tau);
pcn=exp(-(x-misi).^2./(4.0*epsilon*tau.^2.*gamma1)).*(((misi-x).*gamma2+2*gamma1*tau).^2./(2*gamma1*tau^2)-epsilon*(gamma2.^2-2*gamma1.*exp(-x/tau))) ./ (2*tau*sqrt(4*pi*epsilon*gamma1.^3));
end

View File

@ -1,24 +0,0 @@
% misi = 0.02;
% epsilon = 1.0;
% tau = 0.1;
x=0:0.002:0.1;
% pcn = colorednoisepdf( x, misi, epsilon, tau )+10.0*randn( size( x ) );
% plot( x, pcn );
spikes = lifouspikes( 10, 15, 50.0, 1.0, 1.0 );
isivec = isis( spikes );
misi = mean( isivec );
1.0/misi
isibins = 0:0.0005:0.1;
[ n, c ] = hist( isivec, isibins );
n = n / sum(n)/(isibins(2)-isibins(1));
bar( c, n );
beta0 = [ 1.0, 0.01 ];
b = nlinfit(c(1:end-2), n(1:end-2), @(b,x)(colorednoisepdf(x, misi, b(1), b(2))), beta0)
pcn = colorednoisepdf( x, misi, b(1), b(2) );
hold on
plot( x, pcn, 'r', 'LineWidth', 3 );
hold off

View File

@ -10,19 +10,18 @@ function [time, rate] = convolution_rate(spikes, sigma, dt, t_max)
% t_max : the trial duration in seconds.
%
% Returns:
two vectors containing the time and the rate.
% two vectors containing the time and the rate.
time = 0:dt:t_max - dt;
rate = zeros(size(time));
spike_indices = round(spikes / dt);
rate(spike_indices) = 1;
kernel = gaussKernel(sigma, dt);
rate = conv(rate, kernel, 'same');
time = 0:dt:t_max - dt;
rate = zeros(size(time));
spike_indices = round(spikes / dt);
rate(spike_indices) = 1;
kernel = gaussKernel(sigma, dt);
rate = conv(rate, kernel, 'same');
end
function y = gaussKernel(s, step)
x = -4 * s:step:4 * s;
y = exp(-0.5 .* (x ./ s) .^ 2) ./ sqrt(2 * pi) / s;
y = exp(-0.5 .* (x ./ s).^ 2) ./ sqrt(2 * pi) / s;
end

View File

@ -1,44 +0,0 @@
function [counts, bins] = counthist(spikes, w)
% Compute and plot histogram of spike counts.
%
% [counts, bins] = counthist(spikes, w)
%
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
% w: observation window duration in seconds for computing the counts
%
% Returns:
% counts: the histogram of counts normalized to probabilities
% bins: the bin centers for the histogram
% collect spike counts:
tmax = spikes{1}(end);
n = [];
r = [];
for k = 1:length(spikes)
times = spikes{k};
% alternative 1: count the number of spikes in each window:
% for tk = 0:w:tmax-w
% nn = sum((times >= tk) & (times < tk+w));
% %nn = length(find((times >= tk) & (times < tk+w)));
% n = [n nn];
% end
% alternative 2: use the hist() function to do that!
tbins = 0.5*w:w:tmax-0.5*w;
nn = hist(times, tbins);
n = [n nn];
end
% histogram of spike counts:
maxn = max(n);
[counts, bins] = hist(n, 0:1:maxn+10);
% normalize to probabilities:
counts = counts / sum(counts);
% plot:
if nargout == 0
bar( bins, counts );
xlabel( 'counts k' );
ylabel( 'P(k)' );
end
end

View File

@ -1,55 +0,0 @@
function [counts, bins] = counthist(spikes, w)
% computes count histogram and compare with Poisson distribution
%
% [counts, bins] = counthist(spikes, w)
%
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
% w: observation window duration in seconds for computing the counts
%
% Returns:
% counts: the histogram of counts normalized to probabilities
% bins: the bin centers for the histogram
% collect spike counts:
tmax = spikes{1}(end);
n = [];
r = [];
for k = 1:length(spikes)
times = spikes{k};
% alternative 1: count the number of spikes in each window:
% for tk = 0:w:tmax-w
% nn = sum( ( times >= tk ) & ( times < tk+w ) );
% %nn = length( find( ( times >= tk ) & ( times < tk+w ) ) );
% n = [ n nn ];
% end
% alternative 2: use the hist function to do that!
tbins = 0.5*w:w:tmax-0.5*w;
nn = hist(times, tbins);
n = [ n nn ];
% the rate of the spikes:
rate = (length(times)-1)/(times(end) - times(1));
r = [ r rate ];
end
% histogram of spike counts:
maxn = max( n );
[counts, bins ] = hist( n, 0:1:maxn+10 );
% normalize to probabilities:
counts = counts / sum( counts );
% plot:
if nargout == 0
bar( bins, counts );
hold on;
% Poisson distribution:
rate = mean( r );
x = 0:1:maxn+10;
a = rate*w;
y = a.^x.*exp(-a)./factorial(x);
plot( x, y, 'r', 'LineWidth', 3 );
hold off;
xlabel( 'counts k' );
ylabel( 'P(k)' );
end
end

View File

@ -0,0 +1,25 @@
function n = counts(spikes, w)
% Count spikes in time windows.
%
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
% w: duration of window in seconds for computing the counts
%
% Returns:
% n: vector with spike counts
tmax = spikes{1}(end);
n = [];
for k = 1:length(spikes)
times = spikes{k};
% alternative 1: count the number of spikes in each window:
% for tk = 0:w:tmax-w
% nn = sum((times >= tk) & (times < tk+w));
% % nn = length(find((times >= tk) & (times < tk+w)));
% n = [n, nn];
% end
% alternative 2: use the hist() function to do that!
tbins = 0.5*w:w:tmax-0.5*w;
nn = hist(times, tbins);
n = [n, nn];
end
end

View File

@ -1,39 +0,0 @@
function fano( spikes )
% computes fano factor as a function of window size
% spikes: a cell array of vectors of spike times
tmax = spikes{1}(end);
windows = 0.01:0.05:0.01*tmax;
mc = windows;
vc = windows;
ff = windows;
fs = windows;
for j = 1:length(windows)
w = windows( j );
% collect counts:
n = [];
for k = 1:length(spikes)
for tk = 0:w:tmax-w
nn = sum( ( spikes{k} >= tk ) & ( spikes{k} < tk+w ) );
%nn = length( find( ( spikes{k} >= tk ) & ( spikes{k} < tk+w ) ) );
n = [ n nn ];
end
end
% statistics for current window:
mc(j) = mean( n );
vc(j) = var( n );
ff(j) = vc( j )/mc( j );
fs(j) = sqrt(vc( j )/mc( j ));
end
subplot( 1, 2, 1 );
scatter( mc, vc, 'filled' );
xlabel( 'Mean count' );
ylabel( 'Count variance' );
subplot( 1, 2, 2 );
scatter( 1000.0*windows, fs, 'filled' );
xlabel( 'Window W [ms]' );
ylabel( 'Fano factor' );
end

View File

@ -2,8 +2,6 @@ function spikes = hompoissonspikes(rate, trials, tmax)
% Generate spike times of a homogeneous poisson process
% using the exponential interspike interval distribution.
%
% spikes = hompoissonspikes(rate, trials, tmax)
%
% Arguments:
% rate: the rate of the Poisson process in Hertz
% trials: number of trials that should be generated
@ -11,7 +9,6 @@ function spikes = hompoissonspikes(rate, trials, tmax)
%
% Returns:
% spikes: a cell array of vectors of spike times in seconds
spikes = cell(trials, 1);
mu = 1.0/rate;
nintervals = 2*round(tmax/mu);

View File

@ -19,6 +19,6 @@ function [time, rate] = instantaneous_rate(spikes, dt, t_max)
spike_indices = [1 round(spikes ./ dt)];
for i = 2:length(spike_indices)
rate(spike_indices(i - 1):spike_indices(i)) = inst_rate(i - 1);
rate(spike_indices(i-1):spike_indices(i)) = inst_rate(i-1);
end
end

View File

@ -1,25 +1,13 @@
function [pdf, centers] = isihist(isis, binwidth)
% Compute normalized histogram of interspike intervals.
%
% [pdf, centers] = isihist(isis, binwidth)
%
% Arguments:
% isis: vector of interspike intervals in seconds
% binwidth: optional width in seconds to be used for the isi bins
% binwidth: width in seconds to be used for the ISI bins
%
% Returns:
% pdf: vector with probability density of interspike intervals in Hz
% pdf: vector with pdf of interspike intervals in Hertz
% centers: vector with centers of the interspike intervals in seconds
if nargin < 2
% compute good binwidth:
nperbin = 200; % average number of data points per bin
bins = length(isis)/nperbin; % number of bins
binwidth = max(isis)/bins;
if binwidth < 5e-4 % half a millisecond
binwidth = 5e-4;
end
end
bins = 0.5*binwidth:binwidth:max(isis);
% histogram data:
[nelements, centers] = hist(isis, bins);

View File

@ -1,24 +0,0 @@
function isireturnmap( isis, lag2 )
% plot return maps for lag 1 and lag lag2
clf;
subplot( 1, 2, 1 );
lag = 1;
scatter( 1000.0*isis(1:end-lag)', 1000.0*isis(1+lag:end)', 'b', 'filled', 'MarkerEdgeColor', 'white' );
xlabel( 'ISI T_i [ms]' );
ylabel( 'ISI T_{i+1} [ms]' );
maxisi = max( isis );
maxy = ceil(maxisi/10)*10.0;
xlim( [0 1.5*maxy ])
ylim( [0 maxy ])
subplot( 1, 2, 2 );
lag = lag2;
scatter( 1000.0*isis(1:end-lag)', 1000.0*isis(1+lag:end)', 'b', 'filled', 'MarkerEdgeColor', 'white' );
xlabel( 'ISI T_i [ms]' );
ylabel( 'ISI T_{i+2} [ms]' );
xlim( [0 1.5*maxy ])
ylim( [0 maxy ])
end

View File

@ -1,15 +1,11 @@
function isivec = isis(spikes)
% returns a single list of isis computed from all trials in spikes
%
% isivec = isis(spikes)
%
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
% isivec: a column vector with all the interspike intervalls
%
% Returns:
% isivec: a column vector with all the interspike intervalls
% isivec: a column vector with all the interspike intervals
isivec = [];
for k = 1:length(spikes)
difftimes = diff(spikes{k});

View File

@ -1,35 +1,21 @@
function isicorr = isiserialcorr(isivec, maxlag)
function [isicorr, lags] = isiserialcorr(isivec, maxlag)
% serial correlation of interspike intervals
%
% isicorr = isiserialcorr(isivec, maxlag)
%
% Arguments:
% isivec: vector of interspike intervals in seconds
% maxlag: the maximum lag in seconds
% maxlag: the maximum lag
%
% Returns:
% isicorr: vector with the serial correlations for lag 0 to maxlag
% lags: vector with the lags corresponding to isicorr
lags = 0:maxlag;
isicorr = zeros(size(lags));
for k = 1:length(lags)
lag = lags(k);
if length(isivec) > lag+10 % ensure "enough" data
% NOTE: the arguments to corr must be column vectors!
% We insure this in the isis() function that
% generates the isivec.
% We ensure this already in the isis() function.
isicorr(k) = corr(isivec(1:end-lag), isivec(lag+1:end));
end
end
if nargout == 0
% plot:
plot(lags, isicorr, '-b');
hold on;
scatter(lags, isicorr, 50.0, 'b', 'filled');
hold off;
xlabel('Lag k')
ylabel('\rho_k')
end
end

View File

@ -1,24 +1,14 @@
w = 0.1;
cmax = 8;
pmax = 0.5;
subplot(1, 3, 1);
counthist(poissonspikes, w);
xlim([0 cmax])
set(gca, 'XTick', 0:2:cmax)
ylim([0 pmax])
title('Poisson');
subplot(1, 3, 2);
counthist(pifouspikes, w);
xlim([0 cmax])
set(gca, 'XTick', 0:2:cmax)
ylim([0 pmax])
title('PIF OU');
subplot(1, 3, 3);
counthist(lifadaptspikes, w);
xlim([0 cmax])
set(gca, 'XTick', 0:2:cmax)
ylim([0 pmax])
title('LIF adapt');
savefigpdf(gcf, 'counthist.pdf', 20, 7);
function plotcounthist(spikes, w)
% Plot histogram of spike counts.
%
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
% w: duration of window in seconds for computing the counts
n = counts(spikes, w);
maxn = max(n);
[c, bins] = hist(n, 0:1:maxn+10);  % use c, not counts, to avoid shadowing the counts() function
c = c / sum(c);                    % normalize to probabilities
bar(bins, c);
xlabel('counts k');
ylabel('P(k)');
end

View File

@ -0,0 +1,31 @@
function plotfanofactor(spikes, wmin, wmax)
% Compute and plot Fano factor as a function of window size.
%
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
% wmin: minimum window size in seconds
% wmax: maximum window size in seconds
windows = logspace(log10(wmin), log10(wmax), 100);
mc = zeros(1, length(windows));
vc = zeros(1, length(windows));
for k = 1:length(windows)
w = windows(k);
n = counts(spikes, w);
mc(k) = mean(n);
vc(k) = var(n);
end
subplot(1, 2, 1);
scatter(mc, vc, 'filled');
xlabel('Mean count');
ylabel('Count variance');
subplot(1, 2, 2);
scatter(1000.0*windows, vc ./ mc, 'filled');
xlabel('Window [ms]');
ylabel('Fano factor');
xlim(1000.0*[windows(1) windows(end)])
ylim([0.0 1.1]);
set(gca, 'XScale', 'log');
end

View File

@ -1,24 +1,13 @@
function plotisihist(isis, binwidth)
% Plot and annotate histogram of interspike intervals.
%
% plotisihist(isis, binwidth)
%
% Arguments:
% isis: vector of interspike intervals in seconds
% binwidth: optional width in seconds to be used for the isi bins
% compute normalized histogram:
if nargin < 2
[pdf, centers] = isihist(isis);
else
[pdf, centers] = isihist(isis, binwidth);
end
% plot:
% binwidth: width in seconds to be used for the ISI bins
[pdf, centers] = isihist(isis, binwidth);
bar(1000.0*centers, pdf); % milliseconds on x-axis
xlabel('ISI [ms]')
ylabel('p(ISI) [1/s]')
% annotation:
misi = mean(isis);
sdisi = std(isis);
text(0.95, 0.8, sprintf('mean=%.1f ms', 1000.0*misi), ...

View File

@ -0,0 +1,14 @@
function isicorr = plotisiserialcorr(isivec, maxlag)
% plot serial correlation of interspike intervals
%
% Arguments:
% isivec: vector of interspike intervals in seconds
% maxlag: the maximum lag
[isicorr, lags] = isiserialcorr(isivec, maxlag);
plot(lags, isicorr, '-b');
hold on;
scatter(lags, isicorr, 20.0, 'b', 'filled');
hold off;
xlabel('Lag k')
ylabel('\rho_k')
end

View File

@ -1,100 +0,0 @@
%% load data:
clear all
% alternative 1:
% pro: no structs. contra: global unknown variables
load poisson.mat
whos
poissonspikes = spikes;
load pifou.mat;
pifouspikes = spikes;
load lifadapt.mat;
lifadaptspikes = spikes;
clear spikes;
% alternative 2:
% pro: clean code. contra: structs that we do not really know yet
clear all
x = load( 'poisson.mat' );
poissonspikes = x.spikes;
x = load( 'pifou.mat' );
pifouspikes = x.spikes;
x = load( 'lifadapt.mat' );
lifadaptspikes = x.spikes;
%% spike raster plots:
tmax = 1.0;
subplot(1, 3, 1);
spikeraster(poissonspikes, tmax);
title('Poisson');
subplot(1, 3, 2);
spikeraster(pifouspikes, tmax);
title('PIF OU');
subplot(1, 3, 3);
spikeraster(lifadaptspikes, tmax);
title('LIF adapt');
%% isi histograms:
maxisi = 300.0;
binwidth = 0.002;
subplot(1, 3, 1);
poissonisis = isis(poissonspikes);
isihist(poissonisis, binwidth);
xlim([0, maxisi])
title('Poisson');
subplot(1, 3, 2);
pifouisis = isis(pifouspikes);
isihist(pifouisis, binwidth);
xlim([0, maxisi])
title('PIF OU');
subplot(1, 3, 3);
lifadaptisis = isis(lifadaptspikes);
isihist(lifadaptisis, binwidth);
xlim([0, maxisi])
title('LIF adapt');
%% serial correlations:
maxlag = 10;
rrange = [-0.5, 1.05];
subplot(1, 3, 1);
isiserialcorr(poissonisis, maxlag);
ylim(rrange)
title('Poisson');
subplot(1, 3, 2);
isiserialcorr(pifouisis, maxlag);
ylim(rrange)
title('PIF OU');
subplot(1, 3, 3);
isiserialcorr(lifadaptisis, maxlag);
ylim(rrange)
title('LIF adapt');
%% spike counts:
w = 0.1;
cmax = 8;
pmax = 0.5;
subplot(1, 3, 1);
counthist(poissonspikes, w);
xlim([0 cmax])
set(gca, 'XTick', 0:2:cmax)
ylim([0 pmax])
title('Poisson');
subplot(1, 3, 2);
counthist(pifouspikes, w);
xlim([0 cmax])
set(gca, 'XTick', 0:2:cmax)
ylim([0 pmax])
title('PIF OU');
subplot(1, 3, 3);
counthist(lifadaptspikes, w);
xlim([0 cmax])
set(gca, 'XTick', 0:2:cmax)
ylim([0 pmax])
title('LIF adapt');
savefigpdf(gcf, 'counthist.pdf', 20, 7);

View File

@ -1,27 +0,0 @@
rate = 100.0;
trials = 50;
tmax = 100.0;
% generate spikes:
spikes = poissonspikes( trials, rate, tmax );
% interspike intervals:
isivec = isis( spikes );
% histogram
f = figure( 1 );
isihist( isivec );
hold on
% theoretical density:
xmax = 5.0/rate;
x = 0:0.0001:xmax;
y = rate*exp(-rate*x);
plot( 1000.0*x, y, 'r', 'LineWidth', 3 );
% plot details:
title( sprintf( 'Poisson spike trains, rate=%g Hz, nisi=%d', rate, length( isivec ) ) )
xlim( [ 0.0 1000.0*xmax ] )
ylim( [ 0.0 1.1*rate ] )
legend( 'data', 'poisson' )
hold off
% serial correlations:
f = figure( 2 );
isiserialcorr( isivec, 10 );

View File

@ -1,46 +0,0 @@
rates = 1:1:100;
avisi = [];
sdisi = [];
cvisi = [];
for rate = rates
spikes = poissonspikes( 10, rate, 100.0 );
isivec = isis( spikes );
av = mean( isivec );
sd = std( isivec );
cv = sd/av;
avisi = [ avisi av ];
sdisi = [ sdisi sd ];
cvisi = [ cvisi cv ];
end
f = figure;
subplot( 1, 3, 1 );
scatter( rates, 1000.0*avisi, 'b', 'filled' );
hold on;
plot( rates, 1000.0./rates, 'r' );
hold off;
xlabel( 'Rate \lambda [Hz]' );
ylim( [ 0 1000 ] );
title( 'Mean ISI [ms]' );
legend( 'simulation', 'theory 1/\lambda' );
subplot( 1, 3, 2 );
scatter( rates, 1000.0*sdisi, 'b', 'filled' );
hold on;
plot( rates, 1000.0./rates, 'r' );
hold off;
xlabel( 'Rate \lambda [Hz]' );
ylim( [ 0 1000 ] )
title( 'Standard deviation ISI [ms]' );
legend( 'simulation', 'theory 1/\lambda' );
subplot( 1, 3, 3 );
scatter( rates, cvisi, 'b', 'filled' );
hold on;
plot( rates, ones( size( rates ) ), 'r' );
hold off;
xlabel( 'Rate \lambda [Hz]' );
ylim( [ 0 2 ] )
title( 'CV' );
legend( 'simulation', 'theory' );

View File

@ -1,14 +0,0 @@
function p = psth(spikes, dt, tmax)
% plots a PSTH of the spikes with binwidth dt
t = 0.0:dt:tmax+dt;
p = zeros(1, length(t));
for k=1:length(spikes)
times = spikes{k};
[h, b] = hist(times, t);
p = p + h;
end
p = p/length(spikes)/dt;
t(end) = [];
p(end) = [];
plot(t, p);
end

View File

@ -1,29 +1,32 @@
function rasterplot(spikes, tmax)
% Display a spike raster of the spike times given in spikes.
%
% rasterplot(spikes, tmax)
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
% tmax: plot spike raster upto tmax seconds
ntrials = length(spikes);
for k = 1:ntrials
times = spikes{k};
times = times(times<tmax);
if tmax < 1.5
times = 1000.0*times; % conversion to ms
end
for i = 1:length( times )
line([times(i) times(i)],[k-0.4 k+0.4], 'Color', 'k');
% tmax: plot spike raster up to tmax seconds
spiketimes = [];
trials = [];
ntrials = length(spikes);
for k = 1:ntrials
times = spikes{k};
times = times(times<tmax);
% (x,y) pairs for start and stop of stroke
% plus nan separating strokes:
spiketimes = [spiketimes, ...
[times(:)'; times(:)'; times(:)'*nan]];
trials = [trials, ...
[ones(1, length(times)) * (k-0.4); ...
ones(1, length(times)) * (k+0.4); ...
ones(1, length(times)) * nan]];
end
end
if tmax < 1.5
xlabel('Time [ms]');
xlim([0.0 1000.0*tmax]);
else
% convert matrices into column vectors of (x,y) pairs:
spiketimes = spiketimes(:);
trials = trials(:);
% plotting this is lightning fast:
plot(spiketimes, trials, 'k')
xlabel('Time [s]');
xlim([0.0 tmax]);
end
ylabel('Trials');
ylim([0.3 ntrials+0.7 ]);
ylabel('Trials');
ylim([0.3 ntrials+0.7]);
end
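The NaN-separated coordinates assembled in the loop above let a single plot() call draw all spike strokes at once, which is much faster than one line() call per spike; a tiny self-contained sketch of the same trick:

% three vertical strokes at x = 1, 2, 3 drawn with one plot() call;
% the NaNs break the line between the strokes:
x = [1 1 nan, 2 2 nan, 3 3 nan];
y = [0 1 nan, 0 1 nan, 0 1 nan];
plot(x, y, 'k');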

View File

@ -1,30 +0,0 @@
function counts = spikecounts(spikes, w)
% Compute vector of spike counts.
%
% counts = spikecounts(spikes, w)
%
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
% w: observation window duration in seconds for computing the counts
%
% Returns:
% counts: vector of spike counts
% collect spike counts:
tmax = spikes{1}(end);
counts = [];
for k = 1:length(spikes)
times = spikes{k};
% method 1: count the number of spikes in each window:
% for tk = 0:w:tmax-w
% nn = sum((times >= tk) & (times < tk+w));
% %nn = length(times((times >= tk) & (times < tk+w)));
% %nn = length(find((times >= tk) & (times < tk+w)));
% counts = [counts nn];
% end
% method 2: use the hist() function to do that!
tbins = 0.5*w:w:tmax-0.5*w;
nn = hist(times, tbins);
counts = [counts nn];
end
end

View File

@ -1,17 +0,0 @@
w = 0.1;
bins = 0.0:1.0:10.0;
counts{1} = spikecounts(poissonspikes, w);
counts{2} = spikecounts(pifouspikes, w);
counts{3} = spikecounts(lifadaptspikes, w);
titles = {'Poisson', 'PIF OU', 'LIF adapt'};
for k = 1:3
subplot(1, 3, k);
[h, b] = hist(counts{k}, bins);
bar(b, h/sum(h));
title(titles{k})
xlabel('Spike count');
xlim([-0.5, 8.5]);
ylim([0.0 0.8]);
end
savefigpdf(gcf, 'spikecountshists.pdf', 20, 7);

View File

@ -1,12 +0,0 @@
function r = spikerate(spikes, duration)
% returns the average spike rate of the spikes
% for the first duration seconds
% spikes: a cell array of vectors of spike times
rates = zeros(length(spikes),1);
for k = 1:length(spikes)
times = spikes{k};
rates(k) = sum(times<duration)/duration;
end
r = mean(rates);
end

View File

@ -1,35 +1,3 @@
BASENAME=pointprocesses
TEXFILES=$(wildcard $(BASENAME)??.tex)
EXERCISES=$(TEXFILES:.tex=.pdf)
SOLUTIONS=$(EXERCISES:pointprocesses%=pointprocesses-solutions%)
TEXFILES=$(wildcard pointprocesses-?.tex) psth.tex
.PHONY: pdf exercises solutions watch watchexercises watchsolutions clean
pdf : $(SOLUTIONS) $(EXERCISES)
exercises : $(EXERCISES)
solutions : $(SOLUTIONS)
$(SOLUTIONS) : pointprocesses-solutions%.pdf : pointprocesses%.tex instructions.tex
{ echo "\\documentclass[answers,12pt,a4paper,pdftex]{exam}"; sed -e '1d' $<; } > $(patsubst %.pdf,%.tex,$@)
pdflatex -interaction=scrollmode $(patsubst %.pdf,%.tex,$@) | tee /dev/stderr | fgrep -q "Rerun to get cross-references right" && pdflatex -interaction=scrollmode $(patsubst %.pdf,%.tex,$@) || true
rm $(patsubst %.pdf,%,$@).[!p]*
$(EXERCISES) : %.pdf : %.tex instructions.tex
pdflatex -interaction=scrollmode $< | tee /dev/stderr | fgrep -q "Rerun to get cross-references right" && pdflatex -interaction=scrollmode $< || true
watch :
while true; do ! make -q pdf && make pdf; sleep 0.5; done
watchexercises :
while true; do ! make -q exercises && make exercises; sleep 0.5; done
watchsolutions :
while true; do ! make -q solutions && make solutions; sleep 0.5; done
clean :
rm -f *~ *.aux *.log *.out
cleanup : clean
rm -f $(SOLUTIONS) $(EXERCISES)
include ../../exercises.mk

View File

@ -0,0 +1,25 @@
function n = counts(spikes, w)
% Count spikes in time windows.
%
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
% w: duration of window in seconds for computing the counts
%
% Returns:
% n: vector with spike counts
tmax = spikes{1}(end);
n = [];
for k = 1:length(spikes)
times = spikes{k};
% alternative 1: count the number of spikes in each window:
% for tk = 0:w:tmax-w
% nn = sum((times >= tk) & (times < tk+w));
% % nn = length(find((times >= tk) & (times < tk+w)));
% n = [n, nn];
% end
% alternative 2: use the hist() function to do that!
tbins = 0.5*w:w:tmax-0.5*w;
nn = hist(times, tbins);
n = [n, nn];
end
end
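A minimal usage sketch, assuming poissonspikes is a cell array of spike-time vectors as used elsewhere in this chapter (the variable name is only illustrative):

% count spikes in 100 ms windows and report basic statistics:
w = 0.1;
n = counts(poissonspikes, w);
fprintf('mean count: %.2f, count variance: %.2f\n', mean(n), var(n));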

View File

@ -1,18 +1,17 @@
function fanoplot(spikes, titles)
% computes and plots fano factor as a function of window size
% spikes: a cell array of vectors of spike times
% titles: string that is used as a title for the plots
% Plots the Fano factor as a function of window size.
%
% Arguments:
% spikes: a cell array of vectors of spike times
% titles: string that is used as a title for the plots
windows = logspace(-3.0, -0.5, 100);
mc = windows;
vc = windows;
ff = windows;
mc = zeros(1, length(windows));
vc = zeros(1, length(windows));
for j = 1:length(windows)
w = windows(j);
counts = spikecounts(spikes, w);
% statistics for current window:
mc(j) = mean(counts);
vc(j) = var(counts);
ff(j) = vc(j)/mc(j);
spikecounts = counts(spikes, w);
mc(j) = mean(spikecounts);
vc(j) = var(spikecounts);
end
subplot(1, 2, 1);
@ -22,7 +21,7 @@ function fanoplot(spikes, titles)
ylabel('Count variance');
subplot(1, 2, 2);
scatter(1000.0*windows, ff, 'filled');
scatter(1000.0*windows, vc ./ mc, 'filled');
title(titles);
xlabel('Window [ms]');
ylabel('Fano factor');
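The right panel shows the Fano factor, i.e. the count variance divided by the count mean, F = var(n)/mean(n), as a function of the window duration. A minimal usage sketch, assuming poissonspikes is a cell array of spike-time vectors; for a homogeneous Poisson process the Fano factor should stay close to one for all window sizes:

figure();
fanoplot(poissonspikes, 'Poisson');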

View File

@ -1,9 +1,9 @@
spikes{1} = poissonspikes;
spikes{2} = pifouspikes;
spikes{3} = lifadaptspikes;
idents = {'poisson', 'pifou', 'lifadapt'};
titles = {'poisson', 'pifou', 'lifadapt'};
for k = 1:3
figure(k)
fanoplot(spikes{k}, titles{k});
savefigpdf(gcf, sprintf('fanoplots%s.pdf', idents{k}), 20, 7);
savefigpdf(gcf, sprintf('fanoplots%s.pdf', titles{k}), 20, 7);
end

View File

@ -1,18 +0,0 @@
% generate spike times:
rate = 20.0;
spikes = hompoissonspikes( 10, rate, 50.0 );
% isi histogram:
isivec = isis( spikes );
isihist( isivec );
hold on
% theoretical density:
xmax = 5.0/rate;
x = 0:0.0001:xmax;
y = rate*exp(-rate*x);
plot( 1000.0*x, y, 'r', 'LineWidth', 3 );
% plot details:
title( sprintf( 'Poisson spike trains, rate=%g Hz, nisi=%d', rate, length( isivec ) ) )
xlim( [ 0.0 1000.0*xmax ] )
ylim( [ 0.0 1.1*rate ] )
legend( 'data', 'poisson' )
hold off

View File

@ -1,46 +0,0 @@
rates = 1:1:100;
avisi = [];
sdisi = [];
cvisi = [];
for rate = rates
spikes = hompoissonspikes( 10, rate, 100.0 );
isivec = isis( spikes );
av = mean( isivec );
sd = std( isivec );
cv = sd/av;
avisi = [ avisi av ];
sdisi = [ sdisi sd ];
cvisi = [ cvisi cv ];
end
f = figure;
subplot( 1, 3, 1 );
scatter( rates, 1000.0*avisi, 'b', 'filled' );
hold on;
plot( rates, 1000.0./rates, 'r' );
hold off;
xlabel( 'Rate \lambda [Hz]' );
ylim( [ 0 1000 ] );
title( 'Mean ISI [ms]' );
legend( 'simulation', 'theory 1/\lambda' );
subplot( 1, 3, 2 );
scatter( rates, 1000.0*sdisi, 'b', 'filled' );
hold on;
plot( rates, 1000.0./rates, 'r' );
hold off;
xlabel( 'Rate \lambda [Hz]' );
ylim( [ 0 1000 ] )
title( 'Standard deviation ISI [ms]' );
legend( 'simulation', 'theory 1/\lambda' );
subplot( 1, 3, 3 );
scatter( rates, cvisi, 'b', 'filled' );
hold on;
plot( rates, ones( size( rates ) ), 'r' );
hold off;
xlabel( 'Rate \lambda [Hz]' );
ylim( [ 0 2 ] )
title( 'CV' );
legend( 'simulation', 'theory' );

View File

@ -1,19 +0,0 @@
function spikes = hompoissonspikes( trials, rate, tmax )
% Generate spike times of a homogeneous Poisson process
% trials: number of trials that should be generated
% rate: the rate of the Poisson process in Hertz
% tmax: the duration of each trial in seconds
% returns a cell array of vectors of spike times
dt = 3.33e-5;
p = rate*dt;
if p > 0.2
p = 0.2; % cap the per-bin spike probability
dt = p/rate;
end
x = rand( trials, ceil(tmax/dt) );
spikes = cell( trials, 1 );
for k=1:trials
spikes{k} = find( x(k,:) < p ) * dt;
end
end
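The deleted generator above approximates the Poisson process by drawing, in each time bin of width dt, a spike with probability p = rate*dt. An equivalent sketch for a single trial that instead draws the interspike intervals directly from an exponential distribution (base MATLAB, no toolbox required):

% homogeneous Poisson spike train via exponentially distributed ISIs:
rate = 20.0;                                    % rate in Hertz
tmax = 50.0;                                    % trial duration in seconds
isivec = -log(rand(ceil(2*rate*tmax), 1))/rate; % more ISIs than needed
times = cumsum(isivec);                         % spike times
times = times(times <= tmax);                   % truncate to trial duration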

View File

@ -0,0 +1,29 @@
function [pdf, centers] = isihist(isis, binwidth)
% Compute normalized histogram of interspike intervals.
%
% [pdf, centers] = isihist(isis, binwidth)
%
% Arguments:
% isis: vector of interspike intervals in seconds
% binwidth: optional width in seconds to be used for the isi bins
%
% Returns:
% pdf: vector with pdf of interspike intervals in Hertz
% centers: vector with the centers of the interspike interval bins in seconds
if nargin < 2
% compute good binwidth:
nperbin = 200; % average number of data points per bin
bins = length(isis)/nperbin; % number of bins
binwidth = max(isis)/bins;
if binwidth < 5e-4 % half a millisecond
binwidth = 5e-4;
end
end
bins = 0.5*binwidth:binwidth:max(isis);
% histogram data:
[nelements, centers] = hist(isis, bins);
% normalization (integral = 1):
pdf = nelements / sum(nelements) / binwidth;
end
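A minimal usage sketch, assuming spikes is a cell array of spike-time vectors; it pools the intervals with the isis() helper and plots the normalized histogram with the time axis in milliseconds:

isivec = isis(spikes);                    % pool ISIs over all trials
[pdf, centers] = isihist(isivec, 0.001);  % 1 ms bins
bar(1000.0*centers, pdf);
xlabel('ISI [ms]');
ylabel('pdf [1/s]');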

Binary file not shown.

View File

@ -0,0 +1,16 @@
function isivec = isis(spikes)
% Collect the interspike intervals of all trials into a single vector.
%
% Arguments:
% spikes: a cell array of vectors of spike times in seconds
%
% Returns:
% isivec: a column vector with all the interspike intervals
isivec = [];
for k = 1:length(spikes)
difftimes = diff(spikes{k});
% difftimes(:) ensures a column vector
% regardless of the type of vector in spikes{k}
isivec = [isivec; difftimes(:)];
end
end

View File

@ -0,0 +1,21 @@
function [isicorr, lags] = isiserialcorr(isivec, maxlag)
% Serial correlations of interspike intervals.
%
% Arguments:
% isivec: vector of interspike intervals in seconds
% maxlag: the maximum lag
%
% Returns:
% isicorr: vector with the serial correlations for lag 0 to maxlag
% lags: vector with the lags corresponding to isicorr
lags = 0:maxlag;
isicorr = zeros(size(lags));
for k = 1:length(lags)
lag = lags(k);
if length(isivec) > lag+10 % ensure "enough" data
% NOTE: the arguments to corr must be column vectors!
% We ensure this already in the isis() function.
isicorr(k) = corr(isivec(1:end-lag), isivec(lag+1:end));
end
end
end
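A minimal usage sketch; isivec is a column vector of interspike intervals as returned by isis(). For a renewal process (e.g. a homogeneous Poisson process) the correlations at lags larger than zero should scatter around zero:

[isicorr, lags] = isiserialcorr(isivec, 10);
plot(lags, isicorr, '-o');
xlabel('Lag k');
ylabel('\rho_k');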

Some files were not shown because too many files have changed in this diff.