Added .gitignore that currently only excludes contents of ./data/.
This commit is contained in:
112
main.tex
112
main.tex
@@ -10,8 +10,11 @@
|
||||
\usepackage{parskip}
|
||||
\usepackage{amsmath}
|
||||
\usepackage{amssymb}
|
||||
\usepackage{subcaption}
|
||||
\usepackage{subcaption}
|
||||
\usepackage[labelfont=bf, textfont=small]{caption}
|
||||
\usepackage[german,english]{babel}
|
||||
\addto\captionsenglish{\renewcommand{\figurename}{Fig.}}
|
||||
\addto\captionsenglish{\renewcommand{\tablename}{Tab.}}
|
||||
\usepackage[separate-uncertainty=true, locale=DE]{siunitx}
|
||||
\sisetup{output-exponent-marker=\ensuremath{\mathrm{e}}}
|
||||
% \usepackage[capitalize]{cleveref}
|
||||
@@ -66,14 +69,18 @@
|
||||
\newcommand{\kf}{\omega} % Unspecific Gabor kernel frequency
|
||||
\newcommand{\kp}{\phi} % Unspecific Gabor kernel phase
|
||||
\newcommand{\kn}{n} % Unspecific Gabor kernel lobe number
|
||||
\newcommand{\ks}{s} % Unspecific Gabor kernel sign
|
||||
% \newcommand{\ks}{s} % Unspecific Gabor kernel sign
|
||||
\newcommand{\kwi}{\kw_i} % Specific Gabor kernel width
|
||||
\newcommand{\kfi}{\kf_i} % Specific Gabor kernel frequency
|
||||
\newcommand{\kpi}{\kp_i} % Specific Gabor kernel phase
|
||||
\newcommand{\kni}{\kn_i} % Specific Gabor kernel lobe number
|
||||
\newcommand{\ksi}{\ks_i} % Specific Gabor kernel sign
|
||||
\newcommand{\rh}{\text{RH}} % Relative Gaussian height for FWRH
|
||||
% \newcommand{\ksi}{\ks_i} % Specific Gabor kernel sign
|
||||
|
||||
% Math shorthands - Auxiliary kernel parameters:
|
||||
\newcommand{\fsin}{f_{\text{sin}}} % Carrier frequency
|
||||
\newcommand{\rh}{h_{\text{rel}}} % Relative Gaussian height for FWRH
|
||||
\newcommand{\fwrh}{\text{FWRH}} % Gaussian full-width at relative height
|
||||
\newcommand{\off}{\beta_0} % Offset for linear frequency approximation
|
||||
|
||||
% Math shorthands - Threshold nonlinearity:
|
||||
\newcommand{\thr}{\Theta_i} % Step function threshold value
|
||||
@@ -421,58 +428,62 @@ ascending neuron. We use Gabor kernels as basis functions for creating
|
||||
different template patterns. An arbitrary one-dimensional, real Gabor kernel is
|
||||
generated by multiplication of a Gaussian envelope and a sinusoidal carrier
|
||||
\begin{equation}
|
||||
k_i(t,\,\kwi,\,\kfi,\,\kpi)\,=\,e^{-\frac{t^{2}}{2{\kwi}^{2}}}\,\cdot\,\sin(\kfi\,t\,+\,\kpi), \qquad \kfi\,=\,2\pi f_{sin}
|
||||
k_i(t,\,\kwi,\,\kfi,\,\kpi)\,=\,e^{-\frac{t^{2}}{2{\kwi}^{2}}}\,\cdot\,\sin(\kfi\,t\,+\,\kpi), \qquad \kfi\,=\,2\pi\fsin
|
||||
\label{eq:gabor}
|
||||
\end{equation}
|
||||
with Gaussian standard deviation or kernel width $\kwi$, carrier frequency
|
||||
$\kfi$, and carrier phase $\kpi$. Different combinations of $\kw$, $\kf$, and
|
||||
$\kp$ result in Gabor kernels with different lobe number $\kn$, which is the
|
||||
number of half-periods of the carrier that fit under the Gaussian envelope
|
||||
within reasonable limits of attenuation. These limits are a matter of
|
||||
definition, since the Gaussian function never fully decays to zero. A good
|
||||
measure is the Gaussian full-width at relative height, which can be calculated
|
||||
as
|
||||
$\kfi$, and carrier phase $\kpi$. Different combinations of $\kw$ and $\kf$
|
||||
result in Gabor kernels with different lobe number $\kn$, which is the number
|
||||
of half-periods of the carrier that fit under the Gaussian envelope within
|
||||
reasonable limits of attenuation. The interval under the Gaussian envelope that
|
||||
contains the relevant lobes of the kernel can be defined as Gaussian full-width
|
||||
measured at relative peak height $\rh$
|
||||
\begin{equation}
|
||||
\fwrh(\kw,\,\rh)\,=\,2\,\cdot\,\sqrt{-2\,\ln \rh}\cdot\,\kw, \qquad \rh\,\in\,(0,\,1]
|
||||
\fwrh(\kw,\,\rh)\,=\,2\,\cdot\,\sqrt{-2\,\cdot\,\ln \rh}\cdot\,\kw, \qquad \rh\,\in\,(0,\,1]
|
||||
\end{equation}
|
||||
With this, an appropriate carrier frequency $\kf$ for obtaining a Gabor kernel
|
||||
with width $\kw$ and a desired lobe number $\kn$ can be approximated as
|
||||
with width $\kw$ and desired lobe number $\kn$ can be approximated as
|
||||
% \begin{equation}
|
||||
% \kf(\kn,\,\fwrh)\,=\,\frac{0.5\,\cdot\,\kn\,+\,\off}{\fwrh}, \qquad \kn\,\geq\,2\enspace\forall\enspace \kn\,\in\,\mathbb{Z}
|
||||
% \end{equation}
|
||||
\begin{equation}
|
||||
\kf(\kn,\,\fwrh)\,=\,\frac{0.5\,\cdot\,\kn\,+\,0.5}{\fwrh}
|
||||
\kf(\kn,\,\kw,\,\rh)\,=\,\frac{\kn\,+\,\off}{4\,\cdot\,\sqrt{-2\,\cdot\,\ln \rh}}, \qquad \kn\,\geq\,2\enspace\forall\enspace \kn\,\in\,\mathbb{Z}
|
||||
\end{equation}
|
||||
We restrict the Gabor kernels to be either even functions~(mirror-symmetric,
|
||||
uneven $\kn$) or odd functions~(point-symmetric, even $\kn$). Under this
|
||||
condition, phase $\kp$ is related to lobe number $\kn$ by
|
||||
\begin{equation}
|
||||
\kp(\kn,\,\ks)\,=\,0.5\,\cdot\,(1\,-\,\text{mod}[\kn,\,2]\,+\,\ks)
|
||||
\label{eq:gabor_phase}
|
||||
\end{equation}
|
||||
which results in the specific phase values shown in
|
||||
Table\,\mbox{\ref{tab:gabor_phase}}.
|
||||
where $\off$ is a small positive offset to the near-linear relationship between
|
||||
$\kf$ and $\kn$ to balance the amplitude of the $\kn$ desired lobes of the
|
||||
kernel --- which should be maximized --- against the amplitude of the
|
||||
next-outer lobes, which should not exceed the threshold value determined by
|
||||
$\rh$. For $\kn=1$, carrier frequency $\kf$ is set to zero, which results in a
|
||||
simple Gaussian kernel. Carrier phase $\kp$ determines the position of the
|
||||
kernel lobes relative to the kernel center. By setting $\kp$ to one of only
|
||||
four specific phase values~(Tab.\,\ref{tab:gabor_phases}), we restrict the
|
||||
Gabor kernels to be either even functions~(mirror-symmetric, uneven $\kn$) or
|
||||
odd functions~(point-symmetric, even $\kn$) with either positive or negative
|
||||
sign, which refers to the sign of the kernel's central lobe (even kernels) or
|
||||
the left of the two central lobes (odd kernels).
|
||||
\FloatBarrier
|
||||
\begin{table}[!ht]
|
||||
\centering
|
||||
\captionsetup{width=.55\textwidth}
|
||||
\caption{}
|
||||
\captionsetup{width=.46\textwidth}
|
||||
\caption{Values of phase $\kp$ that are specific for the four major groups
|
||||
of Gabor kernels.}
|
||||
\begin{tabular}{|ccc|}
|
||||
\hline
|
||||
sign $\ks$ & even $\kn$ & odd $\kn$\\
|
||||
sign & even kernels & odd kernels\\
|
||||
\hline
|
||||
+1 & $+\pi\,/\,2$ & $\pi$\\
|
||||
-1 & $-\pi\,/\,2$ & $0$\\
|
||||
$+$ & $+\pi\,/\,2$ & $\pi$\\
|
||||
$-$ & $-\pi\,/\,2$ & $0$\\
|
||||
\hline
|
||||
\end{tabular}
|
||||
\label{tab:gabor_phase}
|
||||
\label{tab:gabor_phases}
|
||||
\end{table}
|
||||
\FloatBarrier
|
||||
|
||||
|
||||
\textbf{Stage-specific processing steps and functional approximations:}
|
||||
|
||||
Thresholding nonlinearity in ascending neurons (or further downstream)\\
|
||||
- Binarization of AN response traces into "relevant" vs. "irrelevant"\\
|
||||
$\rightarrow$ Shifted Heaviside step-function $\nl$ (or steep sigmoid threshold?)
|
||||
%
|
||||
These four groups of Gabor kernels allow for the extraction of different types
|
||||
of signal features, such as the presence of peaks (even, $+$), troughs (even,
|
||||
$-$), onsets (odd, $+$), and offsets (odd, $-$) at various time scales.
|
||||
Following the convolutional template matching, each kernel-specific response
|
||||
$c_i(t)$ is passed through a shifted Heaviside step-function $\nl$ with threshold
|
||||
value $\thr$ to obtain a binary response
|
||||
\begin{equation}
|
||||
b_i(t,\,\thr)\,=\,\begin{cases}
|
||||
\;1, \quad c_i(t)\,>\,\thr\\
|
||||
@@ -480,18 +491,23 @@ $\rightarrow$ Shifted Heaviside step-function $\nl$ (or steep sigmoid threshold?
|
||||
\end{cases}
|
||||
\label{eq:binary}
|
||||
\end{equation}
|
||||
%
|
||||
Temporal averaging by neurons of the central brain\\
|
||||
- Finalized set of slowly changing kernel-specific features (one per AN)\\
|
||||
- Different species-specific song patterns are characterized by a distinct combination
|
||||
of feature values $\rightarrow$ Clusters in high-dimensional feature space\\
|
||||
$\rightarrow$ Lowpass filter 1 Hz
|
||||
%
|
||||
which can be thought of as a categorization into "relevant" and "irrelevant"
|
||||
response values. In the grasshopper, these threshold nonlinearities might
|
||||
either be part of the processing within the ascending neurons or take place
|
||||
further downstream~(SOURCE). Finally, the responses of the ascending neurons
|
||||
are assumed to be integrated somewhere in the supraesophageal
|
||||
ganglion~(\bcite{ronacher1986routes}; \bcite{bauer1987separate};
|
||||
\bcite{bhavsar2017brain}). This processing step can be approximated as temporal
|
||||
averaging of the binary responses $b_i(t)$ by a lowpass filter
|
||||
\begin{equation}
|
||||
f_i(t)\,=\,b_i(t)\,*\,\lp, \qquad \fc\,=\,1\,\text{Hz}
|
||||
\label{eq:lowpass}
|
||||
\end{equation}
|
||||
%
|
||||
to obtain a final set of slowly changing kernel-specific features $f_i(t)$. In
|
||||
the resulting high-dimensional feature space, different species-specific song
|
||||
patterns are characterized by a distinct combination of feature values, which
|
||||
can be read out by a simple linear classifier.
|
||||
|
||||
\section{Two mechanisms driving the emergence of intensity-invariant song representation}
|
||||
|
||||
\textbf{Definition of invariance (general, systemic):}\\
|
||||
@@ -671,4 +687,8 @@ initiation of one behavior over another is categorical (e.g. approach/stay)
|
||||
|
||||
\section{Conclusions \& outlook}
|
||||
|
||||
The model pathway includes a rather large number of Gabor kernels compared to
|
||||
the 15 to 20 ascending neurons in the grasshopper auditory
|
||||
system~(\bcite{stumpner1991auditory}).
|
||||
|
||||
\end{document}
|
||||
Reference in New Issue
Block a user