paper_2025/main.tex

\documentclass[a4paper, 12pt]{article}

\usepackage{parskip}
\usepackage{amsmath}
\usepackage{amssymb}
\usepackage[
backend=biber,
style=authoryear,
]{biblatex}
\addbibresource{cite.bib}

\title{Emergent intensity invariance in a physiologically inspired model of the grasshopper auditory system}
\author{Jona Hartling, Jan Benda}
\date{}

\begin{document}
\maketitle{}

\newcommand{\bp}{h_{\text{BP}}(t)} % Bandpass filter function
\newcommand{\lp}{h_{\text{LP}}(t)} % Lowpass filter function
\newcommand{\hp}{h_{\text{HP}}(t)} % Highpass filter function
\newcommand{\fc}{f_{\text{cut}}} % Filter cutoff frequency

\newcommand{\raw}{x} % Placeholder input signal
\newcommand{\filt}{\raw_{\text{filt}}} % Bandpass-filtered signal
\newcommand{\env}{\raw_{\text{env}}} % Signal envelope
\newcommand{\db}{\raw_{\text{dB}}} % Logarithmically scaled signal
\newcommand{\dbref}{\raw_{\text{ref}}} % Decibel reference intensity
\newcommand{\adapt}{\raw_{\text{adapt}}} % Adapted signal

\newcommand{\dec}{\log_{10}} % Logarithm base 10
\newcommand{\sigs}{\sigma_{\text{s}}} % Song standard deviation
\newcommand{\sign}{\sigma_{\eta}} % Noise standard deviation
\newcommand{\infint}{\int_{-\infty}^{+\infty}} % Indefinite integral
\newcommand{\thr}{\Theta_i} % Step function threshold value
\newcommand{\nl}{H(c_i\,-\,\thr)} % Shifted Heaviside step function

\newcommand{\bi}{b_{i,\Theta}} % Single threshold-constrained binary response
\newcommand{\feat}{f_{i,\Theta}} % Single threshold-constrained feature

\newcommand{\thp}{T_{\text{HP}}} % Highpass filter adaptation interval
\newcommand{\tlp}{T_{\text{LP}}} % Lowpass filter averaging interval
\newcommand{\pc}{p(c_i,\,T)} % Probability density (general interval)
\newcommand{\pclp}{p(c_i,\,\tlp)} % Probability density (lowpass interval)

\section{The sensory world of a grasshopper}

Strong dependence on acoustic signals for ranged communication\\
- Diverse species-specific sound repertoires and production mechanisms\\
- Different contexts/ranges: Stridulatory, mandibular, wings, walking sounds\\
- Mate attraction/evaluation, rival deterrence, loss-of-signal predator alarm\\
$\rightarrow$ Elaborate acoustic behaviors co-depend on reliable auditory perception

Songs = Amplitude-modulated (AM) broad-band acoustic signals\\
- Generated by stridulatory movement of hindlegs against forewings\\
- Shorter time scales: Characteristic temporal waveform pattern\\
- Longer time scales: High degree of periodicity (pattern repetition)\\
- Sound propagation: Signal intensity varies strongly with distance to sender\\
- Ectothermy: Temporal structure warps with temperature\\
$\rightarrow$ Sensory constraints imposed by properties of the acoustic signal itself

Multi-species, multi-individual communally inhabited environments\\
- Temporal overlap: Simultaneous singing across individuals/species common\\
- Frequency overlap: No/hardly any niche speciation into frequency bands\\
- "Biotic noise": Hetero-/conspecifics ("Another one's songs are my noise")\\
- "Abiotic noise": Wind, water, vegetation, anthropogenic\\
- Effects of habitat structure on sound propagation (landscape - soundscape)\\
$\rightarrow$ Sensory constraints imposed by the (acoustic) environment

Cluster of auditory challenges (interlocking constraints $\rightarrow$ tight coupling):\\
From continuous acoustic input, generate neuronal representations that...\\
1)...allow for the separation of relevant (song) events from ambient noise floor\\
2)...compensate for behaviorally non-informative song variability (invariances)\\
3)...carry sufficient information to characterize different song patterns,
recognize the ones produced by conspecifics, and make appropriate behavioral
decisions based on context (sender identity, song type, mate/rival quality)

How can the auditory system of grasshoppers meet these challenges?\\
- What are the minimum functional processing steps required?\\
- Which known neuronal mechanisms can implement these steps?\\
- Which and how many stages along the auditory pathway contribute?\\
$\rightarrow$ What are the limitations of the system as a whole?

How can a human observer conceive a grasshopper's auditory percepts?\\
- How to investigate the workings of the auditory pathway as a whole?\\
- How to systematically test effects and interactions of processing parameters?\\
- How to integrate the available knowledge on anatomy, physiology, ethology?\\
$\rightarrow$ Abstract, simplify, formalize $\rightarrow$ Functional model framework


\section{Developing a functional model of\\the grasshopper auditory pathway}


\subsection{Population-driven signal pre-processing}

"Pre-split portion" of the auditory pathway:\\
Tympanal membrane $\rightarrow$ Receptor neurons $\rightarrow$ Local interneurons

Similar response/filter properties within receptor/interneuron populations (\cite{clemens2011})\\
$\rightarrow$ One population-wide response trace per stage (no "single-cell resolution")

\textbf{Stage-specific processing steps and functional approximations:}

Initial: Continuous acoustic input signal $x(t)$

Filtering of behaviorally relevant frequencies by tympanal membrane\\
$\rightarrow$ Bandpass filter 5-30 kHz
\begin{equation}
    \filt(t)\,=\,\raw(t)\,*\,\bp, \qquad \fc\,=\,5\,\text{kHz},\,30\,\text{kHz}
    \label{eq:bandpass}
\end{equation}

Extraction of signal envelope (AM encoding) by receptor population\\
$\rightarrow$ Full-wave rectification, then lowpass filter 500 Hz
\begin{equation}
    \env(t)\,=\,|\filt(t)|\,*\,\lp, \qquad \fc\,=\,500\,\text{Hz}
    \label{eq:env}
\end{equation}

Logarithmically compressed intensity tuning curve of receptors\\
$\rightarrow$ Decibel transformation
\begin{equation}
    \db(t)\,=\,10\,\cdot\,\dec \frac{\env(t)}{\dbref}, \qquad \dbref\,=\,\max[\env(t)]
    \label{eq:log}
\end{equation}

Spike-frequency adaptation in receptor and interneuron populations\\
$\rightarrow$ Highpass filter 10 Hz
\begin{equation}
    \adapt(t)\,=\,\db(t)\,*\,\hp, \qquad \fc\,=\,10\,\text{Hz}
    \label{eq:highpass}
\end{equation}


\subsection{Feature extraction by individual neurons}

"Post-split portion" of the auditory pathway:\\
Ascending neurons (AN) $\rightarrow$ Central brain neurons

Diverse response/filter properties within AN population (\cite{clemens2011})\\
- Pathway splitting into several parallel branches\\
- Expansion into a decorrelated higher-dimensional sound representation\\
$\rightarrow$ Individual neuron-specific response traces from this stage onwards

\textbf{Stage-specific processing steps and functional approximations:}

Template matching by individual ANs\\
- Filter base (STA approximations): Set of Gabor kernels\\
- Gabor parameters: $\sigma, \phi, f$ $\rightarrow$ Determines kernel sign and lobe number
\begin{equation}
    k(t)\,=\,e^{-\frac{t^{2}}{2\sigma^{2}}}\,\cdot\,\sin(2\pi f t\,+\,\phi)
    \label{eq:gabor}
\end{equation}
$\rightarrow$ Separate convolution with each member of the kernel set
\begin{equation}
    c_i(t)\,=\,\adapt(t)\,*\,k_i(t)
    = \infint \adapt(\tau)\,\cdot\,k_i(t\,-\,\tau)\,d\tau
    \label{eq:conv}
\end{equation}

Thresholding nonlinearity in ascending neurons (or further downstream)\\
- Binarization of AN response traces into "relevant" vs. "irrelevant"\\
$\rightarrow$ Shifted Heaviside step-function $\nl$ (or steep sigmoid threshold?)
\begin{equation}
    \bi(t)\,=\,\begin{cases}
        \;1, \quad c_i(t)\,>\,\thr\\
        \;0, \quad c_i(t)\,\leq\,\thr
    \end{cases}
    \label{eq:binary}
\end{equation}

Temporal averaging by neurons of the central brain\\
- Finalized set of slowly changing kernel-specific features (one per AN)\\
- Different species-specific song patterns are characterized by a distinct combination
of feature values $\rightarrow$ Clusters in high-dimensional feature space\\
$\rightarrow$ Lowpass filter 1 Hz
\begin{equation}
    \feat(t)\,=\,\bi(t)\,*\,\lp, \qquad \fc\,=\,1\,\text{Hz}
    \label{eq:lowpass}
\end{equation}

\section{Two mechanisms driving the emergence of intensity-invariant song representation}

\subsection{Logarithmic scaling \& spike-frequency adaptation}

Envelope $\env(t)$ $\xrightarrow{\text{dB}}$ Logarithmic $\db(t)$ $\xrightarrow{\hp}$ Adapted $\adapt(t)$

- Rewrite signal envelope $\env(t)$ (Eq.\,\ref{eq:env}) as a synthetic mixture:\\
1) Song signal $s(t)$ ($\sigs=1$) with variable multiplicative scale $\alpha\geq0$\\
2) Fixed-scale additive noise $\eta(t)$ ($\sign=1$)
\begin{equation}
    \env(t)\,=\,\alpha\,\cdot\,s(t)\,+\,\eta(t),\qquad \env(t)\,>\,0\enspace\forall\enspace t\,\in\,\mathbb{R}
    \label{eq:toy_env}
\end{equation}

\textbf{Logarithmic component:}\\
- Apply decibel transformation (Eq.\,\ref{eq:log}) to synthetic $\env(t)$\\
- Isolate scale $\alpha$ and reference $\dbref$ using logarithm product/quotient laws
\begin{equation}
    \begin{split}
        \db(t)\,&=\,10\,\cdot\,\dec \frac{\alpha\,\cdot\,s(t)\,+\,\eta(t)}{\dbref}\\
        &=\,10\,\cdot\,\big(\dec \frac{\alpha}{\dbref}\,+\,\dec[s(t)\,+\,\frac{\eta(t)}{\alpha}]\big)
    \end{split}
    \label{eq:toy_log}
\end{equation}
$\rightarrow$ In log-space, a multiplicative scaling factor becomes additive\\
$\rightarrow$ Allows for the separation of song signal $s(t)$ and its scale $\alpha$\\
$\rightarrow$ Introduces scaling of noise term $\eta(t)$ by the inverse of $\alpha$\\
$\rightarrow$ Normalization by $\dbref$ applies equally to all terms (no individual effects)

\textbf{Adaptation component:}\\
- Highpass filter over logarithmically scaled $\db(t)$ (Eq.\,\ref{eq:highpass}) can
be approximated as subtraction of the signal offset (DC removal) within a suitable
time interval $\thp$ ($0 < \thp < \frac{1}{\fc}$)\\
\begin{equation}
    \begin{split}
    \adapt(t)\,\approx\,\db(t)\,-\,\dec \frac{\alpha}{\dbref}\,=\,\dec{[s(t)\,+\,\frac{\eta(t)}{\alpha}]}
    \end{split}
    \label{eq:toy_highpass}
\end{equation}

\subsection{Threshold nonlinearity \& temporal averaging}

Convolved $c_i(t)$ $\xrightarrow{\nl}$ Binary $\bi(t)$ $\xrightarrow{\lp}$ Feature $\feat(t)$

\textbf{Thresholding component:}\\
- Within an observed time interval $T$, $c_i(t)$ follows probability density $\pc$\\
- Within $T$, $c_i(t)$ exceeds threshold value $\thr$ for time $T_1$ ($T_1+T_0=T$)\\
- Threshold $\nl$ splits $\pc$ around $\thr$ in two complementary parts
\begin{equation}
    \int_{\thr}^{+\infty} p(c_i,T)\,dc_i\,=\,1\,-\,\int_{-\infty}^{\thr} p(c_i,T)\,dc_i\,=\,\frac{T_1}{T}
    \label{eq:pdf_split}
\end{equation}
$\rightarrow$ Semi-definite integral over right-sided portion of split $\pc$ gives ratio
of time $T_1$ where $c_i(t)>\thr$ to total time $T$ due to normalization of $\pc$
\begin{equation}
    \infint \pc\,dc_i\,=\,1
    \label{eq:pdf}
\end{equation}

\textbf{Averaging component:}\\
- Lowpass filter over binary response $\bi(t)$ (Eq.\,\ref{eq:lowpass}) can be
approximated as temporal averaging over a suitable time interval $\tlp$ ($\tlp > \frac{1}{\fc}$)\\
- Within $\tlp$, $\bi(t)$ takes a value of 1 ($c_i(t)>\thr$) for time $T_1$ ($T_1+T_0=\tlp$)
\begin{equation}
    \feat(t)\,\approx\,\frac{1}{\tlp} \int_{t}^{t\,+\,\tlp} \bi(\tau)\,d\tau\,=\,\frac{T_1}{\tlp}
    \label{eq:feat_avg}
\end{equation}
$\rightarrow$ Temporal averaging over $\bi(t)\in[0,1]$ (Eq.\ref{eq:binary}) gives
ratio of time $T_1$ where $c_i(t)>\thr$ to total averaging interval $\tlp$\\
$\rightarrow$ Feature $\feat(t)$ approximately represents supra-threshold fraction of $\tlp$

\textbf{Combined result:}\\
- Feature $\feat(t)$ can be linked to the distribution of $c_i(t)$ using Eqs.\,\ref{eq:pdf_split} \& \ref{eq:feat_avg}
\begin{equation}
    \feat(t)\,\approx\,\int_{\thr}^{+\infty} \pclp\,dc_i\,=\,P(c_i\,>\,\thr,\,\tlp)
    \label{eq:feat_prop}
\end{equation}
$\rightarrow$ Because the integral over a probability density is a cumulative
probability, the value of feature $\feat(t)$ (temporal compression of $\bi(t)$)
at every time point $t$ signifies the probability that convolution output
$c_i(t)$ exceeds the threshold value $\thr$ during the corresponding averaging
interval $\tlp$

\textbf{Implication for intensity invariance:}\\
- Convolution output $c_i(t)$ = amplitude-based quantity\\
$\rightarrow$ Values indicate how well template waveform $k_i(t)$ matches signal $x(t)$\\
- Feature $\feat(t)$ = duty cycle-based quantity\\
$\rightarrow$ Values indicate how often $c_i(t)$ exceeds threshold value $\thr$

- Thresholding of $c_i(t)$ and subsequent temporal averaging of $\bi(t)$ to obtain $\feat(t)$
constitutes a remapping of an amplitude-based quantity (values indicating the match between) into a duty cycle-based quantity\\

\section{Discriminating species-specific song\\patterns in feature space}


\section{Conclusions \& outlook}

\end{document}