Done bullet-pointing LHP invariance, nearly done with THP invariance.

This commit is contained in:
j-hartling 2025-11-13 16:52:22 +01:00
parent 53e43f61f5
commit 2b9f411a06
6 changed files with 113 additions and 48 deletions

View File

@ -17,17 +17,18 @@
\newlabel{eq:gabor}{{5}{3}{}{}{}} \newlabel{eq:gabor}{{5}{3}{}{}{}}
\newlabel{eq:conv}{{6}{3}{}{}{}} \newlabel{eq:conv}{{6}{3}{}{}{}}
\newlabel{eq:binary}{{7}{3}{}{}{}} \newlabel{eq:binary}{{7}{3}{}{}{}}
\newlabel{eq:lowpass}{{8}{4}{}{}{}} \newlabel{eq:lowpass}{{8}{3}{}{}{}}
\@writefile{toc}{\contentsline {section}{\numberline {3}Two mechanisms driving the emergence of intensity-invariant song representation}{4}{}\protected@file@percent } \@writefile{toc}{\contentsline {section}{\numberline {3}Two mechanisms driving the emergence of intensity-invariant song representation}{4}{}\protected@file@percent }
\@writefile{toc}{\contentsline {subsection}{\numberline {3.1}Logarithmic scaling \& spike-frequency adaptation}{4}{}\protected@file@percent } \@writefile{toc}{\contentsline {subsection}{\numberline {3.1}Logarithmic scaling \& spike-frequency adaptation}{4}{}\protected@file@percent }
\newlabel{eq:toy_env}{{9}{4}{}{}{}} \newlabel{eq:toy_env}{{9}{4}{}{}{}}
\newlabel{eq:toy_log}{{10}{4}{}{}{}} \newlabel{eq:toy_snr}{{10}{4}{}{}{}}
\newlabel{eq:toy_highpass}{{11}{4}{}{}{}} \newlabel{eq:toy_log}{{11}{4}{}{}{}}
\newlabel{eq:toy_highpass}{{12}{4}{}{}{}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.2}Threshold nonlinearity \& temporal averaging}{5}{}\protected@file@percent } \@writefile{toc}{\contentsline {subsection}{\numberline {3.2}Threshold nonlinearity \& temporal averaging}{5}{}\protected@file@percent }
\newlabel{eq:pdf_split}{{12}{5}{}{}{}} \newlabel{eq:pdf_split}{{13}{5}{}{}{}}
\newlabel{eq:pdf}{{13}{5}{}{}{}} \newlabel{eq:pdf}{{14}{5}{}{}{}}
\newlabel{eq:feat_avg}{{14}{5}{}{}{}} \newlabel{eq:feat_avg}{{15}{5}{}{}{}}
\newlabel{eq:feat_prop}{{15}{5}{}{}{}} \newlabel{eq:feat_prop}{{16}{6}{}{}{}}
\@writefile{toc}{\contentsline {section}{\numberline {4}Discriminating species-specific song\\patterns in feature space}{6}{}\protected@file@percent } \@writefile{toc}{\contentsline {section}{\numberline {4}Discriminating species-specific song\\patterns in feature space}{6}{}\protected@file@percent }
\@writefile{toc}{\contentsline {section}{\numberline {5}Conclusions \& outlook}{6}{}\protected@file@percent } \@writefile{toc}{\contentsline {section}{\numberline {5}Conclusions \& outlook}{6}{}\protected@file@percent }
\abx@aux@read@bbl@mdfivesum{D9585839A1478809D4C6E9E5BFFC8FE4} \abx@aux@read@bbl@mdfivesum{D9585839A1478809D4C6E9E5BFFC8FE4}

View File

@ -1,14 +1,14 @@
# Fdb version 4 # Fdb version 4
["biber main"] 0 "main.bcf" "main.bbl" "main" 1762872619.20857 -1 ["biber main"] 0 "main.bcf" "main.bbl" "main" 1763049091.30626 -1
"cite.bib" 1762424399.63955 252 7fc49109df64576e199ce34111f01817 "" "cite.bib" 1762424399.63955 252 7fc49109df64576e199ce34111f01817 ""
"main.bcf" 1762872619.1766 107531 bb4289418b1a6604c7c781cbf02f8242 "pdflatex" "main.bcf" 1763049091.2738 107531 bb4289418b1a6604c7c781cbf02f8242 "pdflatex"
(generated) (generated)
"main.bbl" "main.bbl"
"main.blg" "main.blg"
(rewritten before read) (rewritten before read)
["pdflatex"] 1762872618.80069 "/home/hartling/phd/paper/paper_2025/main.tex" "main.pdf" "main" 1762872619.20877 0 ["pdflatex"] 1763049090.88497 "/home/hartling/phd/paper/paper_2025/main.tex" "main.pdf" "main" 1763049091.30646 0
"/etc/texmf/web2c/texmf.cnf" 1761560044.43676 475 c0e671620eb5563b2130f56340a5fde8 "" "/etc/texmf/web2c/texmf.cnf" 1761560044.43676 475 c0e671620eb5563b2130f56340a5fde8 ""
"/home/hartling/phd/paper/paper_2025/main.tex" 1762872618.31261 12714 174d8417d0722be3e50c61997690350b "" "/home/hartling/phd/paper/paper_2025/main.tex" 1763049090.80581 14802 bc1953ed33dca011873a94b8381b353a ""
"/usr/share/texlive/texmf-dist/fonts/map/fontname/texfonts.map" 1577235249 3524 cb3e574dea2d1052e39280babc910dc8 "" "/usr/share/texlive/texmf-dist/fonts/map/fontname/texfonts.map" 1577235249 3524 cb3e574dea2d1052e39280babc910dc8 ""
"/usr/share/texlive/texmf-dist/fonts/tfm/public/amsfonts/cmextra/cmex7.tfm" 1246382020 1004 54797486969f23fa377b128694d548df "" "/usr/share/texlive/texmf-dist/fonts/tfm/public/amsfonts/cmextra/cmex7.tfm" 1246382020 1004 54797486969f23fa377b128694d548df ""
"/usr/share/texlive/texmf-dist/fonts/tfm/public/amsfonts/cmextra/cmex8.tfm" 1246382020 988 bdf658c3bfc2d96d3c8b02cfc1c94c20 "" "/usr/share/texlive/texmf-dist/fonts/tfm/public/amsfonts/cmextra/cmex8.tfm" 1246382020 988 bdf658c3bfc2d96d3c8b02cfc1c94c20 ""
@ -81,10 +81,10 @@
"/usr/share/texmf/web2c/texmf.cnf" 1707919699 40399 f2c302f7d2af602abb742093540a5834 "" "/usr/share/texmf/web2c/texmf.cnf" 1707919699 40399 f2c302f7d2af602abb742093540a5834 ""
"/var/lib/texmf/fonts/map/pdftex/updmap/pdftex.map" 1761648465.84635 5472669 54eaf61a88b6b7896ebd0dac973cb29c "" "/var/lib/texmf/fonts/map/pdftex/updmap/pdftex.map" 1761648465.84635 5472669 54eaf61a88b6b7896ebd0dac973cb29c ""
"/var/lib/texmf/web2c/pdftex/pdflatex.fmt" 1761648508 8213325 7fd20752ab46ff9aa583e4973d7433df "" "/var/lib/texmf/web2c/pdftex/pdflatex.fmt" 1761648508 8213325 7fd20752ab46ff9aa583e4973d7433df ""
"main.aux" 1762872619.1756 2095 e1147be531e57b160e5a1f27b419d862 "pdflatex" "main.aux" 1763049091.2728 2132 0170975d330d9f141156fd1cd9431731 "pdflatex"
"main.bbl" 1762858512.77528 2032 d9585839a1478809d4c6e9e5bffc8fe4 "biber main" "main.bbl" 1762945661.89497 2032 d9585839a1478809d4c6e9e5bffc8fe4 "biber main"
"main.run.xml" 1762872619.1776 2305 d0067550f22ade5b49f22d40cea22838 "pdflatex" "main.run.xml" 1763049091.2738 2305 d0067550f22ade5b49f22d40cea22838 "pdflatex"
"main.tex" 1762872618.31261 12714 174d8417d0722be3e50c61997690350b "" "main.tex" 1763049090.80581 14802 bc1953ed33dca011873a94b8381b353a ""
(generated) (generated)
"main.aux" "main.aux"
"main.bcf" "main.bcf"

View File

@ -1,4 +1,4 @@
This is pdfTeX, Version 3.141592653-2.6-1.40.25 (TeX Live 2023/Debian) (preloaded format=pdflatex 2025.10.28) 11 NOV 2025 15:50 This is pdfTeX, Version 3.141592653-2.6-1.40.25 (TeX Live 2023/Debian) (preloaded format=pdflatex 2025.10.28) 13 NOV 2025 16:51
entering extended mode entering extended mode
restricted \write18 enabled. restricted \write18 enabled.
file:line:error style messages enabled. file:line:error style messages enabled.
@ -398,17 +398,22 @@ Overfull \hbox (3.81674pt too wide) in paragraph at lines 70--77
[1 [1
{/var/lib/texmf/fonts/map/pdftex/updmap/pdftex.map}] [2] [3] {/var/lib/texmf/fonts/map/pdftex/updmap/pdftex.map}] [2] [3] [4] [5]
Underfull \hbox (badness 10000) in paragraph at lines 211--215 Underfull \hbox (badness 10000) in paragraph at lines 311--314
[] []
[4]
Underfull \hbox (badness 10000) in paragraph at lines 271--273 Overfull \hbox (2.79701pt too wide) in paragraph at lines 315--318
[]$\OMS/cmsy/m/n/12 !$ \OT1/cmr/m/n/12 Val-ues in-di-cate cor-re-spon-dence be-tween a tem-plate wave-form $\OML/cmm/m/it/12 k[]\OT1/cmr/m/n/12 (\OML/cmm/m/it/12 t\OT1/cmr/m/n/12 )$ matches
[]
Underfull \hbox (badness 10000) in paragraph at lines 330--332
[] []
[5] [6] (./main.aux) [6] (./main.aux)
*********** ***********
LaTeX2e <2023-11-01> patch level 1 LaTeX2e <2023-11-01> patch level 1
L3 programming layer <2024-01-22> L3 programming layer <2024-01-22>
@ -418,15 +423,15 @@ Package logreq Info: Writing requests to 'main.run.xml'.
) )
Here is how much of TeX's memory you used: Here is how much of TeX's memory you used:
9882 strings out of 474222 9883 strings out of 474222
184270 string characters out of 5748732 184282 string characters out of 5748732
1935975 words of memory out of 5000000 1936975 words of memory out of 5000000
32077 multiletter control sequences out of 15000+600000 32078 multiletter control sequences out of 15000+600000
566832 words of font info for 70 fonts, out of 8000000 for 9000 566832 words of font info for 70 fonts, out of 8000000 for 9000
1141 hyphenation exceptions out of 8191 1141 hyphenation exceptions out of 8191
66i,19n,81p,713b,973s stack positions out of 10000i,1000n,20000p,200000b,200000s 66i,19n,81p,713b,973s stack positions out of 10000i,1000n,20000p,200000b,200000s
</usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmbx12.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmex10.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmmi12.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmmi6.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmmi8.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmr12.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmr17.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmr6.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmr8.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmsy10.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmsy8.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/symbols/msbm10.pfb> </usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmbx12.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmex10.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmmi12.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmmi6.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmmi8.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmr12.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmr17.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmr6.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmr8.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmsy10.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/cm/cmsy8.pfb></usr/share/texlive/texmf-dist/fonts/type1/public/amsfonts/symbols/msbm10.pfb>
Output written on main.pdf (6 pages, 146175 bytes). Output written on main.pdf (6 pages, 148721 bytes).
PDF statistics: PDF statistics:
83 PDF objects out of 1000 (max. 8388607) 83 PDF objects out of 1000 (max. 8388607)
50 compressed objects within 1 object stream 50 compressed objects within 1 object stream

BIN
main.pdf

Binary file not shown.

Binary file not shown.

103
main.tex
View File

@ -29,8 +29,8 @@ style=authoryear,
\newcommand{\adapt}{\raw_{\text{adapt}}} % Adapted signal \newcommand{\adapt}{\raw_{\text{adapt}}} % Adapted signal
\newcommand{\dec}{\log_{10}} % Logarithm base 10 \newcommand{\dec}{\log_{10}} % Logarithm base 10
\newcommand{\sigs}{\sigma_{\text{s}}} % Song standard deviation \newcommand{\svar}{\sigma_{\text{s}}^{2}} % Song signal variance
\newcommand{\sign}{\sigma_{\eta}} % Noise standard deviation \newcommand{\nvar}{\sigma_{\eta}^{2}} % Noise signal variance
\newcommand{\infint}{\int_{-\infty}^{+\infty}} % Indefinite integral \newcommand{\infint}{\int_{-\infty}^{+\infty}} % Indefinite integral
\newcommand{\thr}{\Theta_i} % Step function threshold value \newcommand{\thr}{\Theta_i} % Step function threshold value
\newcommand{\nl}{H(c_i\,-\,\thr)} % Shifted Heaviside step function \newcommand{\nl}{H(c_i\,-\,\thr)} % Shifted Heaviside step function
@ -105,33 +105,36 @@ Initial: Continuous acoustic input signal $x(t)$
Filtering of behaviorally relevant frequencies by tympanal membrane\\ Filtering of behaviorally relevant frequencies by tympanal membrane\\
$\rightarrow$ Bandpass filter 5-30 kHz $\rightarrow$ Bandpass filter 5-30 kHz
%
\begin{equation} \begin{equation}
\filt(t)\,=\,\raw(t)\,*\,\bp, \qquad \fc\,=\,5\,\text{kHz},\,30\,\text{kHz} \filt(t)\,=\,\raw(t)\,*\,\bp, \qquad \fc\,=\,5\,\text{kHz},\,30\,\text{kHz}
\label{eq:bandpass} \label{eq:bandpass}
\end{equation} \end{equation}
%
Extraction of signal envelope (AM encoding) by receptor population\\ Extraction of signal envelope (AM encoding) by receptor population\\
$\rightarrow$ Full-wave rectification, then lowpass filter 500 Hz $\rightarrow$ Full-wave rectification, then lowpass filter 500 Hz
%
\begin{equation} \begin{equation}
\env(t)\,=\,|\filt(t)|\,*\,\lp, \qquad \fc\,=\,500\,\text{Hz} \env(t)\,=\,|\filt(t)|\,*\,\lp, \qquad \fc\,=\,500\,\text{Hz}
\label{eq:env} \label{eq:env}
\end{equation} \end{equation}
%
Logarithmically compressed intensity tuning curve of receptors\\ Logarithmically compressed intensity tuning curve of receptors\\
$\rightarrow$ Decibel transformation $\rightarrow$ Decibel transformation
%
\begin{equation} \begin{equation}
\db(t)\,=\,10\,\cdot\,\dec \frac{\env(t)}{\dbref}, \qquad \dbref\,=\,\max[\env(t)] \db(t)\,=\,10\,\cdot\,\dec \frac{\env(t)}{\dbref}, \qquad \dbref\,=\,\max[\env(t)]
\label{eq:log} \label{eq:log}
\end{equation} \end{equation}
%
Spike-frequency adaptation in receptor and interneuron populations\\ Spike-frequency adaptation in receptor and interneuron populations\\
$\rightarrow$ Highpass filter 10 Hz $\rightarrow$ Highpass filter 10 Hz
%
\begin{equation} \begin{equation}
\adapt(t)\,=\,\db(t)\,*\,\hp, \qquad \fc\,=\,10\,\text{Hz} \adapt(t)\,=\,\db(t)\,*\,\hp, \qquad \fc\,=\,10\,\text{Hz}
\label{eq:highpass} \label{eq:highpass}
\end{equation} \end{equation}
%
\subsection{Feature extraction by individual neurons} \subsection{Feature extraction by individual neurons}
"Post-split portion" of the auditory pathway:\\ "Post-split portion" of the auditory pathway:\\
@ -147,20 +150,24 @@ $\rightarrow$ Individual neuron-specific response traces from this stage onwards
Template matching by individual ANs\\ Template matching by individual ANs\\
- Filter base (STA approximations): Set of Gabor kernels\\ - Filter base (STA approximations): Set of Gabor kernels\\
- Gabor parameters: $\sigma, \phi, f$ $\rightarrow$ Determines kernel sign and lobe number - Gabor parameters: $\sigma, \phi, f$ $\rightarrow$ Determines kernel sign and lobe number
%
\begin{equation} \begin{equation}
k(t)\,=\,e^{-\frac{t^{2}}{2\sigma^{2}}}\,\cdot\,\sin(2\pi f t\,+\,\phi) k(t)\,=\,e^{-\frac{t^{2}}{2\sigma^{2}}}\,\cdot\,\sin(2\pi f t\,+\,\phi)
\label{eq:gabor} \label{eq:gabor}
\end{equation} \end{equation}
%
$\rightarrow$ Separate convolution with each member of the kernel set $\rightarrow$ Separate convolution with each member of the kernel set
%
\begin{equation} \begin{equation}
c_i(t)\,=\,\adapt(t)\,*\,k_i(t) c_i(t)\,=\,\adapt(t)\,*\,k_i(t)
= \infint \adapt(\tau)\,\cdot\,k_i(t\,-\,\tau)\,d\tau = \infint \adapt(\tau)\,\cdot\,k_i(t\,-\,\tau)\,d\tau
\label{eq:conv} \label{eq:conv}
\end{equation} \end{equation}
%
Thresholding nonlinearity in ascending neurons (or further downstream)\\ Thresholding nonlinearity in ascending neurons (or further downstream)\\
- Binarization of AN response traces into "relevant" vs. "irrelevant"\\ - Binarization of AN response traces into "relevant" vs. "irrelevant"\\
$\rightarrow$ Shifted Heaviside step-function $\nl$ (or steep sigmoid threshold?) $\rightarrow$ Shifted Heaviside step-function $\nl$ (or steep sigmoid threshold?)
%
\begin{equation} \begin{equation}
\bi(t)\,=\,\begin{cases} \bi(t)\,=\,\begin{cases}
\;1, \quad c_i(t)\,>\,\thr\\ \;1, \quad c_i(t)\,>\,\thr\\
@ -168,17 +175,18 @@ $\rightarrow$ Shifted Heaviside step-function $\nl$ (or steep sigmoid threshold?
\end{cases} \end{cases}
\label{eq:binary} \label{eq:binary}
\end{equation} \end{equation}
%
Temporal averaging by neurons of the central brain\\ Temporal averaging by neurons of the central brain\\
- Finalized set of slowly changing kernel-specific features (one per AN)\\ - Finalized set of slowly changing kernel-specific features (one per AN)\\
- Different species-specific song patterns are characterized by a distinct combination - Different species-specific song patterns are characterized by a distinct combination
of feature values $\rightarrow$ Clusters in high-dimensional feature space\\ of feature values $\rightarrow$ Clusters in high-dimensional feature space\\
$\rightarrow$ Lowpass filter 1 Hz $\rightarrow$ Lowpass filter 1 Hz
%
\begin{equation} \begin{equation}
\feat(t)\,=\,\bi(t)\,*\,\lp, \qquad \fc\,=\,1\,\text{Hz} \feat(t)\,=\,\bi(t)\,*\,\lp, \qquad \fc\,=\,1\,\text{Hz}
\label{eq:lowpass} \label{eq:lowpass}
\end{equation} \end{equation}
%
\section{Two mechanisms driving the emergence of intensity-invariant song representation} \section{Two mechanisms driving the emergence of intensity-invariant song representation}
\subsection{Logarithmic scaling \& spike-frequency adaptation} \subsection{Logarithmic scaling \& spike-frequency adaptation}
@ -186,38 +194,69 @@ $\rightarrow$ Lowpass filter 1 Hz
Envelope $\env(t)$ $\xrightarrow{\text{dB}}$ Logarithmic $\db(t)$ $\xrightarrow{\hp}$ Adapted $\adapt(t)$ Envelope $\env(t)$ $\xrightarrow{\text{dB}}$ Logarithmic $\db(t)$ $\xrightarrow{\hp}$ Adapted $\adapt(t)$
- Rewrite signal envelope $\env(t)$ (Eq.\,\ref{eq:env}) as a synthetic mixture:\\ - Rewrite signal envelope $\env(t)$ (Eq.\,\ref{eq:env}) as a synthetic mixture:\\
1) Song signal $s(t)$ ($\sigs=1$) with variable multiplicative scale $\alpha\geq0$\\ 1) Song signal $s(t)$ ($\svar=1$) with variable multiplicative scale $\alpha\geq0$\\
2) Fixed-scale additive noise $\eta(t)$ ($\sign=1$) 2) Fixed-scale additive noise $\eta(t)$ ($\nvar=1$)
%
\begin{equation} \begin{equation}
\env(t)\,=\,\alpha\,\cdot\,s(t)\,+\,\eta(t),\qquad \env(t)\,>\,0\enspace\forall\enspace t\,\in\,\mathbb{R} \env(t)\,=\,\alpha\,\cdot\,s(t)\,+\,\eta(t),\qquad \env(t)\,>\,0\enspace\forall\enspace t\,\in\,\mathbb{R}
\label{eq:toy_env} \label{eq:toy_env}
\end{equation} \end{equation}
%
- Signal-to-noise ratio (SNR): Ratio of variances of synthetic mixture
$\env(t)$ with ($\alpha>0$) and without ($\alpha=0$) song signal $s(t)$, assuming $s(t)\perp\eta(t)$
%
\begin{equation}
\text{SNR}\,=\,\frac{\sigma_{s+\eta}^{2}}{\nvar}\,=\,\frac{\alpha^{2}\,\cdot\,\svar\,+\,\nvar}{\nvar}\,=\,\alpha^{2}\,+\,1
\label{eq:toy_snr}
\end{equation}
%
\textbf{Logarithmic component:}\\ \textbf{Logarithmic component:}\\
- Apply decibel transformation (Eq.\,\ref{eq:log}) to synthetic $\env(t)$\\ - Simplify decibel transformation (Eq.\,\ref{eq:log}) and apply to synthetic $\env(t)$\\
- Isolate scale $\alpha$ and reference $\dbref$ using logarithm product/quotient laws - Isolate scale $\alpha$ and reference $\dbref$ using logarithm product/quotient laws
%
\begin{equation} \begin{equation}
\begin{split} \begin{split}
\db(t)\,&=\,10\,\cdot\,\dec \frac{\alpha\,\cdot\,s(t)\,+\,\eta(t)}{\dbref}\\ \db(t)\,&=\,\log \frac{\alpha\,\cdot\,s(t)\,+\,\eta(t)}{\dbref}\\
&=\,10\,\cdot\,\big(\dec \frac{\alpha}{\dbref}\,+\,\dec[s(t)\,+\,\frac{\eta(t)}{\alpha}]\big) &=\,\log \frac{\alpha}{\dbref}\,+\,\log \big[s(t)\,+\,\frac{\eta(t)}{\alpha}\big]
\end{split} \end{split}
\label{eq:toy_log} \label{eq:toy_log}
\end{equation} \end{equation}
%
$\rightarrow$ In log-space, a multiplicative scaling factor becomes additive\\ $\rightarrow$ In log-space, a multiplicative scaling factor becomes additive\\
$\rightarrow$ Allows for the separation of song signal $s(t)$ and its scale $\alpha$\\ $\rightarrow$ Allows for the separation of song signal $s(t)$ and its scale $\alpha$\\
$\rightarrow$ Introduces scaling of noise term $\eta(t)$ by the inverse of $\alpha$\\ $\rightarrow$ Introduces scaling of noise term $\eta(t)$ by the inverse of $\alpha$\\
$\rightarrow$ Normalization by $\dbref$ applies equally to all terms (no individual effects) $\rightarrow$ Normalization by $\dbref$ applies equally to all terms (no individual effects)
\textbf{Adaptation component:}\\ \textbf{Adaptation component:}\\
- Highpass filter over logarithmically scaled $\db(t)$ (Eq.\,\ref{eq:highpass}) can - Highpass filter over $\db(t)$ (Eq.\,\ref{eq:highpass}) can
be approximated as subtraction of the signal offset (DC removal) within a suitable be approximated as subtraction of the local signal offset within a suitable time
time interval $\thp$ ($0 < \thp < \frac{1}{\fc}$)\\ interval $\thp$ ($0 \ll \thp < \frac{1}{\fc}$)
%
\begin{equation} \begin{equation}
\begin{split} \begin{split}
\adapt(t)\,\approx\,\db(t)\,-\,\dec \frac{\alpha}{\dbref}\,=\,\dec{[s(t)\,+\,\frac{\eta(t)}{\alpha}]} \adapt(t)\,\approx\,\db(t)\,-\,\log \frac{\alpha}{\dbref}\,=\,\log \big[s(t)\,+\,\frac{\eta(t)}{\alpha}\big]
\end{split} \end{split}
\label{eq:toy_highpass} \label{eq:toy_highpass}
\end{equation} \end{equation}
%
\textbf{Implication for intensity invariance:}\\
- Logarithmic scaling is essential for equalizing different song intensities\\
$\rightarrow$ Intensity information can be manipulated more easily when in form
of a signal offset in log-space than a multiplicative scale in linear space
- Scale $\alpha$ can only be redistributed, not entirely eliminated from $\adapt(t)$\\
$\rightarrow$ Turn initial scaling of song $s(t)$ by $\alpha$ into scaling of noise $\eta(t)$ by $\frac{1}{\alpha}$
- Capability to compensate for intensity variations, i.e. selective amplification
of output $\adapt(t)$ relative to input $\env(t)$, is limited by input SNR (Eq.\,\ref{eq:toy_snr}):\\
$\alpha\gg1$: Attenuation of $\eta(t)$ term $\rightarrow$ $s(t)$ dominates $\adapt(t)$\\
$\alpha\approx1$ Negligible effect on $\eta(t)$ term $\rightarrow$ $\adapt(t)=\log[s(t)+\eta(t)]$\\
$\alpha\ll1$: Amplification of $\eta(t)$ term $\rightarrow$ $\eta(t)$ dominates $\adapt(t)$\\
$\rightarrow$ Ability to equalize between different sufficiently large scales of $s(t)$\\
$\rightarrow$ Inability to recover $s(t)$ when initially masked by noise floor $\eta(t)$
- Logarithmic scaling emphasizes small amplitudes (song onsets, noise floor) \\
$\rightarrow$ Recurring trade-off: Equalizing signal intensity vs preserving initial SNR
\subsection{Threshold nonlinearity \& temporal averaging} \subsection{Threshold nonlinearity \& temporal averaging}
@ -227,35 +266,42 @@ Convolved $c_i(t)$ $\xrightarrow{\nl}$ Binary $\bi(t)$ $\xrightarrow{\lp}$ Featu
- Within an observed time interval $T$, $c_i(t)$ follows probability density $\pc$\\ - Within an observed time interval $T$, $c_i(t)$ follows probability density $\pc$\\
- Within $T$, $c_i(t)$ exceeds threshold value $\thr$ for time $T_1$ ($T_1+T_0=T$)\\ - Within $T$, $c_i(t)$ exceeds threshold value $\thr$ for time $T_1$ ($T_1+T_0=T$)\\
- Threshold $\nl$ splits $\pc$ around $\thr$ in two complementary parts - Threshold $\nl$ splits $\pc$ around $\thr$ in two complementary parts
%
\begin{equation} \begin{equation}
\int_{\thr}^{+\infty} p(c_i,T)\,dc_i\,=\,1\,-\,\int_{-\infty}^{\thr} p(c_i,T)\,dc_i\,=\,\frac{T_1}{T} \int_{\thr}^{+\infty} p(c_i,T)\,dc_i\,=\,1\,-\,\int_{-\infty}^{\thr} p(c_i,T)\,dc_i\,=\,\frac{T_1}{T}
\label{eq:pdf_split} \label{eq:pdf_split}
\end{equation} \end{equation}
%
$\rightarrow$ Semi-definite integral over right-sided portion of split $\pc$ gives ratio $\rightarrow$ Semi-definite integral over right-sided portion of split $\pc$ gives ratio
of time $T_1$ where $c_i(t)>\thr$ to total time $T$ due to normalization of $\pc$ of time $T_1$ where $c_i(t)>\thr$ to total time $T$ due to normalization of $\pc$
%
\begin{equation} \begin{equation}
\infint \pc\,dc_i\,=\,1 \infint \pc\,dc_i\,=\,1
\label{eq:pdf} \label{eq:pdf}
\end{equation} \end{equation}
%
\textbf{Averaging component:}\\ \textbf{Averaging component:}\\
- Lowpass filter over binary response $\bi(t)$ (Eq.\,\ref{eq:lowpass}) can be - Lowpass filter over binary response $\bi(t)$ (Eq.\,\ref{eq:lowpass}) can be
approximated as temporal averaging over a suitable time interval $\tlp$ ($\tlp > \frac{1}{\fc}$)\\ approximated as temporal averaging over a suitable time interval $\tlp$ ($\tlp > \frac{1}{\fc}$)\\
- Within $\tlp$, $\bi(t)$ takes a value of 1 ($c_i(t)>\thr$) for time $T_1$ ($T_1+T_0=\tlp$) - Within $\tlp$, $\bi(t)$ takes a value of 1 ($c_i(t)>\thr$) for time $T_1$ ($T_1+T_0=\tlp$)
%
\begin{equation} \begin{equation}
\feat(t)\,\approx\,\frac{1}{\tlp} \int_{t}^{t\,+\,\tlp} \bi(\tau)\,d\tau\,=\,\frac{T_1}{\tlp} \feat(t)\,\approx\,\frac{1}{\tlp} \int_{t}^{t\,+\,\tlp} \bi(\tau)\,d\tau\,=\,\frac{T_1}{\tlp}
\label{eq:feat_avg} \label{eq:feat_avg}
\end{equation} \end{equation}
%
$\rightarrow$ Temporal averaging over $\bi(t)\in[0,1]$ (Eq.\ref{eq:binary}) gives $\rightarrow$ Temporal averaging over $\bi(t)\in[0,1]$ (Eq.\ref{eq:binary}) gives
ratio of time $T_1$ where $c_i(t)>\thr$ to total averaging interval $\tlp$\\ ratio of time $T_1$ where $c_i(t)>\thr$ to total averaging interval $\tlp$\\
$\rightarrow$ Feature $\feat(t)$ approximately represents supra-threshold fraction of $\tlp$ $\rightarrow$ Feature $\feat(t)$ approximately represents supra-threshold fraction of $\tlp$
\textbf{Combined result:}\\ \textbf{Combined result:}\\
- Feature $\feat(t)$ can be linked to the distribution of $c_i(t)$ using Eqs.\,\ref{eq:pdf_split} \& \ref{eq:feat_avg} - Feature $\feat(t)$ can be linked to the distribution of $c_i(t)$ using Eqs.\,\ref{eq:pdf_split} \& \ref{eq:feat_avg}
%
\begin{equation} \begin{equation}
\feat(t)\,\approx\,\int_{\thr}^{+\infty} \pclp\,dc_i\,=\,P(c_i\,>\,\thr,\,\tlp) \feat(t)\,\approx\,\int_{\thr}^{+\infty} \pclp\,dc_i\,=\,P(c_i\,>\,\thr,\,\tlp)
\label{eq:feat_prop} \label{eq:feat_prop}
\end{equation} \end{equation}
%
$\rightarrow$ Because the integral over a probability density is a cumulative $\rightarrow$ Because the integral over a probability density is a cumulative
probability, the value of feature $\feat(t)$ (temporal compression of $\bi(t)$) probability, the value of feature $\feat(t)$ (temporal compression of $\bi(t)$)
at every time point $t$ signifies the probability that convolution output at every time point $t$ signifies the probability that convolution output
@ -264,7 +310,20 @@ interval $\tlp$
\textbf{Implication for intensity invariance:}\\ \textbf{Implication for intensity invariance:}\\
- Convolution output $c_i(t)$ = amplitude-based quantity\\ - Convolution output $c_i(t)$ = amplitude-based quantity\\
$\rightarrow$ Values indicate how well template waveform $k_i(t)$ matches signal $x(t)$\\ $\rightarrow$ Values indicate correspondence between template waveform and signal\\
$\rightarrow$ Values indicate correspondence between a template waveform $k_i(t)$
matches
the waveform of the pre-processed signal $\adapt(t)$ at a given time point $t$
- Feature $\feat(t)$ = duty cycle-based quantity\\
$\rightarrow$ Values indicate the ratio of two temporal quantities\\
$\rightarrow$ Values indicate the ratio of time, or probability, that $c_i(t)$
exceeds threshold value $\thr$ within
- Feature $\feat(t)$ = duty cycle-based quantity\\ - Feature $\feat(t)$ = duty cycle-based quantity\\
$\rightarrow$ Values indicate how often $c_i(t)$ exceeds threshold value $\thr$ $\rightarrow$ Values indicate how often $c_i(t)$ exceeds threshold value $\thr$