-
Notifications
You must be signed in to change notification settings - Fork 18
/
Copy path07-03-05-ACA-Tonal-F0Eval.tex
141 lines (132 loc) · 5.93 KB
/
07-03-05-ACA-Tonal-F0Eval.tex
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
% move all configuration stuff into includes file so we can focus on the content
\input{include}
\subtitle{module 7.3.5: fundamental frequency detection~---~evaluation}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{document}
% generate title page
\input{include/titlepage}
\section[overview]{lecture overview}
\begin{frame}{introduction}{overview}
\begin{block}{corresponding textbook section}
%\href{http://ieeexplore.ieee.org/xpl/articleDetails.jsp?tp=&arnumber=6331119&}{Chapter 2~---~Fundamentals}: pp.~14--18\\
%\href{http://ieeexplore.ieee.org/xpl/articleDetails.jsp?arnumber=6331114}{Appendix A~---~Convolution Properties}: pp.~181--183
section~7.3.5
\end{block}
\begin{itemize}
\item \textbf{lecture content}
\begin{itemize}
\item evaluation of pitch tracking systems
\item challenges in annotation
\item metrics
\end{itemize}
\bigskip
\item<2-> \textbf{learning objectives}
\begin{itemize}
\item successfully plan a systematic evaluation procedure for a pitch detection system
\end{itemize}
\end{itemize}
\inserticon{directions}
\end{frame}
\section[intro]{intro}
\begin{frame}{pitch evaluation}{tasks}
goal: compare predicted pitch and ground truth pitch
\pause
\bigskip
\begin{itemize}
\item differentiate various `pitch tracking' tasks
\begin{itemize}
\item pitch of \textbf{individual notes}
\item pitch of \textbf{monophonic melody}
\item pitch of \textbf{predominant melody} in polyphonic mixture
\item pitches in multi-timbral \textbf{polyphonic mixture}
\end{itemize}
\end{itemize}
\end{frame}
\begin{frame}{pitch evaluation}{annotation challenges}
\begin{itemize}
\item pitch discretization
\begin{itemize}
\item (MIDI/score) pitch of individual notes
\item F0
\end{itemize}
\item time discretization
\begin{itemize}
\item start and stop time of note
\item equidistant time stamps
\end{itemize}
\end{itemize}
\bigskip
\question{how to annotate F0}
\end{frame}
\section{metrics}
\begin{frame}{pitch evaluation}{metrics --- score ground truth}
\vspace{-2mm}
\begin{itemize}
\item all metrics should be computed in the pitch domain, not the frequency domain
\item metrics measure a \textbf{match} between ground truth and predicted pitch ($\Rightarrow$ tolerance)
\bigskip
\item<2-> \textbf{Raw Pitch Accuracy}:
\begin{footnotesize}
\begin{equation*}
RPA = \frac{\sum\limits_{\forall n}TP_n}{\mathcal{N}}
\end{equation*}
\[ TP_n = \left\{
\begin{array}{ll}
0, & \text{if } |\mathfrak{p}_\mathrm{GT}(n) - \hat{\mathfrak{p}}(n)| \geq 0.5 \\
1, & \text{otherwise }
\end{array}
\right. \]
\end{footnotesize}
\smallskip
\item<2-> \textbf{Raw Chroma Accuracy}:
\begin{footnotesize}
\begin{equation*}
RCA = \frac{\sum\limits_{\forall n}TP_{\mathrm{chroma},n}}{\mathcal{N}}
\end{equation*}
\[ TP_{\mathrm{chroma},n} = \left\{
\begin{array}{ll}
0, & \text{if } \operatorname{mod}\big(|\mathfrak{p}_\mathrm{GT}(n) - \hat{\mathfrak{p}}(n)|, 12\big) \geq 0.5 \\
1, & \text{otherwise }
\end{array}
\right. \]
\end{footnotesize}
\end{itemize}
\end{frame}
\begin{frame}{pitch evaluation}{metrics --- F0 ground truth}
\begin{itemize}
\item all metrics should be computed in the pitch domain, not the frequency domain
\item metrics measure \textbf{deviation} between ground truth and predicted pitch
\bigskip
\item<2-> MSE, MAE, standard deviation from the ground truth
\end{itemize}
\end{frame}
\begin{frame}{pitch evaluation}{result aggregation}
\begin{itemize}
\item aggregate per datapoint (frame/note)
\item aggregate per file
\end{itemize}
\end{frame}
\section{summary}
\begin{frame}{summary}{lecture content}
\begin{itemize}
\item \textbf{potential data problems}
\begin{itemize}
\item pitch and time quantization
\item reliability of ground truth
\item time resolution mismatch of ground truth and system
\end{itemize}
\bigskip
\item \textbf{metrics}
\begin{itemize}
\item score pitch match (chroma match)
\item measures of deviation
\end{itemize}
\bigskip
\item \textbf{factor impacting metrics}
\begin{itemize}
\item voicing detection
\end{itemize}
\end{itemize}
\inserticon{summary}
\end{frame}
\end{document}