started writing up some stuff
[asr1617.git] / experiment.tex
index 328c089..0e61c21 100644 (file)
@@ -14,8 +14,8 @@ during growling the regions around $100$Hz have an increased intensity.
 \begin{itemize}
        \item Sox~\footnote{\url{https://sox.sourceforge.net}} is used to convert
                 the stereo CD audio to mono $44.1$\,kHz waveforms
-       \item Using the \texttt{python\_speech\_features}~%
-               \footnote{\url{https://github.com/jameslyons/python_speech_features}}
+       \item Using the \texttt{python\_speech\_features}\footnote{\url{%
+                       https://github.com/jameslyons/python_speech_features}}
                 the waveforms are converted to $13$ MFCCs with the default
                 $25$\,ms window every $10$\,ms.
        \item The data is matched with the annotated files using
@@ -32,7 +32,7 @@ because the predictions are very noisy. This is probably due to pauses in
 growling. This can easily be smoothed out by not allowing extremely short
 growling segments.
 
-\begin{figure}[h]
+\begin{figure}[ht]
        \centering
        \includegraphics[width=.7\linewidth]{cement}
        \caption{A vocal segment of the \emph{Cannibal Corpse} song