first draft? added output sounds, referencing

2020-11-08 16:31:44 +00:00 · 2020-11-08 16:31:44 +00:00 · b2d3bccb29
commit b2d3bccb29
parent 4910c2c20d
26 changed files with 259 additions and 121 deletions
--- a/.gitignore
+++ b/.gitignore
@ -1,4 +1,4 @@
-*~
+*~*
 *#
 *.pdf
 samples
--- a/lpss.m
+++ b/lpss.m
@ -4,10 +4,13 @@

 close all;clear all;clc;

+NAME = 'hood_m';
+% NAME = 'head_f';
+
 SEGMENT_LENGTH = 100; % ms
 SEGMENT_OFFSET = 20; % ms from start

-LPC_ORDER = 25;
+LPC_ORDER = 30;
 AC_DISP_SAMPLES = 1000; % autocorrelation display samples
 WINDOW_NUMBER = 10; % number of windows for spectrogram
 WINDOW_OVERLAP = 10; % ms
@ -36,15 +39,15 @@ ORIG_LPC_T_COMPARE = false;
 ORIG_SPECTROGRAM = true;
 SYNTH_SPECTROGRAM = true;

-SYNTHESISED_SOUND_LENGTH = 1000; % ms
+SYNTHESISED_SOUND_LENGTH = 100; % ms

-WRITE = false;
-PLAY = false;
+WRITE = ~true;
+PLAY = ~false;

 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
 %% READ SIGNAL
 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
-[y, Fs] = audioread('samples/head_f.wav');
+[y, Fs] = audioread(strcat('samples/', NAME, '.wav'));
 % take segment of sample for processing
 y = clip_segment(y, Fs, SEGMENT_LENGTH, SEGMENT_OFFSET);
 y_orig = y;
@ -75,7 +78,7 @@ AC_DISP_SAMPLES = min([AC_DISP_SAMPLES L]);
 figure(1)
 plot(x, y(end-AC_DISP_SAMPLES+1:end), x, est_y(end-AC_DISP_SAMPLES+1:end), '--')

-grid
+gridh
 xlabel('Sample Number')
 ylabel('Amplitude')
 legend('Original signal','LPC estimate')
@ -171,9 +174,9 @@ plot(ceps_t(1:round(L / 2)), c(1:round(L / 2)))
 %% MAXIMA 
 % value threshold
 c(c < CEPSTRUM_THRESHOLD) = 0;
-cep_maxima_indexes = islocalmax(c);

-cep_maxima_times = ceps_t(1:round(L / 2));
+% local maxima
+cep_maxima_indexes = islocalmax(c);
 cep_maxima_times = ceps_t(cep_maxima_indexes);
 c = c(cep_maxima_indexes);

@ -218,7 +221,7 @@ if exist('fundamental_freq')
    synth_sound = filter(1, a, excitation);
    
    if WRITE
-    audiowrite('out.wav', synth_sound, Fs);
+    audiowrite(strcat('synthed/', NAME, '_o', num2str(LPC_ORDER), '_', num2str(SEGMENT_LENGTH), '_', num2str(SEGMENT_OFFSET), 'ms.wav'), synth_sound, Fs);
    end
 end

--- a/report/references.bib
+++ b/report/references.bib
@ -10,3 +10,64 @@
 	year = {2015}
 }

+@misc{etsi-gsm,
+	author = {ETSI},
+	month = may,
+	organization = {European Telecommunications Standards Institute},
+	title = {Digital cellular telecommunications system (Phase 2+); Full rate speech; Transcoding; ETS 300 961},
+	url = {https://www.etsi.org/deliver/etsi_i_ets/300900_300999/300961/02_60/ets_300961e02p.pdf},
+	year = {1998}
+}
+
+@online{all-pole-resonance,
+	author = {Kim, Hyung-Suk},
+	organization = {Center for Computer Research in Music and Acoustics, Stanford University},
+	title = {Linear Predictive Coding is All-Pole Resonance Modeling},
+	url = {https://ccrma.stanford.edu/~hskim08/lpc},
+	year = {2014}
+}
+
+@article{quefrency,
+	author = {Oppenheim, A.V. and Schafer, Ronald},
+	doi = {10.1109/MSP.2004.1328092},
+	journal = {Signal Processing Magazine, IEEE},
+	month = {10},
+	pages = {95--106},
+	title = {From Frequency to Quefrency: A History of the Cepstrum},
+	url = {https://www.researchgate.net/publication/3321562_From_Frequency_to_Quefrency_A_History_of_the_Cepstrum},
+	volume = {21},
+	year = {2004}
+}
+
+@online{source-filter-macquaire,
+	author = {Mannell, Robert},
+	month = mar,
+	organization = {Department of Linguistics, Macquarie University},
+	title = {Source-Filter Theory of Speech Production},
+	url = {https://www.mq.edu.au/about/about-the-university/faculties-and-departments/medicine-and-health-sciences/departments-and-centres/department-of-linguistics/our-research/phonetics-and-phonology/speech/acoustics/acoustic-theory-of-speech-production/source-filter-theory},
+	year = {2020}
+}
+
+@online{max-min,
+	author = {{Whitman College}},
+	title = {Maxima and Minima},
+	url = {https://www.whitman.edu/mathematics/calculus_online/section05.01.html}
+}
+
+@online{islocalmax,
+	author = {{MathWorks}},
+	organization = {MathWorks},
+	subtitle = {Find local maxima},
+	title = {islocalmax},
+	url = {https://www.mathworks.com/help/matlab/ref/islocalmax.html}
+}
+
+@online{aalto-fundamental-freq,
+	author = {B{\"a}ckstr{\"o}m, Tom},
+	month = aug,
+	organization = {Aalto University},
+	title = {Fundamental frequency (F0)},
+	url = {https://wiki.aalto.fi/pages/viewpage.action?pageId=149890776},
+	year = {2020}
+}
+
--- a/report/report.lyx
+++ b/report/report.lyx
@ -181,7 +181,15 @@ University of Surrey
 \end_layout

 \begin_layout Abstract
-Abstract
+A system implementing the source-filter model of speech is presented and
+ evaluated using vowel segments as subjects.
+ Linear predictive coding is used to estimate the formant frequencies of
+ the samples while the cepstrum is used to identify the fundamental frequency.
+ Comparisons of the LPC filter spectrum with the original audio spectrum
+ are provided.
+ A periodic impulse train of the same pitch period is used to synthesise
+ vowel samples, a subjective analysis of the segment quality is given.
+ Evaluations of various parameter variations are also presented.
 \end_layout

 \begin_layout Standard
@ -272,12 +280,19 @@ Introduction
 \end_layout

 \begin_layout Standard
-The ability to process and analyse speech signals has facilitated developments
- throughout their use in the digital space with applications from data compressi
-on to speech recognition.
+Speech analysis and processing is an ever-expanding space with applications
+ from data compression to speech recognition.
+ The latter is a particularly relevant and popular area, presenting an important
+ domain for AI and machine learning applications.
 \end_layout

-\begin_layout Section
+\begin_layout Standard
+Prior to these, however, the ability to analyse, transform and identify
+ key parameters for a speech signal are important tools that will be explored
+ herein.
+\end_layout
+
+\begin_layout Subsection
 Brief
 \end_layout

@ -289,14 +304,37 @@ s can be used to analyse, model and synthesise speech.
 \end_layout

 \begin_layout Standard
-The modelling stage will utilise Linear Predictive Coding and the source-filter
- model of speech to construct an all-pole filter that acts similarly to
- the vocal tract's effect on sound produced by the vocal chords.
+The modelling stage will utilise Linear Predictive Coding
+\begin_inset CommandInset citation
+LatexCommand cite
+key "all-pole-resonance"
+literal "false"
+
+\end_inset
+
+ and the source-filter model of speech
+\begin_inset CommandInset citation
+LatexCommand cite
+key "source-filter-macquaire"
+literal "false"
+
+\end_inset
+
+ to construct an all-pole filter that acts similarly to the vocal tract's
+ effect on sound produced by the vocal chords.
 Comparisons of the frequency response for both the estimated filter and
 the original sound will be presented, the effect of different filter orders
 will also be demonstrated.
 Relevant parameters of the original vowel speech segment will be presented
- including the fundamental frequency and formant frequencies.
+ including the fundamental frequency
+\begin_inset CommandInset citation
+LatexCommand cite
+key "aalto-fundamental-freq"
+literal "false"
+
+\end_inset
+
+ and formant frequencies.
 \end_layout

 \begin_layout Standard
@ -321,12 +359,7 @@ Matlab
 others.
 Following loading a vowel sample, a segment of given length (100ms was
 typical) was clipped for processing.
- The clip optionally also underwent pre-emphasis using a high pass filter.
- As speech spectra can tend to have higher energy at lower frequencies,
- the use of pre-emphasis can balance the magnitude across the spectrum.
- A first order filter was used and the coefficient varied, over-use could
- prove excessive for higher frequencies including fricative sounds.
- The majority of the investigations were conducted on two samples, 
+ The investigations were conducted on two samples, 
 \begin_inset listings
 lstparams "language=Matlab,basicstyle={\ttfamily},tabsize=4"
 inline true
@ -403,12 +436,27 @@ freqz(b, a, n, f)
 of the signal and the vowel formant frequencies can be found at the maxima
 of the spectrum.
 The smooth profile of the LPC spectrum allowed the formant frequencies
- to be estimated by identifying the local maxima of the function.
+ to be estimated by identifying the local maxima
+\begin_inset CommandInset citation
+LatexCommand cite
+key "max-min,islocalmax"
+literal "false"
+
+\end_inset
+
+ of the function.
 \end_layout

 \begin_layout Standard
-In order to find the fundamental frequency of the signal, the cepstrum was
- used.
+In order to find the fundamental frequency of the signal, the cepstrum
+\begin_inset CommandInset citation
+LatexCommand cite
+key "quefrency"
+literal "false"
+
+\end_inset
+
+ was used.
 Regular periodic frequencies in the time domain present as a peak in the
 quefrency domain, this can also be achieved with an auto-corelation function.
 The use of a low-pass filter was investigated in order to smooth the cepstrum
@ -434,7 +482,15 @@ islocalmax(x)

 \end_inset

- function.
+ function
+\begin_inset CommandInset citation
+LatexCommand cite
+key "islocalmax"
+literal "false"
+
+\end_inset
+
+.
 A minimum quefrency threshold of 20 was applied to ignore the transient-like
 oscillations at small 
 \begin_inset Formula $x$
@ -446,7 +502,7 @@ islocalmax(x)
 sampled at 24kHz, a frequency higher than that of the fundamental frequency
 being investigated.
 Additionally a minimum cepstrum threshold of 0.075 was used, from here the
- maximum value was used as the pitch period.
+ quefrency candidate with the highest value was used as the pitch period.
 \end_layout

 \begin_layout Subsection
@ -472,7 +528,15 @@ noprefix "false"
 .
 In order to produce the final synthesised speech, the generated impulse
 train must be convolved (in the time domain) with the transfer function
- of the LPC filter representing the vocal tract.
+ of the LPC filter representing the vocal tract
+\begin_inset CommandInset citation
+LatexCommand cite
+key "source-filter-macquaire"
+literal "false"
+
+\end_inset
+
+.
 In 
 \noun on
 Matlab
@ -1572,7 +1636,7 @@ noprefix "false"

 \end_inset

-, where the order of the 
+, the order of the 
 \begin_inset listings
 lstparams "basicstyle={\ttfamily}"
 inline true
@ -1648,6 +1712,19 @@ name "fig:Spectrum-Tile"
 \end_inset


+\end_layout
+
+\begin_layout Standard
+\begin_inset Flex TODO Note (inline)
+status open
+
+\begin_layout Plain Layout
+segment length variation?
+\end_layout
+
+\end_inset
+
+
 \end_layout

 \begin_layout Subsection
@ -1659,9 +1736,8 @@ Formant Frequencies
 \end_layout

 \begin_layout Standard
-As described previously, the smooth profile of the LPC filter spectra makes
- the use of the local maxima of this curve reasonable estimations as to
- the peaks.
+As described previously, the smooth profile of the LPC filter spectra allows
+ the local maxima to be used as reasonable estimations of the peaks.
 The first three formants for the order 25 filters seen in figure 
 \begin_inset CommandInset ref
 LatexCommand ref
@ -1892,7 +1968,7 @@ hood_m
 \begin_inset Text

 \begin_layout Plain Layout
-1,209
+1,209.0
 \end_layout

 \end_inset
@ -2376,7 +2452,7 @@ noprefix "false"

 \end_inset

-.
+, [1 -0.7] were used as coefficients.
 When employing smoothing, the peak corresponding to the pitch period has
 been amplified compared to the unsmoothed curve where the pitch period
 does not reach far beyond the noise of the rest of the function.
@ -2428,7 +2504,8 @@ head_f

 \end_inset

- with and without low-pass filtering, thresholded local maxima crossed
+ with and without low-pass filtering, thresholded local maxima crossed,
+ smoothing coefficients: [1 -0.7]
 \begin_inset CommandInset label
 LatexCommand label
 name "fig:smoothed-cepstrum"
@ -2711,70 +2788,6 @@ name "tab:fund-freq"
 \end_inset


-\end_layout
-
-\begin_layout Subsubsection
-Pre-emphasis
-\end_layout
-
-\begin_layout Standard
-\begin_inset Float figure
-wide false
-sideways false
-status open
-
-\begin_layout Plain Layout
-\noindent
-\align center
-\begin_inset Graphics
-	filename ../resources/hood_m_spect_25_premph_0.9.png
-	lyxscale 20
-	width 80col%
-
-\end_inset
-
-
-\end_layout
-
-\begin_layout Plain Layout
-\begin_inset Caption Standard
-
-\begin_layout Plain Layout
-LPC spectra for 
-\begin_inset listings
-lstparams "basicstyle={\ttfamily}"
-inline true
-status open
-
-\begin_layout Plain Layout
-
-hood_m
-\end_layout
-
-\end_inset
-
- following pre-emphasis using coefficients, [1 -0.9]
-\begin_inset CommandInset label
-LatexCommand label
-name "fig:pre-emph-spectrum"
-
-\end_inset
-
-
-\end_layout
-
-\end_inset
-
-
-\end_layout
-
-\begin_layout Plain Layout
-
-\end_layout
-
-\end_inset
-
-
 \end_layout

 \begin_layout Subsection
@ -2796,8 +2809,8 @@ noprefix "false"
 .
 The circled areas highlight similar portions, the formant frequencies can
 be seen in both.
- Despite being quasi-stationary, variation can be seen in time for the original
- signal.
+ Despite being quasi-stationary, some variation in time can be seen for
+ the original signal.
 The stationary synthesised signal, however, has a flat profile in time.
 \end_layout

@ -2850,27 +2863,88 @@ name "fig:Spectrograms-synth"

 \end_layout

+\begin_layout Standard
+At lower filter orders (< 10), the synthesised speech has a 
+\emph on
+buzzy
+\emph default
+ quality resembling a sawtooth wave of the same pitch as the original voice
+ sample.
+ At these orders, the synthesised sound can not accurately be discerned
+ as being speech.
+ As the filter order increases, the tone of the sound becomes less harsh
+ and by around order 20 the sample could be identified as being of a voice.
+ By order 40, much of the harsh tone has been smoothed and the sample subjective
+ly sounds as close to human speech as could be achieved.
+ Beyond this order, although the sound does change and smooth, it does not
+ appear to further approach the quality of the original sound.
+\end_layout
+
 \begin_layout Section
 Discussion
 \end_layout

 \begin_layout Standard
-\begin_inset Flex TODO Note (inline)
-status open
-
-\begin_layout Plain Layout
-do numbers on compression
+As presented, the order of the LPC filter is a critical parameter for audio
+ quality.
+ An order that is too low will not allow the filter to accurately map to
+ the desired vowel spectrum leaving a sound that, although at the right
+ pitch, does not appreciably sound like the source segment.
+ At the other end, increasing the order beyond a certain complexity can
+ result in diminishing returns.
+ Although the sound sounded smoother, beyond around order 40 it did not
+ noticeably further approach the original sound.
+ Subjectively, an order of 30 provided a good approximation of the input
+ sound with acceptable quality for low bandwidth transmission.
 \end_layout

+\begin_layout Standard
+The use of low-pass filtering on the cepstrum when identifying the fundamental
+ frequency was effective in accentuating the peak corresponding to the pitch
+ period.
+ With this, a higher 
+\begin_inset Formula $y$
+\end_inset
+
+ threshold could be used that would be further from the noise of the function
+ while still consistently identifying the correct peak.
+\end_layout
+
+\begin_layout Standard
+A 100ms vowel segment sampled at 24kHz totals to 2,400 samples.
+ Assuming that each is represented by a float of 4 bytes, this uncompressed
+ vowel segment would fill 9600 bytes of storage.
+ Encoding the same 100ms of information via LPC using an order 30 filter
+ could reduce this to 120 bytes, just 1% of the previous space.
+ This is particularly important for audio transmission such as in mobile
+ telecoms, the GSM standard uses codecs based on LPC
+\begin_inset CommandInset citation
+LatexCommand cite
+key "etsi-gsm"
+literal "false"
+
 \end_inset

-
+.
 \end_layout

 \begin_layout Section
 Conclusion
 \end_layout

+\begin_layout Standard
+Within this work, a complete source-filter model of speech has been presented,
+ analysing vowel samples and re-synthesising them while compressing the
+ data representation.
+ The effect of changing the complexity of this representation was investigated
+ by varying the order of the LPC filter and describing the effect on the
+ final audio sample.
+ Various statistics about the original samples were calculated including
+ the formant frequencies and the fundamental frequency.
+ With a sufficient filter order, sound samples comparable to the originals
+ were generated.
+\end_layout
+
 \begin_layout Standard
 \begin_inset Newpage newpage
 \end_inset
@ -2895,6 +2969,10 @@ options "bibtotoc"
 \end_inset


+\begin_inset Newpage pagebreak
+\end_inset
+
+
 \end_layout

 \begin_layout Section
@ -2936,22 +3014,18 @@ Additional helper functions were written to plot and manipulate data.
 \begin_inset CommandInset include
 LatexCommand lstinputlisting
 filename "../lpss.m"
-lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, mfcc, spectro, fft_, autocorr, clip_segment, islocalmax, ms_to_samples, rceps, cceps, ones, audioplayer, play, get_impulse_train, lpc},caption={Main script including source-filter model and spectral analysis},label={main_script}"
+lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, mfcc, spectro, fft_, autocorr, clip_segment, islocalmax, ms_to_samples, rceps, cceps, ones, audioplayer, play, get_impulse_train, lpc, strcat, num2str, xlim},caption={Main script including source-filter model and spectral analysis},label={main_script}"

 \end_inset


-\begin_inset Newpage pagebreak
-\end_inset
-
-
 \end_layout

 \begin_layout Standard
 \begin_inset CommandInset include
 LatexCommand lstinputlisting
 filename "../func/spectro.m"
-lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, ms_to_samples},caption={Spectrogram plotting wrapper function},label={spectrogram_function}"
+lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, ms_to_samples, xlim},caption={Spectrogram plotting wrapper function},label={spectrogram_function}"

 \end_inset

@ -2962,7 +3036,7 @@ lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},comm
 \begin_inset CommandInset include
 LatexCommand lstinputlisting
 filename "../func/fft_.m"
-lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram},caption={Fast Fourier transform wrapper function},label={fft_function}"
+lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, xlim},caption={Fast Fourier transform wrapper function},label={fft_function}"

 \end_inset

@ -2973,7 +3047,7 @@ lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},comm
 \begin_inset CommandInset include
 LatexCommand lstinputlisting
 filename "../func/autocorr.m"
-lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram},caption={Autocorrelation plotting wrapper function},label={autocorr_function}"
+lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, xlim},caption={Autocorrelation plotting wrapper function},label={autocorr_function}"

 \end_inset

@ -2984,7 +3058,7 @@ lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},comm
 \begin_inset CommandInset include
 LatexCommand lstinputlisting
 filename "../func/clip_segment.m"
-lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, ms_to_samples},caption={Retrieve a segment of the original speech signal},label={clip_segment_function}"
+lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, ms_to_samples, xlim},caption={Retrieve a segment of the original speech signal},label={clip_segment_function}"

 \end_inset

@ -2995,7 +3069,7 @@ lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},comm
 \begin_inset CommandInset include
 LatexCommand lstinputlisting
 filename "../func/ms_to_samples.m"
-lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram},caption={Transform time in milliseconds into the respective number of samples},label={ms_to_samples_function}"
+lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, xlim},caption={Transform time in milliseconds into the respective number of samples},label={ms_to_samples_function}"

 \end_inset

@ -3006,7 +3080,7 @@ lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},comm
 \begin_inset CommandInset include
 LatexCommand lstinputlisting
 filename "../func/get_impulse_train.m"
-lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, ms_to_samples, repmat},caption={Generate an impulse rate of given fundamental frequency at a provided sampling frequency for a given length of time},label={get_impulse_train_function}"
+lstparams "breaklines=true,frame=tb,language=Matlab,basicstyle={\\ttfamily},commentstyle={\\color{commentgreen}\\itshape},keywordstyle={\\color{blue}},emphstyle={\\color{red}},stringstyle={\\color{red}},identifierstyle={\\color{cyan}},morekeywords={audioread, aryule, xcorr, freqz, spectrogram, ms_to_samples, repmat, xlim},caption={Generate an impulse rate of given fundamental frequency at a provided sampling frequency for a given length of time},label={get_impulse_train_function}"

 \end_inset

--- a/synthed/head_f_o10_100_20ms.wav
+++ b/synthed/head_f_o10_100_20ms.wav
--- a/synthed/head_f_o15_100_20ms.wav
+++ b/synthed/head_f_o15_100_20ms.wav
--- a/synthed/head_f_o20_100_20ms.wav
+++ b/synthed/head_f_o20_100_20ms.wav
--- a/synthed/head_f_o25_100_20ms.wav
+++ b/synthed/head_f_o25_100_20ms.wav
--- a/synthed/head_f_o30_100_20ms.wav
+++ b/synthed/head_f_o30_100_20ms.wav
--- a/synthed/head_f_o40_100_20ms.wav
+++ b/synthed/head_f_o40_100_20ms.wav
--- a/synthed/head_f_o50_100_20ms.wav
+++ b/synthed/head_f_o50_100_20ms.wav
--- a/synthed/head_f_o5_100_20ms.wav
+++ b/synthed/head_f_o5_100_20ms.wav
--- a/synthed/head_f_o60_100_20ms.wav
+++ b/synthed/head_f_o60_100_20ms.wav
--- a/synthed/head_f_o70_100_20ms.wav
+++ b/synthed/head_f_o70_100_20ms.wav
--- a/synthed/head_f_o80_100_20ms.wav
+++ b/synthed/head_f_o80_100_20ms.wav
--- a/synthed/hood_m_o10_100_20ms.wav
+++ b/synthed/hood_m_o10_100_20ms.wav
--- a/synthed/hood_m_o15_100_20ms.wav
+++ b/synthed/hood_m_o15_100_20ms.wav
--- a/synthed/hood_m_o20_100_20ms.wav
+++ b/synthed/hood_m_o20_100_20ms.wav
--- a/synthed/hood_m_o25_100_20ms.wav
+++ b/synthed/hood_m_o25_100_20ms.wav
--- a/synthed/hood_m_o30_100_20ms.wav
+++ b/synthed/hood_m_o30_100_20ms.wav
--- a/synthed/hood_m_o40_100_20ms.wav
+++ b/synthed/hood_m_o40_100_20ms.wav
--- a/synthed/hood_m_o50_100_20ms.wav
+++ b/synthed/hood_m_o50_100_20ms.wav
--- a/synthed/hood_m_o5_100_20ms.wav
+++ b/synthed/hood_m_o5_100_20ms.wav
--- a/synthed/hood_m_o60_100_20ms.wav
+++ b/synthed/hood_m_o60_100_20ms.wav
--- a/synthed/hood_m_o70_100_20ms.wav
+++ b/synthed/hood_m_o70_100_20ms.wav
--- a/synthed/hood_m_o80_100_20ms.wav
+++ b/synthed/hood_m_o80_100_20ms.wav