123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696 |
- /* manual_LPC.cpp
- *
- * Copyright (C) 1994-2016 David Weenink
- *
- * This code is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or (at
- * your option) any later version.
- *
- * This code is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this work. If not, see <http://www.gnu.org/licenses/>.
- */
- /*
- djmw 20020422 GPL + removed "C syntax" part of manpage
- djmw 20101009 Latest modification
- */
- #include "ManPagesM.h"
- #include "MFCC.h"
- void manual_LPC (ManPages me);
- void manual_LPC (ManPages me)
- {
- MAN_BEGIN (U"CC: Paint...", U"djmw", 20040407)
- INTRO (U"A command to paint the cepstral coefficients in shades of grey.")
- ENTRY (U"Settings")
- TAG (U"##From coefficient#, ##To coefficient#")
- DEFINITION (U"the range of coefficients that will be represented.")
- MAN_END
- MAN_BEGIN (U"CC: To DTW...", U"djmw", 19960918)
- INTRO (U"You can choose this command after selecting 2 objects with cepstral "
- "coefficients (two @MFCC's or @LFCC's). "
- "With this command you perform dynamic time warping. ")
- ENTRY (U"Algorithm")
- NORMAL (U"First we calculate distances between cepstral coefficients: ")
- LIST_ITEM (U"The distance between frame %i (from me) and %j (from thee) is:")
- LIST_ITEM (U" %wc \\.c %d1 + %wle \\.c %d2 + %wr \\.c %d3,")
- LIST_ITEM (U" where %wc, %wle & %wr are user-supplied weights and")
- LIST_ITEM (U" %d1 = \\su (%k=1..%nCoefficients; (%c__%ik_ - %c__%jk_)^2)")
- LIST_ITEM (U" %d2 = (c__%i0_ - c__%j0_)^2")
- LIST_ITEM (U" %d3 = \\su (%k=1..%nCoefficients; (%r__%ik_ - %r__%jk_)^2), with ")
- LIST_ITEM (U" %r__%ik_ the regression coefficient of the cepstral coefficients "
- "from the frames within a time span of %dtr seconds. "
- "c__%ij_ is %j-th cepstral coefficient in frame %i. ")
- NORMAL (U"Next we find the optimum path through the distance matrix with a "
- "Viterbi-algorithm.")
- MAN_END
- MAN_BEGIN (U"CC: To Matrix", U"djmw", 20011123)
- INTRO (U"Copies the cepstral coefficients of the selected @CC "
- "object to a newly created @Matrix object.")
- ENTRY (U"Behaviour")
- FORMULA (U"%z__%ji_ = %c__%ij_, with 1 \\<_ %i \\<_ %nx and "
- "1 \\<_ j \\<_ %numberOfCoefficients__%i_,")
- NORMAL (U"where %z__%ji_ is the matrix element in row %j and column %i and "
- "%c__%ij_ is the %j-th cepstral coefficient in frame %i.")
- MAN_END
- MAN_BEGIN (U"Formants: Extract smoothest part...", U"djmw", 20140313)
- INTRO (U"Extracts the part from one of the selected formants which shows the smoothest formant tracks in a given interval.")
- ENTRY (U"Settings")
- SCRIPT (5, Manual_SETTINGS_WINDOW_HEIGHT (5), U""
- Manual_DRAW_SETTINGS_WINDOW (U"Formants: Extract smoothest part", 5)
- Manual_DRAW_SETTINGS_WINDOW_RANGE (U"Time range (s)", U"0.0", U"0.0")
- Manual_DRAW_SETTINGS_WINDOW_RANGE (U"Fitter formant range", U"1", U"3")
- Manual_DRAW_SETTINGS_WINDOW_FIELD (U"Order of polynomials", U"3")
- Manual_DRAW_SETTINGS_WINDOW_BOOLEAN (U"Use bandwidths to model formant tracks", 1)
- Manual_DRAW_SETTINGS_WINDOW_BOOLEAN (U"Bandwidths for smoothing test", 0)
- )
- TAG (U"##Time range (s)#")
- DEFINITION (U"determines the position of the intervals that have to be compared.")
- TAG (U"##Fitter formant range")
- DEFINITION (U"determines which formant tracks will be modelled with a polynomial function. The goodness of fit of these models will be used in the comparison.")
- TAG (U"##Order of polynomials")
- DEFINITION (U"determines the maximum order of the polynomials that are used in modeling each formant track. Order 0 means a model which is a constant function; this model needs only one parameter. Order 1 means a model that is a straight line function; this order needs two parameters. Order 2 means that an additional parabolic function is used in the modeling; order 2 needs therefore 3 parameters. In general an order %p model needs %p+1 parameters.")
- TAG (U"##Use bandwidths to model formant tracks")
- DEFINITION (U"Bandwidths give an indication about the sharpness of a spectral peak. Sharp peaks have small bandwidths and, vice versa, broad peaks have large bandwidths. The width of a peak can also be interpreted as a measure of certainty for its formant frequency value. Setting this option %%on%, the default setting, means that you force the modeling function to be closer to frequencies that are well defined, i.e. that have sharp peaks, than to the frequencies of broad peaks, if choices have to be made. The consequence is that in the model sharp peaks will be better represented than broad peaks.")
- TAG (U"##Bandwidths for smoothing test")
- DEFINITION (U"determines whether for the smoothnes determination the formant frequencies are still needed. Not using them anymore probably gives a better indication of the smoothness of a track.")
- MAN_END
- MAN_BEGIN (U"PowerCepstrogram", U"djmw", 20130616)
- INTRO (U"One of the @@types of objects@ in P\\s{RAAT}.")
- ENTRY (U"Description")
- NORMAL (U"The PowerCepstrogram shows @@PowerCepstrum|cepstral slices@ as a function of time.")
- MAN_END
- MAN_BEGIN (U"PowerCepstrogram: To Table (peak prominence)...", U"djmw", 20130616)
- INTRO (U"A command to create a table with @@PowerCepstrum: Get peak prominence...|cepstral peak prominence@ values.")
- ENTRY (U"Settings")
- SCRIPT (5, Manual_SETTINGS_WINDOW_HEIGHT (7), U""
- Manual_DRAW_SETTINGS_WINDOW ("PowerCepstrogram: To Table (peak prominence)", 7)
- Manual_DRAW_SETTINGS_WINDOW_RANGE("Peak search pitch range (Hz)", U"60.0", U"300.0")
- Manual_DRAW_SETTINGS_WINDOW_RADIO (U"Interpolation", U"None", 0)
- Manual_DRAW_SETTINGS_WINDOW_RADIO (U"", U"Parabolic", 0)
- Manual_DRAW_SETTINGS_WINDOW_RADIO (U"", U"Cubic", 1)
- Manual_DRAW_SETTINGS_WINDOW_RADIO (U"", U"Sinc70", 0)
- Manual_DRAW_SETTINGS_WINDOW_RANGE("Tilt line quefrency range (s)", U"0.001", U"0.0 (= end)")
- Manual_DRAW_SETTINGS_WINDOW_OPTIONMENU(U"Fit method", U"Robust")
- )
- NORMAL (U"The meaning of these settings is explained @@PowerCepstrum: Get peak prominence...|here@.")
- MAN_END
- MAN_BEGIN(U"PowerCepstrogram: Paint...", U"djmw", 20131001)
- INTRO (U"A command to draw the selected @@PowerCepstrogram@ object(s) in shades of grey.")
- ENTRY (U"Settings")
- SCRIPT (5, Manual_SETTINGS_WINDOW_HEIGHT (7), U""
- Manual_DRAW_SETTINGS_WINDOW (U"PowerCepstrogram: Paint", 7)
- Manual_DRAW_SETTINGS_WINDOW_RANGE("Time range (s)", U"0.0", U"0.0")
- Manual_DRAW_SETTINGS_WINDOW_RANGE("Quefrency range (s)", U"0.0", U"0.0")
- Manual_DRAW_SETTINGS_WINDOW_FIELD("Maximum (dB)", U"80.0")
- Manual_DRAW_SETTINGS_WINDOW_BOOLEAN("Autoscaling",0)
- Manual_DRAW_SETTINGS_WINDOW_FIELD("Dynamic range (dB)", U"30.0")
- Manual_DRAW_SETTINGS_WINDOW_FIELD("Dynamic compression (0-1)", U"0.0")
- Manual_DRAW_SETTINGS_WINDOW_BOOLEAN("Garnish",1)
- )
- TAG (U"##Time range (s)")
- DEFINITION (U"the time domain along the %%x% axis.")
- TAG (U"##Quefrency range (s)")
- DEFINITION (U"the quefency domain along the %%y% axis.")
- TAG (U"##Maximum (dB)")
- DEFINITION (U"cells that have cepstral values greater or equal than this value are drawn in black.")
- TAG (U"##Autoscaling")
- DEFINITION (U"If %%on%, overrules the effects of the previous option and the following three options. I.e. the global maximum and the "
- "global minimum cepstral values determine the maximum blackness and the minimal blackness. Values in-between have apropriate "
- "values of grey.")
- TAG (U"##Dynamic range (dB)")
- DEFINITION (U"All values more than %%Dynamic range% below the maximum will be drawn in white. Values in-between have apropriate "
- "values of grey.")
- TAG (U"##Dynamic compression (0-1)")
- DEFINITION (U"determines how much stronger weak frames should be made before drawing. Normally this parameter is between 0 and 1. "
- "If it is 0, no dynamic compression will take place. If it is 1, all time frames (vertical bands) will contain cepstral values "
- "that are drawn in black. If the global %%maximum% is set at 80 dB, %%autoscaling% is off, %%dynamic range% is 30 dB and "
- "%%dynamic compression% is 0.4 then for a frame with a local maximum of 40 dB all values will be lifted by 0.4*(80-40)=16 dB, "
- "so that its maximum will be seen at 56 dB (thus making the corresponding cell visible).")
- TAG (U"##Garnish")
- DEFINITION (U"Draws a box around the cepstrogram and labels the axes.")
- MAN_END
- MAN_BEGIN (U"PowerCepstrogram: Smooth...", U"djmw", 20140117)
- INTRO (U"Smoothes the selected @PowerCepstrogram by averaging cepstra. The smoothed PowerCepstrogram is the result of two separate steps. "
- "In the first step, cepsta are averaged across time. In the second step, cepstra are averaged across quefrency.")
- ENTRY (U"Settings")
- TAG (U"##Time averaging window (s)")
- DEFINITION (U"determines how many frames will used in the first step, averaging across time. The user-supplied value will be divided "
- "by the Cepstrograms's time step value (its %dx). If %%numberOfFramesToAverage%, the result of the division, turns out to be one or less, no averaging across time is performed. "
- "If %%numberOfFramesToAverage% is larger than one and is even, one will be added. "
- "Each new cepstral frame will be the average of %numberOfFramesToAverage frames of the input Cepstrogram. "
- "For example, if %numberOfFramesToAverage turns out to be 5, then the %j-th new cepstral frame is the result of averaging the 5 frames with indices %j\\--2 , %j\\--1, %j, %j+1 and %j+2 for all frames %j=3..%%numberOfFrames%\\--2, i.e. besides frame %j, the 2 frames on either side are used in the averaging. The %numberOfFramesToAverage has to be uneven to allow for this symmetric behaviour. ")
- TAG (U"##Quefrency averaging window (s)")
- DEFINITION (U"determines how many quefrency bins will be used for the averaging across quefrency step. The number of bins used in this step "
- "is the result of the division of the user-supplied value by the quefrency step value (the Cepstrogram's %dy). "
- "If the result turns out to be one or less, no averaging across quefrencies is performed. If the resulting value is even, one will be added. "
- "If, for example, the result happens to be 3 then the value in quefrency bin %k will be the average value of the values in quefrency bins "
- "%k\\--1, %k and %k+1. ")
- ENTRY (U"Note")
- NORMAL (U"The following commands should reproduce the smoothing described in the @@Hillenbrand & Houde (1996)@ article, where they use a 20 ms "
- "(10 frame) time smoothing and a 1 ms (10 bin) quefrency smoothing. ")
- CODE (U"selectObject (\"Sound xxx\")")
- CODE (U"To PowerCepstrogram: 0.041, 0.002, 5000.0")
- CODE (U"Smooth: 0.02, 0.001")
- MAN_END
- MAN_BEGIN (U"Cepstrum", U"djmw", 20130616)
- INTRO (U"One of the @@types of objects@ in P\\s{RAAT}.")
- ENTRY (U"Description")
- NORMAL (U"A Cepstrum is the log spectrum of the log power spectrum.")
- MAN_END
- MAN_BEGIN (U"PowerCepstrum", U"djmw", 20130616)
- INTRO (U"One of the @@types of objects@ in P\\s{RAAT}.")
- ENTRY (U"Description")
- NORMAL (U"A PowerCepstrum is the log power spectrum of the log power spectrum. The vertical scale will show the amplitude expressed in dB. The horizontal scale shows %%quefrency% in units of seconds.")
- MAN_END
- MAN_BEGIN (U"PowerCepstrum: Get peak prominence...", U"djmw", 20130616)
- INTRO (U"Calculates the cepstral peak prominence measure (CPP) as defined by @@Hillenbrand et al. (1994)@")
- NORMAL (U"The CPP measure is the difference in amplitude between the cepstral peak and the corresponding value on the regression "
- "line that is directly below the peak (i.e., the predicted magnitude for the quefrency at the cepstral peak). "
- "The CPP measure represents how far the cepstral peak emerges from the cepstrum background. ")
- ENTRY (U"Settings")
- SCRIPT (7, Manual_SETTINGS_WINDOW_HEIGHT (7), U""
- Manual_DRAW_SETTINGS_WINDOW (U"PowerCepstrum: Get peak prominence", 7)
- Manual_DRAW_SETTINGS_WINDOW_RANGE("Search peak in pitch range (s)", U"60.0", U"333.3")
- Manual_DRAW_SETTINGS_WINDOW_RADIO (U"Interpolation", U"None", 0)
- Manual_DRAW_SETTINGS_WINDOW_RADIO (U"", U"Parabolic", 0)
- Manual_DRAW_SETTINGS_WINDOW_RADIO (U"", U"Cubic", 1)
- Manual_DRAW_SETTINGS_WINDOW_RADIO (U"", U"Sinc70", 0)
- Manual_DRAW_SETTINGS_WINDOW_RANGE (U"Tilt line quefrency range (s)", U"0.001", U"0.0 (= end)")
- Manual_DRAW_SETTINGS_WINDOW_OPTIONMENU (U"Fit method", U"Robust")
- )
- TAG (U"##Search peak in pitch range")
- DEFINITION (U"determine the limits of the quefrency range where a peak is searched for. The lower quefrency is determined as "
- "1 / %%pitchCeiling% and this value is in general more critical than "
- "the value of the upper quefrency which equals 1 / %%pitchFloor%. A %%pitchCeiling% of 300 Hz will correspond to a lower quefrency of 1/300\\~~0.0033 seconds.")
- TAG (U"##Interpolation")
- DEFINITION (U"determines how the @@vector peak interpolation|amplitude of a peak is determined@.")
- TAG (U"##Tilt line quefrency range")
- DEFINITION (U"the quefrency range for which the amplitudes (in dB) will be modelled by a straight line. "
- "The lower value for this range in the Hillenbrand article was chosen as 0.001 s "
- "in order to reduce the effect of the low quefrency data on the straight line fit. In our analysis this value is not so critical "
- "as we use a more robust straight line fit.")
- TAG (U"##Fit method")
- DEFINITION (U"the default method is @@theil regression|Theil's robust line fit@. However, to be compatible with the past, a standard least squares line fit has also been implemented.")
- ENTRY (U"Note")
- NORMAL (U"The CPP value does not depend on the reference value used in the dB calculation of the power cepstrum.")
- MAN_END
- MAN_BEGIN (U"PowerCepstrum: Draw tilt line...", U"djmw", 20130616)
- INTRO (U"Draws the line that models the backgound of the power cepstrum.")
- MAN_END
- MAN_BEGIN (U"Formant & Spectrogram: To IntensityTier...", U"djmw", 20130109)
- INTRO (U"Determines the formant intensities from the selected Spectrogram.")
- NORMAL (U"The intensities at the frequencies of the selected formant are copied from the corresponding positions in the spectrogram. "
- "If the selected formant doesn't exist in a particular frame, then a large negative value (< -200 dB) is substituted instead. "
- "Because the values in the spectrogram are expressed in Pa^^2^/Hz, the units in the intensity tier are in dB/Hz. ")
- MAN_END
- MAN_BEGIN (U"LFCC", U"djmw", 20040421)
- INTRO (U"One of the @@types of objects@ in P\\s{RAAT}.")
- NORMAL (U"An object of type LFCC represents cepstral "
- "coefficients on a linear frequency scale as a function of time. "
- "The coefficients are represented in frames with constant sampling "
- "period.")
- ENTRY (U"#LFCC commands")
- NORMAL (U"Creation:")
- LIST_ITEM (U"\\bu @@LPC: To LFCC...")
- MAN_END
- MAN_BEGIN (U"LFCC: To LPC...", U"djmw", 20040407)
- INTRO (U"You can choose this command after selecting 1 or more @LFCC's.")
- ENTRY (U"Settings")
- TAG (U"##Number of coefficients")
- DEFINITION (U"the desired number of linear predictive coefficients.")
- ENTRY (U"Behaviour")
- NORMAL (U"The transformation from cepstral coefficients to %a-coefficients "
- "as described in @@Markel & Gray (1976)@.")
- MAN_END
- MAN_BEGIN (U"LPC", U"djmw", 19990610)
- INTRO (U"One of the @@types of objects@ in P\\s{RAAT}.")
- NORMAL (U"An object of type LPC represents filter coefficients as a function of time. "
- "The coefficients are represented in frames with constant sampling period.")
- ENTRY (U"LPC commands")
- NORMAL (U"Creation:")
- LIST_ITEM (U"\\bu @@Sound: To LPC (autocorrelation)...@")
- LIST_ITEM (U"\\bu @@Sound: To LPC (covariance)...@")
- LIST_ITEM (U"\\bu @@Sound: To LPC (burg)...@")
- LIST_ITEM (U"\\bu @@Sound: To LPC (marple)...@")
- ENTRY (U"Conversion")
- LIST_ITEM (U"\\bu @@LPC: To LFCC...|To LFCC...@")
- LIST_ITEM (U"\\bu @@LPC: To Spectrogram...|To Spectrogram...@")
- LIST_ITEM (U"\\bu @@LPC: To Spectrum (slice)...|To Spectrum (slice)...@")
- LIST_ITEM (U"\\bu @@LPC: To Polynomial (slice)...|To Polynomial (slice)...@")
- MAN_END
- MAN_BEGIN (U"LPC: Draw gain...", U"djmw", 20040407)
- INTRO (U"You can choose this command after selecting 1 or more @LPC objects.")
- ENTRY (U"Settings")
- TAG (U"##From time (s)#, ##To time (seconds)#")
- DEFINITION (U"the time domain along the %x-axis.")
- TAG (U"##Minimum gain#, ##Maximum gain#")
- DEFINITION (U"the range for the %y-axis.")
- TAG (U"##Garnish")
- DEFINITION (U"determines whether to draw a bounding box and axis labels.")
- ENTRY (U"Behaviour")
- NORMAL (U"Gain will be drawn as a function of time (gain also equals the prediction error "
- "energy). ")
- MAN_END
- MAN_BEGIN (U"LPC: Draw poles...", U"djmw", 20040407)
- INTRO (U"You can choose this command after selecting 1 or more @LPC objects.")
- ENTRY (U"Settings")
- TAG (U"##Time (s)")
- DEFINITION (U"the time of the nearest frame.")
- ENTRY (U"Behaviour")
- NORMAL (U"The @@Roots|roots@ of the @@LPC: To Polynomial (slice)...|linear prediction "
- "polynomial@, constructed from the coefficients "
- "of the analysis frame, will be drawn in the complex plane.")
- MAN_END
- MAN_BEGIN (U"LPC: To LFCC...", U"djmw", 20040407)
- INTRO (U"You can choose this command after selecting 1 or more @LPC objects.")
- ENTRY (U"Behaviour")
- NORMAL (U"The transformation from a-coefficients to cepstral coefficients "
- "as described in @@Markel & Gray (1976)@.")
- ENTRY (U"Settings")
- TAG (U"%%Number of coefficients%")
- DEFINITION (U"the desired number of cepstral coefficients.")
- MAN_END
- MAN_BEGIN (U"LPC: To Matrix", U"djmw", 20011123)
- INTRO (U"Copies the linear prediction coefficients of the selected @LPC "
- "object to a newly created @Matrix object.")
- ENTRY (U"Behaviour")
- FORMULA (U"%z__%ji_ = %a__%ij_, with 1 \\<_ %i \\<_ %nx and "
- "1 \\<_ j \\<_ %nCoefficients__%i_,")
- NORMAL (U"where %z__%ji_ is the matrix element in row %j and column %i and "
- "%a__%ij_ is the %j-th linear prediction coefficient in frame %i.")
- MAN_END
- MAN_BEGIN (U"LPC: To Formant", U"djmw", 19970123)
- INTRO (U"You can choose this command after selecting 1 or more @LPC objects.")
- ENTRY (U"Behaviour")
- NORMAL (U"For each LPC_Frame, the zeros of the linear prediction polynomial are extracted. "
- "Zeros that are outside the unit circle are reflected into it. "
- "Next, formant frequencies and bandwidths are calculated from all the roots that have the "
- "imaginary part positive, i.e., that lie in the upper half of the unit circle. "
- "Formant frequencies smaller than 50 Hz or larger than (%Nyquist_frequency - 50) are discarded. "
- "The remaining frequencies and bandwidths are sorted "
- "and copied to the Formant_Frame. Finally, the %gain field of the LPC is copied to the %intensity "
- "field of the Formant_Frame.")
- ENTRY (U"Algorithm")
- NORMAL (U"The root finder is Laguerre's method followed by root polishing, see @@Press "
- "et al. (1992)@.")
- ENTRY (U"Warning")
- LIST_ITEM (U"\\bu The formant values can be very inaccurate if you did not resample the Sound "
- "before the LPC-analysis (consult the @@Source-filter synthesis@ tutorial).")
- LIST_ITEM (U"\\bu The results of the root finder may not always be accurate when more than 30 "
- "roots have to be found.")
- MAN_END
- MAN_BEGIN (U"LPC: To Polynomial (slice)...", U"djmw", 20040407)
- INTRO (U"A command that creates a Polynomial object from each selected @LPC object.")
- ENTRY (U"Settings")
- TAG (U"##Time (s)")
- DEFINITION (U"defines the LPC frame whose coefficents will be selected.")
- ENTRY (U"Behaviour")
- NORMAL (U"The linear prediction coefficients %a__1..%n_ of the selected LPC "
- "frame will be copied to polynomial coefficients %c__1..%n+1_ as follows:")
- FORMULA (U"%c__%i_ = %a__%n\\--%i+1_, ")
- FORMULA (U"%c__%n+1_ = 1")
- MAN_END
- MAN_BEGIN (U"LPC: To Spectrum (slice)...", U"djmw", 20071120)
- INTRO (U"You can choose this command after selecting 1 or more @LPC objects.")
- ENTRY (U"Settings")
- TAG (U"##Time (s)")
- DEFINITION (U"the time at which the Spectrum should be calculated.")
- TAG (U"##Minimum frequency resolution (Hz)")
- DEFINITION (U"successive frequencies in the @Spectrum "
- "will be maximally this distance apart.")
- TAG (U"##Bandwidth reduction (Hz)")
- DEFINITION (U"formants with small bandwidths show up very well as peaks in the spectrum because the poles "
- "lie close to the contour along which the spectrum is computed (the unit circle in the z-plane). "
- "Peak enhancement can be realized by computing the spectrum in the z-plane along a contour of radius "
- "%r = exp (\\-- %\\pi \\.c %bandwidthReduction / %samplingFrequency). "
- "This technique is also called off-axis spectrum computation. "
- "Negative values evaluate the spectrum on a contour %outside the unit circle and therefore result in a "
- "flattened spectrum.")
- TAG (U"##De-emphasis frequency (Hz)")
- DEFINITION (U"Performs de-emphasis when frequency is in the interval (0, @@Nyquist frequency@)")
- ENTRY (U"Algorithm")
- NORMAL (U"The Spectrum at time %t will be calculated from the %nearest LPC_Frame according to:")
- FORMULA (U"Spectrum (%f) = \\Vr(%gain\\.c%T/%df) / (1 + \\su__%k=1..%numberOfCoefficients_ %a__%k_%z^^\\--%k^),")
- NORMAL (U"where %T is the sampling period and %z = exp (\\--2 %\\pi %i %f %T) and %df is the distance in Hz "
- "between two successive components in the Spectrum.")
- LIST_ITEM (U"1. Allocate a large enough buffer[1..%nfft] to perform an FFT analysis.")
- LIST_ITEM (U"2. Make the first value of the buffer 1 and copy the prediction coefficients #a into "
- "the buffer. This results in buffer values: (1, %a__1_, ..., %a__%numberOfCoefficients_, 0, ..., 0).")
- LIST_ITEM (U"3. If ##De-emphasis frequency# is in the interval (0, %nyquistFrequency) then \"multiply\" "
- "the buffer with (1 - %b %z^^\\--1^), where %b = exp (\\-- %\\pi %deEmphasisFrequency %T). "
- "This results in buffer values: (1, %a__1_\\--%b, %a__2_\\--%b\\.c%a__1_, ..., "
- "%a__%numberOfCoefficients_\\--%b\\.c%a__%numberOfCoefficients\\--1_, "
- "\\--%b\\.c%a__%numberOfCoefficients_, 0, ..., 0). Note that the number of values in the buffer that differ from 0 "
- "has increased by one.")
- LIST_ITEM (U"4. If ##Bandwidth reduction# is greater than 0 then multiply corresponding values in the buffer by %g^^%i\\--1^ where "
- "%g = exp (2%\\pi %bandwidthReduction %T / %nfft), and %i is the position index in the buffer. "
- "%i runs from 1 to %numberOfCoefficients+1+%t, where %t equals 1 when de-emphasis was performed, "
- "else 0.")
- LIST_ITEM (U"5. Calculate the FFT spectrum of the buffer with the coefficients. This results in complex "
- "amplitudes (%a__%j_,%b__%j_), %j=1..%nfft/2+1.")
- LIST_ITEM (U"6. Calculate the LPC Spectrum by taking the inverse of the FFT spectrum, i.e., each complex "
- "amplitude becomes (%a__%j_,%b__%j_)^^\\--1^ = (%a__%j_,\\--%b__%j_) / (%a__%j_^2 + %b__%j_^2)")
- LIST_ITEM (U"7. Multiply all values with the scale factor \\Vr(%gain\\.c%T/%df).")
- MAN_END
- MAN_BEGIN (U"LPC: To Spectrogram...", U"djmw", 20040407)
- INTRO (U"You can choose this command after selecting 1 or more @LPC objects.")
- ENTRY (U"Settings")
- TAG (U"##Minimum frequency resolution (Hz)")
- DEFINITION (U"successive frequencies in the Spectrum will be maximally this distance apart")
- TAG (U"##Bandwidth reduction (Hz)")
- DEFINITION (U"formants with small bandwidths show up very well as darker regions in the spectrogram "
- "because the poles lie close to the contour along which a spectrum is computed (the unit circle "
- "in the z-plane). "
- "Peak enhancement can be realized by computing a spectrum in the z-plane along a contour of radius "
- "%r = exp (\\-- %\\pi \\.c %bandwidthReduction / %samplingFrequency).")
- TAG (U"##De-emphasis frequency (Hz)")
- DEFINITION (U"Performs de-emphasis when value is in the interval (0, @@Nyquist frequency@)")
- ENTRY (U"Algorithm")
- NORMAL (U"For each LPC_Frame the corresponding Spectrum will be calculated according to the algorithm "
- "explained in @@LPC: To Spectrum (slice)...@. "
- "For each frequency the power, i.e., the square of the complex values, will be stored in the "
- "corresponding area in the Spectrogram.")
- MAN_END
- MAN_BEGIN (U"LPC: To VocalTract (slice)...", U"djmw", 20050615)
- INTRO (U"You can choose this command after selecting 1 or more @LPC objects.")
- ENTRY (U"Settings")
- TAG (U"##Time (s)")
- DEFINITION (U"the time of the nearest frame, in seconds.")
- TAG (U"##Length (m)")
- DEFINITION (U"the length of the vocal tract, in metres.")
- /*
- TAG (U"##Compute length according to Wakita")
- DEFINITION (U"the length of the vocal tract is calculated according "
- "to the algorithm as described in @@Wakita (1977)@.")
- ENTRY (U"Behaviour")
- NORMAL (U"A new @VocalTract area function is calculated from the prediction coefficients in the frame. ")
- ENTRY (U"Warning")
- NORMAL (U"If ##Compute length according to Wakita# is on, the optimal length is searched for in the range from 0.1 m to "
- "0.25 m. This length calculation is extremely sensitive to the number of and the positions of the formants "
- "with respect to the @@Nyquist frequency@. For example, there is a large difference "
- "between the vocal tract length estimates if the highest formant is just below or just above the "
- "Nyquist frequency. "
- "The algorithm is not very reliable in vocal tract length estimation and we do not recommend using it. " )*/
- MAN_END
- MAN_BEGIN (U"LPC & Sound: Filter...", U"djmw", 20040407)
- INTRO (U"A command that creates a new Sound object from one @Sound and one @LPC "
- "object which have been selected together.")
- ENTRY (U"Settings")
- TAG (U"##Use LPC gain")
- DEFINITION (U"Determines whether the gain from the LPC is used in the synthesis.")
- ENTRY (U"Behaviour")
- NORMAL (U"Filters the selected Sound by the selected LPC-filter.")
- NORMAL (U"When the LPC-gain is used the samples in the new Sound will be "
- "multiplied with the square root of the corresponding LPC-gain value.")
- NORMAL (U"In #Z-domain notation: #O(%z) = #H(%z) \\.c #E(%z), where "
- "#E(%z) is the selected filter input Sound, #H(%z) the selected LPC filter, "
- "and, #O(%z) the filter output (the new Sound that will appear in the List of objects).")
- MAN_END
- MAN_BEGIN (U"LPC & Sound: Filter with filter at time...", U"djmw", 20101009)
- INTRO (U"Filters the selected @Sound with a static filter that is formed by the filter coefficients "
- "from only one @LPC frame.")
- ENTRY (U"Settings")
- TAG (U"##Channel")
- DEFINITION (U"determines the sound channel to be filtered.")
- TAG (U"##Use filter at time (s)")
- DEFINITION (U"determines which LPC frame will be chosen to filter the sound. ")
- MAN_END
- MAN_BEGIN (U"LPC & Sound: Filter (inverse)", U"djmw", 19970126)
- INTRO (U"A command that creates a new Sound object from one @Sound and one @LPC "
- "object which have been selected together.")
- ENTRY (U"Behaviour")
- NORMAL (U"Given a filter (the selected LPC) and its output (the selected Sound), "
- "its input is reconstructed (the new Sound that will appear in the List of objects).")
- NORMAL (U"In Z-domain notation: #E(%z) = #O(%z) / #H(%z), where "
- "#O(%z) is the filter output Sound, #H(%z) the LPC filter, and, #E(%z) the filter "
- "input Sound. (Selecting this newly generated Sound and the LPC, choosing the option "
- "`Filter...' generates a Sound that is identical to the Sound that originated "
- "the LPC.)")
- MAN_END
- MAN_BEGIN (U"LPC & Sound: Filter (inverse) with filter at time...", U"djmw", 20101009)
- INTRO (U"%%Inverse% filters the selected @Sound with a static inverse filter that is formed by the filter coefficients "
- "from only one @LPC frame.")
- ENTRY (U"Settings")
- TAG (U"##Channel")
- DEFINITION (U"determines the sound channel to be filtered.")
- TAG (U"##Use filter at time (s)")
- DEFINITION (U"determines which LPC frame will be chosen to inverse filter the sound. ")
- MAN_END
- MAN_BEGIN (U"MFCC", U"djmw", 20160225)
- INTRO (U"One of the @@types of objects@ in P\\s{RAAT}.")
- NORMAL (U"An object of type MFCC represents mel frequency cepstral coefficients "
- "as a function of time. The coefficients are represented in a number of frames centred at equally spaced times. "
- "at constant sampling period.")
- ENTRY (U"MFCC commands")
- NORMAL (U"Creation:")
- LIST_ITEM (U"\\bu @@Sound: To MFCC...@")
- LIST_ITEM (U"\\bu @@MelSpectrogram: To MFCC...@")
- MAN_END
- MAN_BEGIN (U"MFCC: To MelFilter...", U"djmw", 20141023)
- INTRO (U"A #deprecated command replaced by @@MFCC: To MelSpectrogram...@.")
- ENTRY (U"Settings")
- TAG (U"##From coefficient#, ##To coefficient#")
- DEFINITION (U"the range of coefficients that will be used in the reconstruction.")
- ENTRY (U"Details")
- NORMAL (U"The output of the triangular filters in a mel filter bank will be "
- "reconstructed by applying the inverse cosine transform:")
- FORMULA (U"%P__%j_ = 2/N (%c__0_/2 + \\Si__%k=1_^^%N-1^ %c__%k_ cos (\\pi%k(%j-0.5)/%N))),")
- NORMAL (U"where %N represents the number of filters, %j runs from 1 to %N, and coefficients %c__%k_ with %k less than "
- "%%fromCoefficient% and %k larger than %%toCoefficient% take zero values in the evaluation.")
- MAN_END
- MAN_BEGIN (U"MFCC: To MelSpectrogram...", U"djmw", 20141023)
- INTRO (U"A command to (re)construct a @MelSpectrogram object from the selected @MFCC object.")
- ENTRY (U"Settings")
- TAG (U"##From coefficient#, ##To coefficient#")
- DEFINITION (U"the range of coefficients that will be used in the reconstruction.")
- TAG (U"##Include constant term")
- DEFINITION (U"selects whether or not to include the %c__0_ coefficient in the reconstruction. As can be seen from the formula below, the contribution of the %c__0_ term is equal for each filter.")
- ENTRY (U"Details")
- NORMAL (U"The values %P__%j_ in each frame of the MelSpectrogram will be constructed by applying the inverse Discrete Cosine Transform to the corresponding frame of the MFCC object:")
- FORMULA (U"%P__%j_ = 2/N (%c__0_/2 + \\Si__%k=1_^^%N-1^ %c__%k_ cos (\\pi%k(%j-0.5)/%N))),")
- NORMAL (U"where %N represents the number of filters that were used to get the MFCC object, %j runs from 1 to %N, and coefficients %c__%k_ with %k less than "
- "%%fromCoefficient% and %k larger than %%toCoefficient% take zero values in the evaluation.")
- MAN_END
- MAN_BEGIN (U"Sound: To PowerCepstrogram...", U"djmw", 20130616)
- INTRO (U"A command that creates a @@PowerCepstrogram@ from every selected @@Sound@.")
- ENTRY (U"Settings")
- TAG (U"##Pitch floor (Hz)")
- DEFINITION (U"determines the effective length of the analysis window: it will be 3 longest periods long, i.e. if the pitch floor is 60 Hz, the window will be 3/60 = 0.05 seconds long.")
- TAG (U"##Time step (s)")
- TAG (U"##Maximum frequency (Hz)")
- TAG (U"##Pre-emphasis from (Hz)")
- MAN_END
- MAN_BEGIN (U"Sound: To Formant (robust)...", U"djmw", 20111027)
- INTRO (U"A command that creates a @@Formant@ object from every selected @@Sound@. ")
- ENTRY (U"Settings")
- NORMAL (U"The settings for ##Time step (s)#, ##Maximum number of formants#, ##Maximum formant (Hz), "
- "##Window length (s)# and ##Pre emphasis from (Hz)# are as in @@Sound: To Formant (burg)...@. "
- " The following settings determine aspects of the iterative formant frequency refinement.")
- TAG (U"%%Number of std. dev.%,")
- DEFINITION (U"determines the number of standard deviation from where selective weighing of samples starts. ")
- TAG (U"%%Maximum number of iterations%,")
- DEFINITION (U"determines the maximum number of iterations allowed in the refinement step.")
- TAG (U"%%Tolerance%,")
- DEFINITION (U"detemines another stop ctriterion for the refinement step. If the relative change in variance "
- "between successive iterations is less then this value, iteration stops. Iteration stops whenever "
- "one of the two defined stop criteria is reached.")
- ENTRY (U"Algorithm")
- NORMAL (U"First the sound is downsampled to twice the maximum formant frequency. Next the LPC coefficients are determined by the autocorrelation method. Finally, in an iterative procedure as described by @@Lee (1988)@ the formant frequencies and bandwidths are refined by selectively weighting of samples values.")
- MAN_END
- MAN_BEGIN (U"Sound: LPC analysis", U"djmw", 19970126)
- INTRO (U"You can perform this analysis by selecting one or more @Sound objects and "
- "choosing the appropriate command to generate an @LPC.")
- NORMAL (U"The acronym LPC stands for Linear Predictive Coding.")
- NORMAL (U"In the LPC analysis one tries to predict %x__%n_ on the basis of the %p previous samples,")
- FORMULA (U"%x\\'p__%n_ = \\su %a__%k_ %x__%%n-k%_")
- NORMAL (U"then {%a__1_, %a__2_, ..., %a__%p_} can be chosen to minimize the prediction power %%Q__p_% where")
- FORMULA (U"%%Q__p_% = E[ |%x__%n_ - %x\\'p__%n_|^2].")
- NORMAL (U"Several different algorithms exist for minimizing %%Q__p_%:")
- LIST_ITEM (U"\\bu @@Sound: To LPC (autocorrelation)...|To LPC (autocorrelation)...@")
- LIST_ITEM (U"\\bu @@Sound: To LPC (covariance)...|To LPC (covariance)...@")
- LIST_ITEM (U"\\bu @@Sound: To LPC (burg)...|To LPC (burg)...@")
- LIST_ITEM (U"\\bu @@Sound: To LPC (marple)...|To LPC (marple)...@")
- MAN_END
- #define Sound_to_LPC_COMMON_HELP(method) \
- INTRO (U"With this command you create a new @LPC from every selected @Sound, " \
- "using " method " method.") \
- ENTRY (U"Warning") \
- NORMAL (U"You are advised not to use this command for formant analysis. " \
- "For formant analysis, instead use @@Sound: To Formant (burg)...@, " \
- "which also works via LPC (linear predictive coding). This is because " \
- "##Sound: To Formant (burg)...# lets you specify a maximum frequency, " \
- "whereas the ##To LPC# commands automatically use the @@Nyquist frequency@ " \
- "as their maximum frequency. If you do use one of the ##To LPC# commands " \
- "for formant analysis, you may therefore want to downsample the sound first. " \
- "For instance, if you want five formants below 5500 Hz but your Sound has a sampling frequency " \
- "of 44100 Hz, you have to downsample the sound to 11000 Hz with the @@Sound: Resample...@ command. " \
- "After that, you can use the ##To LPC# commands, with a prediction order of 10 or 11.") \
- ENTRY (U"Settings") \
- TAG (U"##Prediction order#") \
- DEFINITION (U"the number of linear prediction coefficients, also called the %%number of poles%. " \
- "Choose this number at least twice as large as the number of spectral peaks that you want " \
- "to detect.") \
- TAG (U"##Analysis window duration (s)") \
- DEFINITION (U"the effective duration of each analysis frame, in seconds.") \
- TAG (U"##Time step (s)") \
- DEFINITION (U"the time step between two consecutive analysis frames.") \
- TAG (U"##Pre-emphasis frequency (Hz)") \
- DEFINITION (U"a +6dB / octave filtering will be applied above this frequency. " \
- "A pre-emphasis frequency of 48.47 Hz for a signal with a sampling frequency of 10 kHz " \
- "approximately corresponds to a value of %a = 0.97 for the filter %y__%n_ = %x__%n_ - %a \\.c %x__%n-1_. " \
- "The relation between %a and the pre-emphasis frequency is: " \
- "%a = exp (\\--2\\.c%\\pi\\.c%preemphasisFrequency/%samplingFrequency). " \
- "If you do not want pre-emphasis, choose a frequency greater than the @@Nyquist frequency@.")
- MAN_BEGIN (U"Sound: To LPC (autocorrelation)...", U"David Weenink & Paul Boersma", 20040407)
- Sound_to_LPC_COMMON_HELP ("the autocorrelation")
- ENTRY (U"Algorithm")
- NORMAL (U"The autocorrelation algorithm is decribed in @@Markel & Gray (1976)@.")
- MAN_END
- MAN_BEGIN (U"Sound: To LPC (covariance)...", U"David Weenink & Paul Boersma", 20040407)
- Sound_to_LPC_COMMON_HELP ("the covariance")
- ENTRY (U"Algorithm")
- NORMAL (U"The covariance algorithm is decribed in @@Markel & Gray (1976)@.")
- MAN_END
- MAN_BEGIN (U"Sound: To LPC (marple)...", U"djmw", 19970126)
- Sound_to_LPC_COMMON_HELP ("Marple's")
- TAG (U"##Tolerance 1")
- DEFINITION (U"stop the iteration when %E(%m) / %E(0) < %%Tolerance 1%, where %E(%m) is the "
- "prediction error for order %m.")
- TAG (U"##Tolerance 2")
- DEFINITION (U"stop the iteration when (%E(%m) - %E(%m-1)) / %E(%m-1) < %%Tolerance 2.")
- ENTRY (U"Algorithm")
- NORMAL (U"The algorithm is described in @@Marple (1980)@.")
- MAN_END
- MAN_BEGIN (U"Sound: To LPC (burg)...", U"David Weenink & Paul Boersma", 20040407)
- Sound_to_LPC_COMMON_HELP ("Burg's")
- ENTRY (U"Algorithm")
- NORMAL (U"Burg's algorithm is described in @@Anderson (1978)@")
- MAN_END
- MAN_BEGIN (U"Sound: To MFCC...", U"djmw", 20141022)
- INTRO (U"A command that creates a @MFCC object from every selected @Sound "
- "object.")
- NORMAL (U"The analysis proceeds in two steps:")
- LIST_ITEM (U"1. We perform a spectrum analysis on a mel frequency scale "
- "(see @@Sound: To MelSpectrogram...@ for details).")
- LIST_ITEM (U"2. We convert the melspectrogram values to mel frequency cepstral "
- "coefficients (see @@MelSpectrogram: To MFCC...@ for details).")
- MAN_END
- MAN_BEGIN (U"Spectrum: To PowerCepstrum", U"djmw", 20160909)
- INTRO (U"A command to create a @PowerCepstrum from every selected @Spectrum.")
- ENTRY (U"Mathematical procedure")
- MAN_END
- MAN_BEGIN (U"VocalTractTier", U"djmw", 20120423)
- INTRO (U"One of the @@types of objects@ in Praat. A VocalTractTier objects contains a number of (%time, %VocalTract) points, where a @@VocalTract@ represents the area function of the vocal tract expressed as m^^2^, running from the glottis to the lips.")
- MAN_END
- MAN_BEGIN (U"theil regression", U"djmw", 20130710)
- NORMAL (U"a robust linear regression method, first proposed by @@Theil (1950)@. The slope of the regression line is estimated as "
- "the median of all pairwise slopes between each pair of points in the data set. Because this number of pairs increases quadratically "
- "with the number of data points, we have implemented a somewhat less computationally intensive procedure, the %%incomplete% theil regression. In the incomplete method we first split the data set of %N data points (%x__%i_, %y__%i_), %i = 1..%N, in two equal sets "
- "of size %N/2 and then calculate %N/2 slopes as ")
- FORMULA (U"%m__%i_ = (%y__%N/2+%i_ - %y__%i_) / (%x__%N/2+%i_ - %x__%i_), for %i = 1..%N/2.")
- NORMAL (U"The regression slope %m is calculated as the median of these %N/2 values %m__%i_.")
- NORMAL (U"Given the slope %m, the offset %b is calculated as the median of the %N values %b__%i_= %y__%i_ - %m\\.c%x__%i_.")
- NORMAL (U"The theil regression has a breakdown point of 29.3\\% , which means that it can tolerate arbitrary corruption of up to 29.3% of the input data-points without degradation of its accuracy")
- MAN_END
- MAN_BEGIN (U"Anderson (1978)", U"djmw", 20030701)
- NORMAL (U"N. Anderson (1978): \"On the calculation of filter coefficients for "
- "maximum entropy spectral analysis.\" In Childers: %%Modern Spectrum Analysis%, "
- "IEEE Press: 252\\--255.")
- MAN_END
- MAN_BEGIN (U"Hillenbrand et al. (1994)", U"djmw", 20121017)
- NORMAL (U"J. Hillenbrand, R.A. Cleveland & R.L. Erickson (1994): \"Acoustic correlates of breathy vocal quality\", %%Journal of speech and hearing research% #37: 769\\--778.")
- MAN_END
- MAN_BEGIN (U"Hillenbrand & Houde (1996)", U"djmw", 20121203)
- NORMAL (U"J. Hillenbrand & R.A. Houde (1996): \"Acoustic correlates of breathy vocal quality: Dysphonic voices and continuous speech\", %%Journal of speech and hearing research% #39: 311\\--321.")
- MAN_END
- MAN_BEGIN (U"Lee (1988)", U"djmw", 20111027)
- NORMAL (U"C.-H. Lee (1988): \"On Robust Linear Prediction of Speech.\", %%IEEE Trans. on ASSP% #36: 642\\--649.")
- MAN_END
- MAN_BEGIN (U"Markel & Gray (1976)", U"djmw", 19980114)
- NORMAL (U"J.D. Markel & A.H. Gray, Jr. (1976): %%Linear Prediction of Speech.% "
- "Springer Verlag, Berlin.")
- MAN_END
- MAN_BEGIN (U"Marple (1980)", U"djmw", 19980114)
- NORMAL (U"L. Marple (1980): \"A new autoregressive spectrum analysis algorithm.\" "
- "%%IEEE Trans. on ASSP% #28, 441\\--454.")
- MAN_END
- MAN_BEGIN (U"Rothweiler (1999)", U"djmw", 20160507)
- NORMAL (U"J. Rothweiler (1999): \"On Polynomial Reduction in the Computation of LSP Frequencies.\" "
- "%%IEEE Trans. on ASSP% #7, 592\\--594.")
- MAN_END
- MAN_BEGIN (U"Theil (1950)", U"djmw", 20121118)
- NORMAL (U"H. Theil (1950): \"A rank-invariant method of linear and polynomial regression analysis\", "
- "%%Proceedings of Koninklijke Nederlandse Akademie van Wetenschappen% ##A.53#: 1397\\--1412.")
- MAN_END
- MAN_BEGIN (U"Wakita (1977)", U"djmw", 19980114)
- NORMAL (U"H. Wakita (1977): \"Normalization of vowels by vocal-tract "
- "length and its application to vowel identification.\" %%IEEE Trans. on ASSP% "
- "#25: 183\\--192.")
- MAN_END
- }
- /* End of file manual_LPC.cpp */
|