123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483 |
- /* Cepstrogram.cpp
- *
- * Copyright (C) 2013 - 2017 David Weenink
- *
- * This code is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or (at
- * your option) any later version.
- *
- * This code is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this work. If not, see <http://www.gnu.org/licenses/>.
- */
- /*
- djmw 20010514
- djmw 20020812 GPL header
- djmw 20080122 Version 1: float -> double
- djmw 20110304 Thing_new
- */
- #include "Cepstrogram.h"
- #include "Cepstrum_and_Spectrum.h"
- #include "NUM2.h"
- #include "Sound_and_Spectrum.h"
- #include "Sound_extensions.h"
- #define TOLOG(x) ((1 / NUMln10) * log ((x) + 1e-30))
- #define TO10LOG(x) ((10 / NUMln10) * log ((x) + 1e-30))
- #define FROMLOG(x) (exp ((x) * (NUMln10 / 10.0)) - 1e-30)
- Thing_implement (Cepstrogram, Matrix, 2);
- Thing_implement (PowerCepstrogram, Cepstrogram, 2); // derives from Matrix -> also version 2
- autoCepstrogram Cepstrogram_create (double tmin, double tmax, integer nt, double dt, double t1,
- double qmin, double qmax, integer nq, double dq, double q1) {
- try {
- autoCepstrogram me = Thing_new (Cepstrogram);
- Matrix_init (me.get(), tmin, tmax, nt, dt, t1, qmin, qmax, nq, dq, q1);
- return me;
- } catch (MelderError) {
- Melder_throw (U"Cepstrogram not created.");
- }
- }
- autoPowerCepstrogram PowerCepstrogram_create (double tmin, double tmax, integer nt, double dt, double t1,
- double qmin, double qmax, integer nq, double dq, double q1) {
- try {
- autoPowerCepstrogram me = Thing_new (PowerCepstrogram);
- Matrix_init (me.get(), tmin, tmax, nt, dt, t1, qmin, qmax, nq, dq, q1);
- return me;
- } catch (MelderError) {
- Melder_throw (U"PowerCepstrogram not created.");
- }
- }
- void PowerCepstrogram_paint (PowerCepstrogram me, Graphics g, double tmin, double tmax, double qmin, double qmax, double dBmaximum, int autoscaling, double dynamicRangedB, double dynamicCompression, int garnish) {
- if (tmax <= tmin) { tmin = my xmin; tmax = my xmax; }
- if (qmax <= qmin) { qmin = my ymin; qmax = my ymax; }
- integer itmin, itmax, ifmin, ifmax;
- if (! Matrix_getWindowSamplesX (me, tmin - 0.49999 * my dx, tmax + 0.49999 * my dx, & itmin, & itmax) ||
- ! Matrix_getWindowSamplesY (me, qmin - 0.49999 * my dy, qmax + 0.49999 * my dy, & ifmin, & ifmax)) {
- return;
- }
- autoMatrix thee = Data_copy (me);
- double min = 1e308, max = -min;
- for (integer i = 1; i <= my ny; i ++) {
- for (integer j = 1; j <= my nx; j ++) {
- double val = TO10LOG (my z [i] [j]);
- if (val < min) min = val;
- if (val > max) max = val;
- thy z [i] [j] = val;
- }
- }
- double dBminimum = dBmaximum - dynamicRangedB;
- if (autoscaling) {
- dBminimum = min;
- dBmaximum = max;
- }
- for (integer j = 1; j <= my nx; j ++) {
- double lmax = thy z [1] [j];
- for (integer i = 2; i <= my ny; i ++) {
- if (thy z [i] [j] > lmax) {
- lmax = thy z [i] [j];
- }
- }
- double factor = dynamicCompression * (max - lmax);
- for (integer i = 1; i <= my ny; i ++) {
- thy z [i] [j] += factor;
- }
- }
-
- Graphics_setInner (g);
- Graphics_setWindow (g, tmin, tmax, qmin, qmax);
- Graphics_image (g, thy z.at,
- itmin, itmax,
- Matrix_columnToX (thee.get(), itmin - 0.5),
- Matrix_columnToX (thee.get(), itmax + 0.5),
- ifmin, ifmax,
- Matrix_rowToY (thee.get(), ifmin - 0.5),
- Matrix_rowToY (thee.get(), ifmax + 0.5),
- dBminimum, dBmaximum);
- Graphics_unsetInner (g);
- if (garnish) {
- Graphics_drawInnerBox (g);
- Graphics_textBottom (g, true, U"Time (s)");
- Graphics_marksBottom (g, 2, true, true, false);
- Graphics_marksLeft (g, 2, true, true, false);
- Graphics_textLeft (g, true, U"Quefrency (s)");
- }
- }
- void PowerCepstrogram_subtractTilt_inplace (PowerCepstrogram me, double qstartFit, double qendFit, int lineType, int fitMethod) {
- try {
- autoPowerCepstrum thee = PowerCepstrum_create (my ymax, my ny);
- for (integer i = 1; i <= my nx; i ++) {
- for (integer j = 1; j <= my ny; j ++) {
- thy z [1] [j] = my z [j] [i];
- }
- PowerCepstrum_subtractTilt_inplace (thee.get(), qstartFit, qendFit, lineType, fitMethod);
- for (integer j = 1; j <= my ny; j ++) {
- my z [j] [i] = thy z [1] [j];
- }
- }
- } catch (MelderError) {
- Melder_throw (me, U": no tilt subtracted (inline).");
- }
- }
- autoPowerCepstrogram PowerCepstrogram_subtractTilt (PowerCepstrogram me, double qstartFit, double qendFit, int lineType, int fitMethod) {
- try {
- autoPowerCepstrogram thee = Data_copy (me);
- PowerCepstrogram_subtractTilt_inplace (thee.get(), qstartFit, qendFit, lineType, fitMethod);
- return thee;
- } catch (MelderError) {
- Melder_throw (me, U": no tilt subtracted.");
- }
-
- }
- autoTable PowerCepstrogram_to_Table_hillenbrand (PowerCepstrogram me, double pitchFloor, double pitchCeiling) {
- try {
- autoTable thee = Table_createWithColumnNames (my nx, U"time quefrency cpp f0");
- autoPowerCepstrum him = PowerCepstrum_create (my ymax, my ny);
- for (integer i = 1; i <= my nx; i ++) {
- for (integer j = 1; j <= my ny; j ++) {
- his z [1] [j] = my z [j] [i];
- }
- double qpeak, cpp = PowerCepstrum_getPeakProminence_hillenbrand (him.get(), pitchFloor, pitchCeiling, &qpeak);
- double time = Sampled_indexToX (me, i);
- Table_setNumericValue (thee.get(), i, 1, time);
- Table_setNumericValue (thee.get(), i, 2, qpeak);
- Table_setNumericValue (thee.get(), i, 3, cpp); // Cepstrogram_getCPPS depends on this index 3!!
- Table_setNumericValue (thee.get(), i, 4, 1.0 / qpeak);
- }
- return thee;
- } catch (MelderError) {
- Melder_throw (me, U": no Table with cepstral peak prominence values created.");
- }
- }
- autoTable PowerCepstrogram_to_Table_cpp (PowerCepstrogram me, double pitchFloor, double pitchCeiling, double deltaF0, int interpolation, double qstartFit, double qendFit, int lineType, int fitMethod) {
- try {
- autoTable thee = Table_createWithColumnNames (my nx, U"time quefrency cpp f0 rnr");
- autoPowerCepstrum him = PowerCepstrum_create (my ymax, my ny);
- for (integer i = 1; i <= my nx; i ++) {
- for (integer j = 1; j <= my ny; j ++) {
- his z [1] [j] = my z [j] [i];
- }
- double qpeak, cpp = PowerCepstrum_getPeakProminence (him.get(), pitchFloor, pitchCeiling, interpolation,
- qstartFit, qendFit, lineType, fitMethod, & qpeak);
- double rnr = PowerCepstrum_getRNR (him.get(), pitchFloor, pitchCeiling, deltaF0);
- double time = Sampled_indexToX (me, i);
- Table_setNumericValue (thee.get(), i, 1, time);
- Table_setNumericValue (thee.get(), i, 2, qpeak);
- Table_setNumericValue (thee.get(), i, 3, cpp); // Cepstrogram_getCPPS depends on this index!!
- Table_setNumericValue (thee.get(), i, 4, 1.0 / qpeak);
- Table_setNumericValue (thee.get(), i, 5, rnr);
- }
- return thee;
- } catch (MelderError) {
- Melder_throw (me, U": no Table with cepstral peak prominence values created.");
- }
- }
- autoPowerCepstrogram PowerCepstrogram_smooth (PowerCepstrogram me, double timeAveragingWindow, double quefrencyAveragingWindow) {
- try {
- autoPowerCepstrogram thee = Data_copy (me);
- // 1. average across time
- integer numberOfFrames = Melder_ifloor (timeAveragingWindow / my dx);
- if (numberOfFrames > 1) {
- autoVEC qin = VECraw (my nx);
- autoVEC qout = VECraw (my nx);
- for (integer iq = 1; iq <= my ny; iq ++) {
- VECcopy_preallocated (qin.get(), thy z.row(iq));
- VECsmoothByMovingAverage_preallocated (qout.get(), qin.get(), numberOfFrames);
- VECcopy_preallocated (thy z.row(iq), qout.get());
- }
- }
- // 2. average across quefrencies
- integer numberOfQuefrencyBins = Melder_ifloor (quefrencyAveragingWindow / my dy);
- if (numberOfQuefrencyBins > 1) {
- autoVEC qin = VECraw (thy ny);
- autoVEC qout = VECraw (thy ny);
- for (integer iframe = 1; iframe <= my nx; iframe ++) {
- for (integer iq = 1; iq <= thy ny; iq ++) {
- //qin[iq] = TO10LOG (my z[iq][iframe]);
- qin [iq] = thy z [iq] [iframe];
- }
- VECsmoothByMovingAverage_preallocated (qout.get(), qin.get(), numberOfQuefrencyBins);
- for (integer iq = 1; iq <= thy ny; iq ++) {
- //thy z[iq][iframe] = FROMLOG (qout[iq]);
- thy z [iq] [iframe] = qout [iq];
- }
- }
- }
- return thee;
- } catch (MelderError) {
- Melder_throw (me, U": not smoothed.");
- }
- }
- autoMatrix PowerCepstrogram_to_Matrix (PowerCepstrogram me) {
- try {
- autoMatrix thee = Thing_new (Matrix);
- my structMatrix :: v_copy (thee.get());
- return thee;
- } catch (MelderError) {
- Melder_throw (me, U": not converted to Matrix.");
- }
- }
- autoPowerCepstrum PowerCepstrogram_to_PowerCepstrum_slice (PowerCepstrogram me, double time) {
- try {
- integer iframe = Sampled_xToNearestIndex (me, time);
- iframe = iframe < 1 ? 1 : iframe > my nx ? my nx : iframe;
- autoPowerCepstrum thee = PowerCepstrum_create (my ymax, my ny);
- for (integer i = 1; i <= my ny; i ++) {
- thy z [1] [i] = my z [i] [iframe];
- }
- return thee;
- } catch (MelderError) {
- Melder_throw (me, U": Cepstrum not extracted.");
- }
- }
- autoPowerCepstrogram Matrix_to_PowerCepstrogram (Matrix me) {
- try {
- autoPowerCepstrogram thee = Thing_new (PowerCepstrogram);
- my structMatrix :: v_copy (thee.get());
- return thee;
- } catch (MelderError) {
- Melder_throw (me, U": not converted to PowerCepstrogram.");
- }
- }
- autoPowerCepstrogram Sound_to_PowerCepstrogram (Sound me, double pitchFloor, double dt, double maximumFrequency, double preEmphasisFrequency) {
- try {
- // minimum analysis window has 3 periods of lowest pitch
- double analysisWidth = 3.0 / pitchFloor;
- double windowDuration = 2.0 * analysisWidth; /* gaussian window */
- integer nFrames;
- // Convenience: analyse the whole sound into one Cepstrogram_frame
- if (windowDuration > my dx * my nx) {
- windowDuration = my dx * my nx;
- }
- double t1, samplingFrequency = 2 * maximumFrequency;
- autoSound sound = Sound_resample (me, samplingFrequency, 50);
- Sound_preEmphasis (sound.get(), preEmphasisFrequency);
- Sampled_shortTermAnalysis (me, windowDuration, dt, & nFrames, & t1);
- autoSound sframe = Sound_createSimple (1, windowDuration, samplingFrequency);
- autoSound window = Sound_createGaussian (windowDuration, samplingFrequency);
- // find out the size of the FFT
- integer nfft = 2;
- while (nfft < sframe -> nx) nfft *= 2;
- integer nq = nfft / 2 + 1;
- double qmax = 0.5 * nfft / samplingFrequency, dq = qmax / (nq - 1);
- autoPowerCepstrogram thee = PowerCepstrogram_create (my xmin, my xmax, nFrames, dt, t1, 0, qmax, nq, dq, 0);
- autoMelderProgress progress (U"Cepstrogram analysis");
- for (integer iframe = 1; iframe <= nFrames; iframe++) {
- double t = Sampled_indexToX (thee.get(), iframe);
- Sound_into_Sound (sound.get(), sframe.get(), t - windowDuration / 2);
- Vector_subtractMean (sframe.get());
- Sounds_multiply (sframe.get(), window.get());
- autoSpectrum spec = Sound_to_Spectrum (sframe.get(), true); // FFT yes
- autoPowerCepstrum cepstrum = Spectrum_to_PowerCepstrum (spec.get());
- for (integer i = 1; i <= nq; i ++) {
- thy z [i] [iframe] = cepstrum -> z [1] [i];
- }
- if ((iframe % 10) == 1) {
- Melder_progress ((double) iframe / nFrames, U"PowerCepstrogram analysis of frame ",
- iframe, U" out of ", nFrames, U".");
- }
- }
- return thee;
- } catch (MelderError) {
- Melder_throw (me, U": no PowerCepstrogram created.");
- }
- }
- autoCepstrum Spectrum_to_Cepstrum_hillenbrand (Spectrum me);
- autoCepstrum Spectrum_to_Cepstrum_hillenbrand (Spectrum me) {
- try {
- autoNUMfft_Table fftTable;
- // originalNumberOfSamplesProbablyOdd irrelevant
- if (my x1 != 0.0) {
- Melder_throw (U"A Fourier-transformable Spectrum must have a first frequency of 0 Hz, not ", my x1, U" Hz.");
- }
- integer numberOfSamples = my nx - 1;
- autoCepstrum thee = Cepstrum_create (0.5 / my dx, my nx);
- NUMfft_Table_init (& fftTable, my nx);
- autoVEC amp = VECraw (my nx);
-
- for (integer i = 1; i <= my nx; i ++) {
- amp [i] = my v_getValueAtSample (i, 0, 2);
- }
- NUMfft_forward (& fftTable, amp.get());
-
- for (integer i = 1; i <= my nx; i ++) {
- double val = amp [i] / numberOfSamples;// scaling 1/n because ifft(fft(1))= n;
- thy z [1] [i] = val * val; // power cepstrum
- }
- return thee;
- } catch (MelderError) {
- Melder_throw (me, U": not converted to Sound.");
- }
- }
- // 1 2 nfftdiv2
- // re im re im re im
- // ((fft[1],0) (fft[2],fft[3]), (,), (,), (fft[nfft], 0)) nfft even
- // ((fft[1],0) (fft[2],fft[3]), (,), (,), (fft[nfft-1], fft[nfft])) nfft uneven
- static void complexfftoutput_to_power (constVEC fft, VEC dbs, bool to_db) {
- double valsq = fft [1] * fft [1];
- dbs[1] = to_db ? TOLOG (valsq) : valsq;
- integer nfftdiv2p1 = (fft.size + 2) / 2;
- integer nend = fft.size % 2 == 0 ? nfftdiv2p1 : nfftdiv2p1 + 1;
- for (integer i = 2; i < nend; i ++) {
- double re = fft [i + i - 2], im = fft [i + i - 1];
- valsq = re * re + im * im;
- dbs [i] = to_db ? TOLOG (valsq) : valsq;
- }
- if (fft.size % 2 == 0) {
- valsq = fft [fft.size] * fft [fft.size];
- dbs[nfftdiv2p1] = to_db ? TOLOG (valsq) : valsq;
- }
- }
- autoPowerCepstrogram Sound_to_PowerCepstrogram_hillenbrand (Sound me, double pitchFloor, double dt) {
- try {
- // minimum analysis window has 3 periods of lowest pitch
- double analysisWidth = 3.0 / pitchFloor;
- if (analysisWidth > my dx * my nx) {
- analysisWidth = my dx * my nx;
- }
- double samplingFrequency = 1.0 / my dx;
- autoSound thee;
- if (samplingFrequency > 30000) {
- samplingFrequency = samplingFrequency / 2.0;
- thee = Sound_resample (me, samplingFrequency, 1);
- } else {
- thee = Data_copy (me);
- }
- // pre-emphasis with fixed coefficient 0.9
- for (integer i = thy nx; i > 1; i --) {
- thy z [1] [i] -= 0.9 * thy z [1] [i - 1];
- }
- integer nosInWindow = (integer) floorl (analysisWidth * samplingFrequency), numberOfFrames;
- if (nosInWindow < 8) {
- Melder_throw (U"Analysis window too short.");
- }
- double t1;
- Sampled_shortTermAnalysis (thee.get(), analysisWidth, dt, & numberOfFrames, & t1);
- autoNUMvector<double> hamming (1, nosInWindow);
- for (integer i = 1; i <= nosInWindow; i ++) {
- hamming [i] = 0.54 -0.46 * cos(2 * NUMpi * (i - 1) / (nosInWindow - 1));
- }
- integer nfft = 8; // minimum possible
- while (nfft < nosInWindow) { nfft *= 2; }
- integer nfftdiv2 = nfft / 2;
- autoVEC fftbuf = VECzero (nfft); // "complex" array
- autoVEC spectrum = VECzero (nfftdiv2 + 1); // +1 needed
- autoNUMfft_Table fftTable;
- NUMfft_Table_init (& fftTable, nfft); // sound to spectrum
-
- double qmax = 0.5 * nfft / samplingFrequency, dq = qmax / (nfftdiv2 + 1);
- autoPowerCepstrogram him = PowerCepstrogram_create (my xmin, my xmax, numberOfFrames, dt, t1, 0, qmax, nfftdiv2+1, dq, 0);
-
- autoMelderProgress progress (U"Cepstrogram analysis");
-
- for (integer iframe = 1; iframe <= numberOfFrames; iframe ++) {
- double tbegin = t1 + (iframe - 1) * dt - analysisWidth / 2;
- tbegin = tbegin < thy xmin ? thy xmin : tbegin;
- integer istart = Sampled_xToLowIndex (thee.get(), tbegin); // ppgb: afronding naar beneden?
- istart = istart < 1 ? 1 : istart;
- integer iend = istart + nosInWindow - 1;
- iend = iend > thy nx ? thy nx : iend;
- for (integer i = 1; i <= nosInWindow; i ++) {
- fftbuf [i] = thy z [1] [istart + i - 1] * hamming [i];
- }
- for (integer i = nosInWindow + 1; i <= nfft; i ++) {
- fftbuf [i] = 0;
- }
- NUMfft_forward (&fftTable, fftbuf.get());
- complexfftoutput_to_power (fftbuf.get(), spectrum.get(), true); // log10(|fft|^2)
- // subtract average
- double specmean = spectrum [1];
- for (integer i = 2; i <= nfftdiv2 + 1; i ++) {
- specmean += spectrum [i];
- }
- specmean /= nfftdiv2 + 1;
- for (integer i = 1; i <= nfftdiv2 + 1; i ++) {
- spectrum [i] -= specmean;
- }
- /*
- * Here we diverge from Hillenbrand as he takes the fft of half of the spectral values.
- * H. forgets that the actual spectrum has nfft/2+1 values. Thefore, we take the inverse
- * transform because this keeps the number of samples a power of 2.
- * At the same time this results in twice as many numbers in the quefrency domain, i.e. we end up with nfft/2+1
- * numbers while H. has only nfft/4!
- */
- fftbuf [1] = spectrum [1];
- for (integer i = 2; i < nfftdiv2 + 1; i ++) {
- fftbuf [i+i-2] = spectrum [i];
- fftbuf [i+i-1] = 0;
- }
- fftbuf [nfft] = spectrum [nfftdiv2 + 1];
- NUMfft_backward (& fftTable, fftbuf.get());
- for (integer i = 1; i <= nfftdiv2 + 1; i ++) {
- his z [i] [iframe] = fftbuf [i] * fftbuf [i];
- }
- if ((iframe % 10) == 1) {
- Melder_progress ((double) iframe / numberOfFrames, U"Cepstrogram analysis of frame ",
- iframe, U" out of ", numberOfFrames, U".");
- }
- }
- return him;
- } catch (MelderError) {
- Melder_throw (me, U": no Cepstrogram created.");
- }
- }
- double PowerCepstrogram_getCPPS (PowerCepstrogram me, bool subtractTiltBeforeSmoothing, double timeAveragingWindow, double quefrencyAveragingWindow, double pitchFloor, double pitchCeiling, double deltaF0, int interpolation, double qstartFit, double qendFit, int lineType, int fitMethod) {
- try {
- autoPowerCepstrogram flattened;
- if (subtractTiltBeforeSmoothing) {
- flattened = PowerCepstrogram_subtractTilt (me, qstartFit, qendFit, lineType, fitMethod);
- }
- autoPowerCepstrogram smooth = PowerCepstrogram_smooth (flattened ? flattened.get() : me, timeAveragingWindow, quefrencyAveragingWindow);
- autoTable table = PowerCepstrogram_to_Table_cpp (smooth.get(), pitchFloor, pitchCeiling, deltaF0, interpolation, qstartFit, qendFit, lineType, fitMethod);
- double cpps = Table_getMean (table.get(), 3);
- return cpps;
- } catch (MelderError) {
- Melder_throw (me, U": no CPPS value calculated.");
- }
- }
- double PowerCepstrogram_getCPPS_hillenbrand (PowerCepstrogram me, bool subtractTiltBeforeSmoothing, double timeAveragingWindow, double quefrencyAveragingWindow, double pitchFloor, double pitchCeiling) {
- try {
- autoPowerCepstrogram him;
- if (subtractTiltBeforeSmoothing) {
- him = PowerCepstrogram_subtractTilt (me, 0.001, 0, 1, 1);
- }
- autoPowerCepstrogram smooth = PowerCepstrogram_smooth (subtractTiltBeforeSmoothing ? him.get() : me, timeAveragingWindow, quefrencyAveragingWindow);
- autoTable table = PowerCepstrogram_to_Table_hillenbrand (smooth.get(), pitchFloor, pitchCeiling);
- double cpps = Table_getMean (table.get(), 3);
- return cpps;
- } catch (MelderError) {
- Melder_throw (me, U": no CPPS value calculated.");
- }
- }
- /* End of file Cepstrogram.cpp */
|