/** * Copyright 2007 DFKI GmbH. * All Rights Reserved. Use is subject to license terms. * * Permission is hereby granted, free of charge, to use and distribute * this software and its documentation without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sublicense, and/or sell copies of this work, and to * permit persons to whom this work is furnished to do so, subject to * the following conditions: * * 1. The code must retain the above copyright notice, this list of * conditions and the following disclaimer. * 2. Any modifications must be clearly marked as such. * 3. Original authors' names are not deleted. * 4. The authors' names are not used to endorse or promote products * derived from this software without specific prior written * permission. * * DFKI GMBH AND THE CONTRIBUTORS TO THIS WORK DISCLAIM ALL WARRANTIES WITH * REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF * MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL DFKI GMBH NOR THE * CONTRIBUTORS BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF * THIS SOFTWARE. */ package marytts.signalproc.analysis; import marytts.util.math.ArrayUtils; import marytts.util.math.MathUtils; import marytts.util.signal.SignalProcUtils; /** * Implements a cepstral envelope estimation algorithm for fitting an envelope to discrete frequency amplitudes. * * Reference: W. D'haes, X. Rodet: Discrete Cepstrum Coefficients as Perceptual Features, International Computer Music Conference * (ICMC), Singapore, 2003. * * @author oytun.turk * */ public class RegularizedPostWarpedCepstrumEstimator extends RegularizedCepstrumEstimator { public static int getAutoCepsOrderPre(int numSpectralLines) { if (numSpectralLines <= 0) return 40; else return numSpectralLines * 2; } public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrderPre, int cepsOrder) { return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder, null); } public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrderPre, int cepsOrder, double[] weights) { return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder, weights, DEFAULT_LAMBDA); } // Post warping as described in W. D'Haes and X. Rodet, "Discrete Cepstrum Coefficients as Perceptual Features" public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrderPre, int cepsOrder, double[] weights, double lambda) { if (cepsOrderPre < 1) cepsOrderPre = getAutoCepsOrderPre(linearAmps.length); float[] ceps = freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, false, weights, lambda); // Post warping as described in W. D'Haes and X. Rodet, "Discrete Cepstrum Coefficients as Perceptual Features" double[][] A = new double[cepsOrder][cepsOrderPre]; int k, l, n; double w; int N = cepsOrderPre; for (k = 0; k < cepsOrder; k++) { for (l = 0; l < cepsOrderPre; l++) { A[k][l] = 0.0; for (n = 0; n < N; n++) { w = SignalProcUtils.mel2radian((Math.PI * n) / N, samplingRateInHz); A[k][l] += Math.cos(l * w) * Math.cos((Math.PI * n * k) / N); } if (l == 0) A[k][l] *= 1.0 / N; else A[k][l] *= 2.0 / N; } } double[] cepsDouble = MathUtils.matrixProduct(A, ceps); ceps = ArrayUtils.copyDouble2Float(cepsDouble); return ceps; } public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder, double[] weights, double lambda) { return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, false, weights, lambda); } public static double[] spectralEnvelopeDB(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder, int fftSize) { float[] ceps = freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder); return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz); } public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder) { return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, false, null, DEFAULT_LAMBDA); } public static double[] cepstrum2logAmpHalfSpectrum(float[] ceps, int fftSize, int samplingRateInHz) { return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz, false); } public static double[] cepstrum2linearSpectrumValues(float[] ceps, int maxFreqIndex, int samplingRateInHz) { double[] freqsInHz = new double[maxFreqIndex]; for (int i = 0; i <= maxFreqIndex; i++) freqsInHz[i] = SignalProcUtils.index2freq(i, samplingRateInHz, maxFreqIndex); return cepstrum2linearSpectrumValues(ceps, freqsInHz, samplingRateInHz); } public static double[] cepstrum2linearSpectrumValues(float[] ceps, double[] freqsInHz, int samplingRateInHz) { return MathUtils.db2amp(cepstrum2dbSpectrumValues(ceps, freqsInHz, samplingRateInHz)); } public static double[] cepstrum2dbSpectrumValues(float[] ceps, int maxFreqIndex, int samplingRateInHz) { double[] freqsInHz = new double[maxFreqIndex + 1]; for (int i = 0; i <= maxFreqIndex; i++) freqsInHz[i] = SignalProcUtils.index2freq(i, samplingRateInHz, maxFreqIndex); return cepstrum2dbSpectrumValues(ceps, freqsInHz, samplingRateInHz); } public static double[] cepstrum2dbSpectrumValues(float[] ceps, double[] freqsInHz, int samplingRateInHz) { double[] vals = new double[freqsInHz.length]; for (int i = 0; i < freqsInHz.length; i++) vals[i] = cepstrum2dbSpectrumValue(ceps, freqsInHz[i], samplingRateInHz); return vals; } public static double[][] precomputeM(double[] freqsInHz, int samplingRateInHz, int cepsOrder) { return precomputeM(freqsInHz, samplingRateInHz, cepsOrder, false); } public static double cepstrum2dbSpectrumValue(float[] ceps, double freqInHz, int samplingRateInHz) { int p = ceps.length - 1; double w = SignalProcUtils.hz2mel(freqInHz, samplingRateInHz); double val = ceps[0]; for (int i = 1; i <= p; i++) val += 2.0 * ceps[i] * Math.cos(w * i); return val; } public static double[] spectralEnvelopeLinear(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrderPre, int cepsOrder) { return spectralEnvelopeLinear(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder, SignalProcUtils.getDFTSize(samplingRateInHz)); } public static double[] spectralEnvelopeLinear(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrderPre, int cepsOrder, int fftSize) { return MathUtils.db2amp(spectralEnvelopeDB(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder, fftSize)); } public static double[] spectralEnvelopeDB(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrderPre, int cepsOrder, int fftSize) { float[] ceps = freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder); return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz); } public static double cepstrum2linearSpectrumValue(float[] ceps, double freqInHz, int samplingRateInHz) { return MathUtils.db2amp(cepstrum2dbSpectrumValue(ceps, freqInHz, samplingRateInHz)); } }