/** * Copyright 2007 DFKI GmbH. * All Rights Reserved. Use is subject to license terms. * * Permission is hereby granted, free of charge, to use and distribute * this software and its documentation without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sublicense, and/or sell copies of this work, and to * permit persons to whom this work is furnished to do so, subject to * the following conditions: * * 1. The code must retain the above copyright notice, this list of * conditions and the following disclaimer. * 2. Any modifications must be clearly marked as such. * 3. Original authors' names are not deleted. * 4. The authors' names are not used to endorse or promote products * derived from this software without specific prior written * permission. * * DFKI GMBH AND THE CONTRIBUTORS TO THIS WORK DISCLAIM ALL WARRANTIES WITH * REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF * MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL DFKI GMBH NOR THE * CONTRIBUTORS BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF * THIS SOFTWARE. */ package marytts.signalproc.analysis; import marytts.util.math.MathUtils; import marytts.util.signal.SignalProcUtils; /** * * Implements the regularized cepstral envelope estimation in * * Cappe, O., Laroche, J., and Moulines E., 1995, "Regularized estimation of cepstrum envelope from discrete frequency points", in * IEEE ASSP Workshop on app. of sig. proc. to audio and acoust. * * This approach is used in Harmonic plus Noise (HNM) model for pitch modification for the purpose of estimating amplitudes of * harmonics at (new) pitch-modified locations. (See, i.e. (Stylianou, et. al.,1995) or Stylianou´s PhD thesis for details) * * Stylianou, Y, Laroche, J., and Moulines E., 1995, "High quality speech modification based on a Harmonic + Noise model", in * Proc. of the Europseech 1995. * * Various other techniques are used by other researchers to keep the overall spectral shape unchanged under pitch sclae * modifications. For example, Quatieri uses SEEVOC approach (linear interpolation) to find amplitude values at modified * frequencies. Failing to estimate the modified amplitudes successfully will result in changes in overal spectral envelope which * may affect voice quality, presence, or even the identity of phones after pitch scaling. * * @author Oytun Türk */ public class RegularizedPreWarpedCepstrumEstimator extends RegularizedCepstrumEstimator { public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder, double[] weights, double lambda) { return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, true, weights, lambda); } public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder) { return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, true, null, DEFAULT_LAMBDA); } public static double[] cepstrum2logAmpHalfSpectrum(float[] ceps, int fftSize, int samplingRateInHz) { return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz, true); } public static double cepstrum2linearSpectrumValue(float[] ceps, double freqInHz, int samplingRateInHz) { return MathUtils.db2amp(cepstrum2dbSpectrumValue(ceps, freqInHz, samplingRateInHz)); } public static double cepstrum2dbSpectrumValue(float[] ceps, double freqInHz, int samplingRateInHz) { int p = ceps.length - 1; double denum = (2.0 * SignalProcUtils.freq2barkNew(0.5 * samplingRateInHz)); double f = SignalProcUtils.freq2barkNew(freqInHz) / denum; double val = ceps[0]; for (int i = 1; i <= p; i++) val += 2.0 * ceps[i] * Math.cos(MathUtils.TWOPI * f * i); return val; } public static double[] cepstrum2dbSpectrumValues(float[] ceps, int maxFreqIndex, int samplingRateInHz) { double[] freqsInHz = new double[maxFreqIndex + 1]; for (int i = 0; i <= maxFreqIndex; i++) freqsInHz[i] = SignalProcUtils.index2freq(i, samplingRateInHz, maxFreqIndex); return cepstrum2dbSpectrumValues(ceps, freqsInHz, samplingRateInHz); } public static double[] cepstrum2dbSpectrumValues(float[] ceps, double[] freqsInHz, int samplingRateInHz) { double[] vals = new double[freqsInHz.length]; for (int i = 0; i < freqsInHz.length; i++) vals[i] = cepstrum2dbSpectrumValue(ceps, freqsInHz[i], samplingRateInHz); return vals; } public static double[][] precomputeM(double[] freqsInHz, int samplingRateInHz, int cepsOrder) { return precomputeM(freqsInHz, samplingRateInHz, cepsOrder, true); } public static double[] spectralEnvelopeLinear(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder) { return spectralEnvelopeLinear(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, SignalProcUtils.getDFTSize(samplingRateInHz)); } public static double[] spectralEnvelopeLinear(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder, int fftSize) { return MathUtils.db2amp(spectralEnvelopeDB(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, fftSize)); } public static double[] spectralEnvelopeDB(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder, int fftSize) { float[] ceps = freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder); return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz); } }