RegularizedPreWarpedCepstrumEstimator.java example

Explorer
marytts-master
/**
 * Copyright 2007 DFKI GmbH.
 * All Rights Reserved.  Use is subject to license terms.
 * 
 * Permission is hereby granted, free of charge, to use and distribute
 * this software and its documentation without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of this work, and to
 * permit persons to whom this work is furnished to do so, subject to
 * the following conditions:
 * 
 * 1. The code must retain the above copyright notice, this list of
 *    conditions and the following disclaimer.
 * 2. Any modifications must be clearly marked as such.
 * 3. Original authors' names are not deleted.
 * 4. The authors' names are not used to endorse or promote products
 *    derived from this software without specific prior written
 *    permission.
 *
 * DFKI GMBH AND THE CONTRIBUTORS TO THIS WORK DISCLAIM ALL WARRANTIES WITH
 * REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL DFKI GMBH NOR THE
 * CONTRIBUTORS BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL
 * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
 * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
 * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF
 * THIS SOFTWARE.
 */

package marytts.signalproc.analysis;

import marytts.util.math.MathUtils;
import marytts.util.signal.SignalProcUtils;

/**
 * 
 * Implements the regularized cepstral envelope estimation in
 * 
 * Cappe, O., Laroche, J., and Moulines E., 1995, "Regularized estimation of cepstrum envelope from discrete frequency points", in
 * IEEE ASSP Workshop on app. of sig. proc. to audio and acoust.
 * 
 * This approach is used in Harmonic plus Noise (HNM) model for pitch modification for the purpose of estimating amplitudes of
 * harmonics at (new) pitch-modified locations. (See, i.e. (Stylianou, et. al.,1995) or Stylianou´s PhD thesis for details)
 * 
 * Stylianou, Y, Laroche, J., and Moulines E., 1995, "High quality speech modification based on a Harmonic + Noise model", in
 * Proc. of the Europseech 1995.
 * 
 * Various other techniques are used by other researchers to keep the overall spectral shape unchanged under pitch sclae
 * modifications. For example, Quatieri uses SEEVOC approach (linear interpolation) to find amplitude values at modified
 * frequencies. Failing to estimate the modified amplitudes successfully will result in changes in overal spectral envelope which
 * may affect voice quality, presence, or even the identity of phones after pitch scaling.
 * 
 * @author Oytun Türk
 */
public class RegularizedPreWarpedCepstrumEstimator extends RegularizedCepstrumEstimator {
	public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder,
			double[] weights, double lambda) {
		return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, true, weights, lambda);
	}

	public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder) {
		return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, true, null, DEFAULT_LAMBDA);
	}

	public static double[] cepstrum2logAmpHalfSpectrum(float[] ceps, int fftSize, int samplingRateInHz) {
		return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz, true);
	}

	public static double cepstrum2linearSpectrumValue(float[] ceps, double freqInHz, int samplingRateInHz) {
		return MathUtils.db2amp(cepstrum2dbSpectrumValue(ceps, freqInHz, samplingRateInHz));
	}

	public static double cepstrum2dbSpectrumValue(float[] ceps, double freqInHz, int samplingRateInHz) {
		int p = ceps.length - 1;

		double denum = (2.0 * SignalProcUtils.freq2barkNew(0.5 * samplingRateInHz));
		double f = SignalProcUtils.freq2barkNew(freqInHz) / denum;

		double val = ceps[0];
		for (int i = 1; i <= p; i++)
			val += 2.0 * ceps[i] * Math.cos(MathUtils.TWOPI * f * i);

		return val;
	}

	public static double[] cepstrum2dbSpectrumValues(float[] ceps, int maxFreqIndex, int samplingRateInHz) {
		double[] freqsInHz = new double[maxFreqIndex + 1];
		for (int i = 0; i <= maxFreqIndex; i++)
			freqsInHz[i] = SignalProcUtils.index2freq(i, samplingRateInHz, maxFreqIndex);

		return cepstrum2dbSpectrumValues(ceps, freqsInHz, samplingRateInHz);
	}

	public static double[] cepstrum2dbSpectrumValues(float[] ceps, double[] freqsInHz, int samplingRateInHz) {
		double[] vals = new double[freqsInHz.length];
		for (int i = 0; i < freqsInHz.length; i++)
			vals[i] = cepstrum2dbSpectrumValue(ceps, freqsInHz[i], samplingRateInHz);

		return vals;
	}

	public static double[][] precomputeM(double[] freqsInHz, int samplingRateInHz, int cepsOrder) {
		return precomputeM(freqsInHz, samplingRateInHz, cepsOrder, true);
	}

	public static double[] spectralEnvelopeLinear(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder) {
		return spectralEnvelopeLinear(linearAmps, freqsInHz, samplingRateInHz, cepsOrder,
				SignalProcUtils.getDFTSize(samplingRateInHz));
	}

	public static double[] spectralEnvelopeLinear(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder,
			int fftSize) {
		return MathUtils.db2amp(spectralEnvelopeDB(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, fftSize));
	}

	public static double[] spectralEnvelopeDB(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder,
			int fftSize) {
		float[] ceps = freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder);

		return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz);
	}
}