RegularizedPostWarpedCepstrumEstimator.java example

Explorer
marytts-master
/**
 * Copyright 2007 DFKI GmbH.
 * All Rights Reserved.  Use is subject to license terms.
 * 
 * Permission is hereby granted, free of charge, to use and distribute
 * this software and its documentation without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of this work, and to
 * permit persons to whom this work is furnished to do so, subject to
 * the following conditions:
 * 
 * 1. The code must retain the above copyright notice, this list of
 *    conditions and the following disclaimer.
 * 2. Any modifications must be clearly marked as such.
 * 3. Original authors' names are not deleted.
 * 4. The authors' names are not used to endorse or promote products
 *    derived from this software without specific prior written
 *    permission.
 *
 * DFKI GMBH AND THE CONTRIBUTORS TO THIS WORK DISCLAIM ALL WARRANTIES WITH
 * REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL DFKI GMBH NOR THE
 * CONTRIBUTORS BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL
 * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
 * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
 * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF
 * THIS SOFTWARE.
 */

package marytts.signalproc.analysis;

import marytts.util.math.ArrayUtils;
import marytts.util.math.MathUtils;
import marytts.util.signal.SignalProcUtils;

/**
 * Implements a cepstral envelope estimation algorithm for fitting an envelope to discrete frequency amplitudes.
 * 
 * Reference: W. D'haes, X. Rodet: Discrete Cepstrum Coefficients as Perceptual Features, International Computer Music Conference
 * (ICMC), Singapore, 2003.
 * 
 * @author oytun.turk
 * 
 */
public class RegularizedPostWarpedCepstrumEstimator extends RegularizedCepstrumEstimator {
	public static int getAutoCepsOrderPre(int numSpectralLines) {
		if (numSpectralLines <= 0)
			return 40;
		else
			return numSpectralLines * 2;
	}

	public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz,
			int cepsOrderPre, int cepsOrder) {
		return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder, null);
	}

	public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz,
			int cepsOrderPre, int cepsOrder, double[] weights) {
		return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder, weights, DEFAULT_LAMBDA);
	}

	// Post warping as described in W. D'Haes and X. Rodet, "Discrete Cepstrum Coefficients as Perceptual Features"
	public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz,
			int cepsOrderPre, int cepsOrder, double[] weights, double lambda) {
		if (cepsOrderPre < 1)
			cepsOrderPre = getAutoCepsOrderPre(linearAmps.length);

		float[] ceps = freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, false, weights, lambda);

		// Post warping as described in W. D'Haes and X. Rodet, "Discrete Cepstrum Coefficients as Perceptual Features"
		double[][] A = new double[cepsOrder][cepsOrderPre];

		int k, l, n;
		double w;
		int N = cepsOrderPre;
		for (k = 0; k < cepsOrder; k++) {
			for (l = 0; l < cepsOrderPre; l++) {
				A[k][l] = 0.0;
				for (n = 0; n < N; n++) {
					w = SignalProcUtils.mel2radian((Math.PI * n) / N, samplingRateInHz);
					A[k][l] += Math.cos(l * w) * Math.cos((Math.PI * n * k) / N);
				}

				if (l == 0)
					A[k][l] *= 1.0 / N;
				else
					A[k][l] *= 2.0 / N;
			}
		}

		double[] cepsDouble = MathUtils.matrixProduct(A, ceps);
		ceps = ArrayUtils.copyDouble2Float(cepsDouble);

		return ceps;
	}

	public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder,
			double[] weights, double lambda) {
		return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, false, weights, lambda);
	}

	public static double[] spectralEnvelopeDB(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder,
			int fftSize) {
		float[] ceps = freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder);

		return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz);
	}

	public static float[] freqsLinearAmps2cepstrum(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrder) {
		return freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrder, false, null, DEFAULT_LAMBDA);
	}

	public static double[] cepstrum2logAmpHalfSpectrum(float[] ceps, int fftSize, int samplingRateInHz) {
		return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz, false);
	}

	public static double[] cepstrum2linearSpectrumValues(float[] ceps, int maxFreqIndex, int samplingRateInHz) {
		double[] freqsInHz = new double[maxFreqIndex];
		for (int i = 0; i <= maxFreqIndex; i++)
			freqsInHz[i] = SignalProcUtils.index2freq(i, samplingRateInHz, maxFreqIndex);

		return cepstrum2linearSpectrumValues(ceps, freqsInHz, samplingRateInHz);
	}

	public static double[] cepstrum2linearSpectrumValues(float[] ceps, double[] freqsInHz, int samplingRateInHz) {
		return MathUtils.db2amp(cepstrum2dbSpectrumValues(ceps, freqsInHz, samplingRateInHz));
	}

	public static double[] cepstrum2dbSpectrumValues(float[] ceps, int maxFreqIndex, int samplingRateInHz) {
		double[] freqsInHz = new double[maxFreqIndex + 1];
		for (int i = 0; i <= maxFreqIndex; i++)
			freqsInHz[i] = SignalProcUtils.index2freq(i, samplingRateInHz, maxFreqIndex);

		return cepstrum2dbSpectrumValues(ceps, freqsInHz, samplingRateInHz);
	}

	public static double[] cepstrum2dbSpectrumValues(float[] ceps, double[] freqsInHz, int samplingRateInHz) {
		double[] vals = new double[freqsInHz.length];
		for (int i = 0; i < freqsInHz.length; i++)
			vals[i] = cepstrum2dbSpectrumValue(ceps, freqsInHz[i], samplingRateInHz);

		return vals;
	}

	public static double[][] precomputeM(double[] freqsInHz, int samplingRateInHz, int cepsOrder) {
		return precomputeM(freqsInHz, samplingRateInHz, cepsOrder, false);
	}

	public static double cepstrum2dbSpectrumValue(float[] ceps, double freqInHz, int samplingRateInHz) {
		int p = ceps.length - 1;

		double w = SignalProcUtils.hz2mel(freqInHz, samplingRateInHz);

		double val = ceps[0];
		for (int i = 1; i <= p; i++)
			val += 2.0 * ceps[i] * Math.cos(w * i);

		return val;
	}

	public static double[] spectralEnvelopeLinear(double[] linearAmps, double[] freqsInHz, int samplingRateInHz,
			int cepsOrderPre, int cepsOrder) {
		return spectralEnvelopeLinear(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder,
				SignalProcUtils.getDFTSize(samplingRateInHz));
	}

	public static double[] spectralEnvelopeLinear(double[] linearAmps, double[] freqsInHz, int samplingRateInHz,
			int cepsOrderPre, int cepsOrder, int fftSize) {
		return MathUtils.db2amp(spectralEnvelopeDB(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder, fftSize));
	}

	public static double[] spectralEnvelopeDB(double[] linearAmps, double[] freqsInHz, int samplingRateInHz, int cepsOrderPre,
			int cepsOrder, int fftSize) {
		float[] ceps = freqsLinearAmps2cepstrum(linearAmps, freqsInHz, samplingRateInHz, cepsOrderPre, cepsOrder);

		return cepstrum2logAmpHalfSpectrum(ceps, fftSize, samplingRateInHz);
	}

	public static double cepstrum2linearSpectrumValue(float[] ceps, double freqInHz, int samplingRateInHz) {
		return MathUtils.db2amp(cepstrum2dbSpectrumValue(ceps, freqInHz, samplingRateInHz));
	}
}