// LPCWhisperiser.java example
//
// Explorer
// marytts-master
/**
 * Copyright 2004-2006 DFKI GmbH.
 * All Rights Reserved.  Use is subject to license terms.
 *
 * This file is part of MARY TTS.
 *
 * MARY TTS is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published by
 * the Free Software Foundation, version 3 of the License.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 *
 */
package marytts.signalproc.process;

import java.io.File;

import javax.sound.sampled.AudioFileFormat;
import javax.sound.sampled.AudioInputStream;
import javax.sound.sampled.AudioSystem;

import marytts.signalproc.analysis.LpcAnalyser.LpCoeffs;
import marytts.signalproc.window.Window;
import marytts.util.data.BufferedDoubleDataSource;
import marytts.util.data.audio.AudioDoubleDataSource;
import marytts.util.data.audio.DDSAudioInputStream;
import marytts.util.math.MathUtils;

/**
 * @author Marc Schröder
 * 
 */
public class LPCWhisperiser extends LPCAnalysisResynthesis {
	protected double whisperAmount; // Amount of whispered voice at the output between 0.5 (half whispered+half unmodified) and
									// 1.0 (full whispered)
	protected double oneMinusWhisperAmount; // 1.0-whisperAmount

	public LPCWhisperiser(int predictionOrder, double amount) {
		super(predictionOrder);
		this.whisperAmount = MathUtils.trimToRange(amount, 0., 1.);
		this.oneMinusWhisperAmount = 1.0 - this.whisperAmount;
	}

	public LPCWhisperiser(int predictionOrder) {
		super(predictionOrder);
		whisperAmount = 1.0;
	}

	/**
	 * Replace residual with white noise
	 */
	protected void processLPC(LpCoeffs coeffs, double[] residual) {
		// Determine average residual energy:
		double totalResidualEnergy = coeffs.getGain() * coeffs.getGain();
		double avgAbsAmplitude = Math.sqrt(totalResidualEnergy / residual.length);
		double maxAbsAmplitude = 2 * avgAbsAmplitude;
		double spread = 2 * maxAbsAmplitude;
		for (int i = 0; i < residual.length; i++)
			residual[i] = whisperAmount * spread * (Math.random() - 0.5) + oneMinusWhisperAmount * residual[i];
	}

	public static void main(String[] args) throws Exception {
		for (int i = 0; i < args.length; i++) {
			AudioInputStream inputAudio = AudioSystem.getAudioInputStream(new File(args[i]));
			int samplingRate = (int) inputAudio.getFormat().getSampleRate();
			AudioDoubleDataSource signal = new AudioDoubleDataSource(inputAudio);
			int frameLength = Integer.getInteger("signalproc.lpcanalysissynthesis.framelength", 512).intValue();
			int predictionOrder = Integer.getInteger("signalproc.lpcwhisperiser.predictionorder", 20).intValue();
			FrameOverlapAddSource foas = new FrameOverlapAddSource(signal, Window.HANNING, true, frameLength, samplingRate,
					new LPCWhisperiser(predictionOrder));
			DDSAudioInputStream outputAudio = new DDSAudioInputStream(new BufferedDoubleDataSource(foas), inputAudio.getFormat());
			String outFileName = args[i].substring(0, args[i].length() - 4) + "_lpcwhisperised.wav";
			AudioSystem.write(outputAudio, AudioFileFormat.Type.WAVE, new File(outFileName));
		}

	}

}