/**
* Copyright 2007 DFKI GmbH.
* All Rights Reserved. Use is subject to license terms.
*
* This file is part of MARY TTS.
*
* MARY TTS is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, version 3 of the License.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*
*/
package marytts.signalproc.process;
import java.io.File;
import javax.sound.sampled.AudioFileFormat;
import javax.sound.sampled.AudioInputStream;
import javax.sound.sampled.AudioSystem;
import marytts.signalproc.window.Window;
import marytts.util.data.BufferedDoubleDataSource;
import marytts.util.data.audio.AudioDoubleDataSource;
import marytts.util.data.audio.DDSAudioInputStream;
import marytts.util.math.MathUtils;
import marytts.util.signal.SignalProcUtils;
/**
 * Vocal tract modifier that stretches or compresses the vocal tract spectrum along the frequency axis by a scaling
 * factor.
 * <p>
 * The spectrum handed to {@link #processSpectrum(double[])} is resampled to {@code round(length * scale)} points and
 * written back in place: a scale above 1 stretches the spectrum (the part that no longer fits is dropped), a scale
 * below 1 compresses it (the vacated upper bins are set to zero).
 * <p>
 * Although a whole array of scales is accepted and stored, only its first element is currently applied.
 *
 * @author Oytun Türk
 *
 */
public class VocalTractScalingProcessor extends VocalTractModifier {
    /** Smallest scaling factor that is accepted; smaller values are raised to this floor. */
    private static final double MIN_SCALE = 0.05;

    /** Suffix (including extension) appended to the input file's base name by {@link #main(String[])}. */
    private static final String OUTPUT_SUFFIX = "_vocalTractScaled.wav";

    /** Scaling factors resized to {@code maxFreq} entries, or {@code null} when scaling is disabled. */
    private final double[] vscales;

    /**
     * Creates a processor that scales the vocal tract spectrum.
     *
     * @param p
     *            forwarded unchanged to the superclass constructor ({@link #main(String[])} passes the linear
     *            prediction order here)
     * @param fs
     *            forwarded unchanged to the superclass constructor ({@link #main(String[])} passes the sampling rate
     *            in Hz here)
     * @param fftSize
     *            forwarded unchanged to the superclass constructor ({@link #main(String[])} passes the DFT size here)
     * @param vscalesIn
     *            scaling factors; resized to {@code maxFreq} entries and floored at 0.05. A {@code null} or empty
     *            array disables scaling, so {@link #processSpectrum(double[])} leaves the spectrum untouched.
     */
    public VocalTractScalingProcessor(int p, int fs, int fftSize, double[] vscalesIn) {
        super(p, fs, fftSize);

        if (vscalesIn != null && vscalesIn.length > 0) {
            // Modify length to match current length of spectrum
            vscales = MathUtils.modifySize(vscalesIn, this.maxFreq);
            for (int i = 0; i < this.maxFreq; i++) {
                // Floor the factors so that a zero or negative scale can never collapse the spectrum
                // (originally introduced to avoid a divide by zero in a per-bin warping variant).
                if (vscales[i] < MIN_SCALE) {
                    vscales[i] = MIN_SCALE;
                }
            }
        } else {
            vscales = null;
        }
    }

    /**
     * Scales the given spectrum in place along the frequency axis.
     * <p>
     * The spectrum is resampled with {@code MathUtils.interpolate} to {@code floor(Px.length * vscales[0] + 0.5)}
     * points. The first {@code maxFreq} resampled values (or all of them, if there are fewer) are copied back into
     * {@code Px}; any remaining bins up to {@code maxFreq} are zeroed. Only the first scaling factor is used. Does
     * nothing when scaling is disabled.
     *
     * @param Px
     *            spectrum to modify in place; presumably holds at least {@code maxFreq} values (to be confirmed
     *            against the superclass, which is expected to be the caller)
     */
    protected void processSpectrum(double[] Px) {
        if (vscales == null) {
            return;
        }

        // Round to the nearest integer length.
        int newLen = (int) Math.floor(Px.length * vscales[0] + 0.5);
        double[] scaled = MathUtils.interpolate(Px, newLen);

        // Keep as much of the resampled spectrum as fits, then clear whatever is left above it.
        int copyLen = Math.min(newLen, maxFreq);
        System.arraycopy(scaled, 0, Px, 0, copyLen);
        for (int i = copyLen; i < maxFreq; i++) {
            Px[i] = 0.0;
        }
    }

    /**
     * Returns the given path without the extension of its last path element. A dot that is the first character of the
     * file name, or that belongs to a directory name, is not treated as an extension separator.
     *
     * @param path
     *            file path, with either {@code /} or {@code \} as separator
     * @return the path up to (excluding) the extension dot, or the unchanged path if there is no extension
     */
    private static String stripExtension(String path) {
        int lastSeparator = Math.max(path.lastIndexOf('/'), path.lastIndexOf('\\'));
        int lastDot = path.lastIndexOf('.');
        if (lastDot > lastSeparator + 1) {
            return path.substring(0, lastDot);
        }
        return path;
    }

    /**
     * Command line entry point: processes every audio file named in {@code args} with a scaling factor of 1.0 and
     * writes the result as a WAVE file next to the input, named {@code <input without extension>_vocalTractScaled.wav}.
     *
     * @param args
     *            paths of the audio files to process
     * @throws Exception
     *             if an input file cannot be read or decoded, or an output file cannot be written
     */
    public static void main(String[] args) throws Exception {
        double[] vscales = { 1.0 };

        for (int i = 0; i < args.length; i++) {
            AudioInputStream inputAudio = AudioSystem.getAudioInputStream(new File(args[i]));
            try {
                int samplingRate = (int) inputAudio.getFormat().getSampleRate();
                int p = SignalProcUtils.getLPOrder(samplingRate);
                int fftSize = Math.max(SignalProcUtils.getDFTSize(samplingRate), 1024);

                AudioDoubleDataSource signal = new AudioDoubleDataSource(inputAudio);
                FrameOverlapAddSource foas = new FrameOverlapAddSource(signal, Window.HANNING, true, fftSize, samplingRate,
                        new VocalTractScalingProcessor(p, samplingRate, fftSize, vscales));
                DDSAudioInputStream outputAudio = new DDSAudioInputStream(new BufferedDoubleDataSource(foas),
                        inputAudio.getFormat());

                String outFileName = stripExtension(args[i]) + OUTPUT_SUFFIX;
                AudioSystem.write(outputAudio, AudioFileFormat.Type.WAVE, new File(outFileName));
            } finally {
                // Release the input file handle even if processing or writing fails.
                inputAudio.close();
            }
        }
    }
}