/** * Copyright 2007 DFKI GmbH. * All Rights Reserved. Use is subject to license terms. * * This file is part of MARY TTS. * * MARY TTS is free software: you can redistribute it and/or modify * it under the terms of the GNU Lesser General Public License as published by * the Free Software Foundation, version 3 of the License. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public License * along with this program. If not, see <http://www.gnu.org/licenses/>. * */ package marytts.signalproc.analysis; import javax.swing.JFrame; import marytts.signalproc.display.FunctionGraph; import marytts.util.math.MathUtils; import marytts.util.signal.SignalProcUtils; /** * Spectral Enveope Estimation Vocoder (SEEVOC) - a simple implementation * * Reference: Paul, D., 1981, "The Spectral Envelope Estimation Vocoder", IEEE Trans. Acoust. Speech Signal Proc., ASSP-29, pp. * 786-794. * * @author Oytun Türk */ public class SeevocAnalyser { public static SpectrumWithPeakIndices calcSpecEnvelopeDB(double[] absMagSpecIndB, int samplingRate) { return calcSpecEnvelopeDB(absMagSpecIndB, samplingRate, 100.0); } // The returned spectral envelope is in linear scale public static SpectrumWithPeakIndices calcSpecEnvelopeLinear(double[] absMagSpecIndB, int samplingRate, double f0) { SpectrumWithPeakIndices s = calcSpecEnvelopeDB(absMagSpecIndB, samplingRate, f0); s.spec = MathUtils.db2amp(s.spec); return s; } // The returned spectral envelope is also in dB public static SpectrumWithPeakIndices calcSpecEnvelopeDB(double[] absMagSpecIndB, int samplingRate, double f0) { SpectrumWithPeakIndices s = new SpectrumWithPeakIndices(); int i, j; if (f0 < 10.0) f0 = 100.0f; int maxPeaks = (int) Math.floor(0.5 * samplingRate / f0 + 0.5) + 10; double[] peakVals = new double[maxPeaks]; int[] peakInds = new int[maxPeaks]; double[] peakFreqs = new double[maxPeaks]; int maxFreqInd = absMagSpecIndB.length - 1; double[] freqs = new double[maxFreqInd + 1]; for (i = 0; i <= maxFreqInd; i++) freqs[i] = SignalProcUtils.index2freq(i, samplingRate, maxFreqInd); int numPeaks = 0; double currentFreq = 0.0; double currentMax; int currentInd; int startInd, endInd; boolean bEndNotCovered = true; while (true) { if (currentFreq + 1.5 * f0 > 0.5 * samplingRate) break; startInd = SignalProcUtils.freq2index(currentFreq + 0.5 * f0, samplingRate, maxFreqInd); endInd = SignalProcUtils.freq2index(currentFreq + 1.5 * f0, samplingRate, maxFreqInd); startInd = Math.max(0, startInd); endInd = Math.min(endInd, maxFreqInd); startInd = Math.min(startInd, endInd); if (endInd == maxFreqInd) bEndNotCovered = false; currentInd = MathUtils.getAbsMaxInd(absMagSpecIndB, startInd, endInd); if (currentInd == -1) { peakVals[numPeaks + 1] = Math.max(absMagSpecIndB[startInd], absMagSpecIndB[endInd]); currentInd = (int) Math.floor(0.5 * (startInd + endInd) + 0.5); } else peakVals[numPeaks + 1] = absMagSpecIndB[currentInd]; currentFreq = SignalProcUtils.index2freq(currentInd, samplingRate, maxFreqInd); peakInds[numPeaks + 1] = currentInd; peakFreqs[numPeaks + 1] = currentFreq; numPeaks++; // Search for the for the first interval if (numPeaks == 1) { startInd = 0; endInd = SignalProcUtils.freq2index(currentFreq - 0.5 * f0, samplingRate, maxFreqInd); startInd = Math.max(0, startInd); endInd = Math.min(endInd, maxFreqInd); startInd = Math.min(startInd, endInd); currentInd = MathUtils.getAbsMaxInd(absMagSpecIndB, startInd, endInd); if (currentInd == -1) { peakVals[0] = Math.max(absMagSpecIndB[startInd], absMagSpecIndB[endInd]); currentInd = (int) Math.floor(0.5 * (startInd + endInd) + 0.5); } else peakVals[0] = absMagSpecIndB[currentInd]; peakInds[0] = currentInd; peakFreqs[0] = SignalProcUtils.index2freq(currentInd, samplingRate, maxFreqInd); } // if (numPeaks > maxPeaks - 3) break; } // Search for the last interval if (bEndNotCovered && numPeaks < maxPeaks) { startInd = SignalProcUtils.freq2index(currentFreq + 0.5 * f0, samplingRate, maxFreqInd); endInd = maxFreqInd; startInd = Math.max(0, startInd); startInd = Math.min(startInd, endInd); currentInd = MathUtils.getAbsMaxInd(absMagSpecIndB, startInd, endInd); if (currentInd == -1) { peakVals[numPeaks + 1] = Math.max(absMagSpecIndB[startInd], absMagSpecIndB[endInd]); currentInd = (int) Math.floor(0.5 * (startInd + endInd) + 0.5); } else peakVals[numPeaks + 1] = absMagSpecIndB[currentInd]; peakInds[numPeaks + 1] = currentInd; peakFreqs[numPeaks + 1] = SignalProcUtils.index2freq(currentInd, samplingRate, maxFreqInd); numPeaks++; } // s.spec = new double[maxFreqInd + 1]; for (j = 0; j < peakInds[0]; j++) s.spec[j] = absMagSpecIndB[0] + (absMagSpecIndB[peakInds[0]] - absMagSpecIndB[0]) / peakFreqs[0] * freqs[j]; for (i = 0; i < numPeaks - 1; i++) { for (j = peakInds[i]; j < peakInds[i + 1]; j++) s.spec[j] = absMagSpecIndB[peakInds[i]] + (absMagSpecIndB[peakInds[i + 1]] - absMagSpecIndB[peakInds[i]]) / (peakFreqs[i + 1] - peakFreqs[i]) * (freqs[j] - peakFreqs[i]); } for (j = peakInds[numPeaks - 1]; j <= maxFreqInd; j++) s.spec[j] = absMagSpecIndB[peakInds[numPeaks - 1]] + (absMagSpecIndB[maxFreqInd] - absMagSpecIndB[peakInds[numPeaks - 1]]) / (0.5 * samplingRate - peakFreqs[numPeaks - 1]) * (freqs[j] - peakFreqs[numPeaks - 1]); // s.spec = SignalProcUtils.medianFilter(H, 5, H[0], H[H.length-1]); // s.spec = SignalProcUtils.meanFilter(H, 19, H[0], H[H.length-1]); // Plot the DFT and the estimated spectral envelope to check visually // double [] excIndB = new double[s.spec.length]; // for (i=0; i<s.spec.length; i++) // excIndB[i] = absMagSpecIndB[i]-H[i]; // JFrame frame1 = showGraph(absMagSpecIndB, "DFT spectrum"); // JFrame frame2 = showGraph(s.spec, "SEEVOC"); // try { Thread.sleep(3000); } catch (InterruptedException e) {} // frame1.dispose(); // frame2.dispose(); s.indices = new int[numPeaks]; System.arraycopy(peakInds, 0, s.indices, 0, numPeaks); return s; } protected static JFrame showGraph(double[] array, String title) { FunctionGraph graph = new FunctionGraph(400, 200, 0, 1, array); JFrame frame = graph.showInJFrame(title, 500, 300, true, false); return frame; } }