BaseSynthsiser.java example

Explorer
java-speech-api-master
- src
  - main
    - java
      - com
        darkprograms
        speech
        microphone
        Microphone.java
        MicrophoneAnalyzer.java
        recognizer
        FlacEncoder.java
        GSpeechDuplex.java
        GSpeechResponseListener.java
        GoogleResponse.java
        Recognizer.java
        RecognizerChunked.java
        synthesiser
        BaseSynthsiser.java
        Synthesiser.java
        SynthesiserV2.java
        translator
        GoogleTranslate.java
        util
        ChunkedOutputStream.java
        Complex.java
        FFT.java
        StringUtil.java
package com.darkprograms.speech.synthesiser;

import com.darkprograms.speech.translator.GoogleTranslate;

import java.io.IOException;
import java.io.InputStream;
import java.io.SequenceInputStream;
import java.util.ArrayList;
import java.util.Collections;
import java.util.LinkedHashSet;
import java.util.List;
import java.util.Set;
import java.util.concurrent.Callable;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.Future;

/*******************************************************************************
 * Base class for synthesisers that connect to Google's unofficial API to
 * retrieve synthesized speech as MP3 data.
 * <p>
 * Subclasses implement the single-request {@link #getMP3Data(String)}; this
 * class builds text splitting and concurrent multi-fragment fetching on top of it.
 *
 * @author Luke Kuza, Aaron Gokaslan (Skylion)
 *******************************************************************************/
public abstract class BaseSynthsiser {

    /** Longest fragment, in chars, produced by {@link #parseString(String)}. */
    private static final int MAX_FRAGMENT_LENGTH = 100;

    /** Upper bound on the number of threads used to fetch fragments concurrently. */
    private static final int MAX_FETCH_THREADS = 1000;

    /**
     * Gets an input stream to MP3 data for the returned information from a request
     *
     * @param synthText Text you want to be synthesized into MP3 data
     * @return Returns an input stream of the MP3 data that is returned from Google
     * @throws IOException Throws exception if it can not complete the request
     */
    public abstract InputStream getMP3Data(String synthText) throws IOException;

    /**
     * Fetches the MP3 data for every string in the list concurrently and returns
     * the results as one stream, concatenated in list order.
     * <p>
     * Each element is passed to {@link #getMP3Data(String)} on a worker thread.
     * The call blocks until every fetch has finished or one of them has failed.
     * On failure, the streams collected so far are closed before the exception
     * propagates.
     *
     * @param synthText List of Strings you want to be synthesized into MP3 data
     * @return Returns an input stream of all the MP3 data, in the order of the list
     * @throws IOException if any fragment cannot be fetched, or if the calling
     *         thread is interrupted while waiting (the interrupt flag is restored)
     */
    public InputStream getMP3Data(List<String> synthText) throws IOException {
        // One thread per fragment up to the cap; at least 1 because the
        // executor factory rejects a pool size of zero.
        int poolSize = Math.max(1, Math.min(synthText.size(), MAX_FETCH_THREADS));
        ExecutorService pool = Executors.newFixedThreadPool(poolSize);
        List<InputStream> inputStreams = new ArrayList<InputStream>(synthText.size());
        boolean completed = false;
        try {
            // Submit everything first so the fetches overlap, then collect in
            // submission order so the audio is sequenced correctly.
            List<Future<InputStream>> futures =
                    new ArrayList<Future<InputStream>>(synthText.size());
            for (String part : synthText) {
                futures.add(pool.submit(new MP3DataFetcher(part)));
            }
            for (Future<InputStream> future : futures) {
                inputStreams.add(future.get());
            }
            completed = true;
        } catch (ExecutionException e) {
            Throwable cause = e.getCause();
            if (cause instanceof IOException) {
                throw (IOException) cause;
            }
            if (cause instanceof Error) {
                throw (Error) cause;
            }
            // Any other failure would otherwise leave a silent gap in the audio.
            throw new IOException("Failed to retrieve MP3 data", cause);
        } catch (InterruptedException e) {
            Thread.currentThread().interrupt(); // preserve the interrupt for callers
            throw new IOException("Interrupted while waiting for MP3 data", e);
        } finally {
            // Worker threads are non-daemon; without this they would outlive the call.
            pool.shutdownNow();
            if (!completed) {
                closeQuietly(inputStreams);
            }
        }
        return new SequenceInputStream(Collections.enumeration(inputStreams));
    }

    /**
     * Closes every non-null stream in the list, ignoring close failures.
     *
     * @param streams the streams to close
     */
    private static void closeQuietly(List<InputStream> streams) {
        for (InputStream stream : streams) {
            if (stream == null) {
                continue;
            }
            try {
                stream.close();
            } catch (IOException ignored) {
                // Best-effort cleanup; the original failure is what the caller needs to see.
            }
        }
    }

    /**
     * Separates a string into smaller parts so that Google will not reject the request.
     * Concatenating the returned fragments in order yields the original input.
     *
     * @param input The string you want to separate
     * @return A List&lt;String&gt; of the String fragments from your input,
     *         each at most 100 chars long
     */
    protected List<String> parseString(String input) {
        return parseString(input, new ArrayList<String>());
    }

    /**
     * Separates a string into smaller parts so that Google will not reject the request.
     * <p>
     * Splits preferably after ending punctuation, otherwise before a space, and
     * as a last resort at the 100-char limit.
     *
     * @param input The string you want to break up into smaller parts
     * @param fragments List the fragments are appended to
     * @return {@code fragments}, after the fragments of {@code input} were appended
     */
    private List<String> parseString(String input, List<String> fragments) {
        int start = 0;
        // Walk the input by offset: no recursion and no repeated copying of the tail.
        while (input.length() - start > MAX_FRAGMENT_LENGTH) {
            int split = findLastWord(input, start);
            if (split <= 0) {
                // No punctuation or space in range: cut at the limit.
                split = MAX_FRAGMENT_LENGTH;
                // Do not separate a UTF-16 surrogate pair across two fragments.
                if (Character.isHighSurrogate(input.charAt(start + split - 1))
                        && Character.isLowSurrogate(input.charAt(start + split))) {
                    split--;
                }
            }
            fragments.add(input.substring(start, start + split));
            start += split;
        }
        fragments.add(input.substring(start));
        return fragments;
    }

    /**
     * Finds where to split the 100-char window of {@code input} beginning at {@code start}.
     * Scans backwards from window position 99 down to 1. The first ending
     * punctuation found wins and the split falls just after it; otherwise the
     * split falls on the last space in the window.
     * <p>
     * The caller must guarantee that at least 100 chars remain from {@code start}.
     *
     * @param input The String you want to search through.
     * @param start Offset in {@code input} where the window begins.
     * @return The fragment length to cut (relative to {@code start}), or -1 if
     *         the window contains neither ending punctuation nor a space.
     */
    private int findLastWord(String input, int start) {
        int space = -1;
        for (int i = MAX_FRAGMENT_LENGTH - 1; i > 0; i--) {
            char current = input.charAt(start + i);
            if (isEndingPunctuation(current)) {
                return i + 1;
            }
            if (space == -1 && current == ' ') {
                space = i; // remember only the right-most space
            }
        }
        return space;
    }

    /**
     * Checks if char is one of the ending punctuation characters
     * {@code . ! ? ; : |}
     *
     * @param input The char you want to check
     * @return True if it is, false if not.
     */
    private boolean isEndingPunctuation(char input) {
        switch (input) {
            case '.':
            case '!':
            case '?':
            case ';':
            case ':':
            case '|':
                return true;
            default:
                return false;
        }
    }

    /**
     * Automatically determines the language of the original text.
     * Delegates to {@code GoogleTranslate.detectLanguage}.
     *
     * @param text represents the text you want to check the language of
     * @return the languageCode in ISO-639
     * @throws IOException if it cannot complete the request
     */
    public String detectLanguage(String text) throws IOException {
        return GoogleTranslate.detectLanguage(text);
    }

    /**
     * Callable that fetches the MP3 data for one text fragment by calling
     * {@link BaseSynthsiser#getMP3Data(String)} on the enclosing synthesiser.
     * Lets fragments be fetched on pool threads and collected through futures.
     *
     * @author Aaron Gokaslan (Skylion)
     */
    private class MP3DataFetcher implements Callable<InputStream> {
        private final String synthText;

        public MP3DataFetcher(String synthText) {
            this.synthText = synthText;
        }

        @Override
        public InputStream call() throws IOException {
            return getMP3Data(synthText);
        }
    }
}