Add sample TTS engine

Bug: 4149751
Change-Id: Id8e96d4ec442db46cb97edaeab3ef7c13321ba1f
Narayan Kamath
2011-03-11 16:51:56 +00:00
parent e89c5e20a0
commit b688761bab
14 changed files with 753 additions and 0 deletions


@@ -0,0 +1,152 @@
/*
* Copyright (C) 2011 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.example.android.ttsengine;
import android.app.Activity;
import android.content.Intent;
import android.os.Bundle;
import android.speech.tts.TextToSpeech;
import android.text.TextUtils;
import android.util.Log;
import java.io.IOException;
import java.io.InputStream;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
/*
* Checks if the voice data is present.
*/
public class CheckVoiceData extends Activity {
private static final String TAG = "CheckVoiceData";
private static final String[] SUPPORTED_LANGUAGES = { "eng-GBR", "eng-USA" };
@Override
protected void onCreate(Bundle savedInstanceState) {
super.onCreate(savedInstanceState);
Intent intent = getIntent();
List<String> checkLanguages = getCheckVoiceDataFor(intent);
// If the call didn't specify which languages to check, check
// for all the supported ones.
if (checkLanguages.isEmpty()) {
checkLanguages = Arrays.asList(SUPPORTED_LANGUAGES);
}
ArrayList<String> available = new ArrayList<String>();
ArrayList<String> unavailable = new ArrayList<String>();
for (String lang : checkLanguages) {
// This check is required because checkLanguages might contain an
// arbitrary list of languages if the intent specified them
// (see getCheckVoiceDataFor).
if (isLanguageSupported(lang)) {
if (isDataInstalled(lang)) {
available.add(lang);
} else {
unavailable.add(lang);
}
}
}
int result;
if (!checkLanguages.isEmpty() && available.isEmpty()) {
// No voices available at all.
result = TextToSpeech.Engine.CHECK_VOICE_DATA_FAIL;
} else if (!unavailable.isEmpty()) {
// Some voices are available, but some have missing
// data.
result = TextToSpeech.Engine.CHECK_VOICE_DATA_MISSING_DATA;
} else {
// All voices are available.
result = TextToSpeech.Engine.CHECK_VOICE_DATA_PASS;
}
// We now return the list of available and unavailable voices
// as well as the return code.
Intent returnData = new Intent();
returnData.putStringArrayListExtra(
TextToSpeech.Engine.EXTRA_AVAILABLE_VOICES, available);
returnData.putStringArrayListExtra(
TextToSpeech.Engine.EXTRA_UNAVAILABLE_VOICES, unavailable);
setResult(result, returnData);
finish();
}
/**
* The intent that launches this activity can contain an intent extra
* {@link TextToSpeech.Engine#EXTRA_CHECK_VOICE_DATA_FOR} that specifies a list
* of languages to check voice data for. If the intent does not contain
* this extra, we assume that a voice check for all supported languages
* was requested.
*/
private List<String> getCheckVoiceDataFor(Intent intent) {
ArrayList<String> list = intent.getStringArrayListExtra(
TextToSpeech.Engine.EXTRA_CHECK_VOICE_DATA_FOR);
ArrayList<String> ret = new ArrayList<String>();
if (list != null) {
for (String lang : list) {
if (!TextUtils.isEmpty(lang)) {
ret.add(lang);
}
}
}
return ret;
}
/**
* Checks whether a given language is in the list of supported languages.
*/
private boolean isLanguageSupported(String input) {
for (String lang : SUPPORTED_LANGUAGES) {
if (lang.equals(input)) {
return true;
}
}
return false;
}
/*
* Note that in our example, all data is packaged in our APK as
* assets (it could be a raw resource as well), so this check is
* strictly speaking unnecessary: it will always succeed.
*
* If, for example, engine data were downloaded or installed on external
* storage, this check would make much more sense.
*/
private boolean isDataInstalled(String lang) {
try {
InputStream is = getAssets().open(lang + ".freq");
if (is != null) {
is.close();
} else {
return false;
}
} catch (IOException e) {
Log.w(TAG, "Unable to find data for: " + lang + ", exception: " + e);
return false;
}
// The asset InputStream was non null, and therefore this
// data file is available.
return true;
}
}
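For context, the sketch below shows how a hypothetical client would drive the check above through the standard ACTION_CHECK_TTS_DATA intent and read back the result code and voice lists set via setResult(). It is not part of this change; the class name and request code are illustrative.

import android.app.Activity;
import android.content.Intent;
import android.speech.tts.TextToSpeech;
import java.util.ArrayList;

// Hypothetical client of CheckVoiceData, not part of this change.
public class VoiceDataCheckClient extends Activity {
    private static final int REQUEST_CHECK_DATA = 1; // illustrative request code

    private void startVoiceDataCheck() {
        Intent check = new Intent(TextToSpeech.Engine.ACTION_CHECK_TTS_DATA);
        // Direct the check at this sample engine rather than the default engine.
        check.setPackage("com.example.android.ttsengine");
        startActivityForResult(check, REQUEST_CHECK_DATA);
    }

    @Override
    protected void onActivityResult(int requestCode, int resultCode, Intent data) {
        super.onActivityResult(requestCode, resultCode, data);
        if (requestCode != REQUEST_CHECK_DATA) {
            return;
        }
        if (resultCode == TextToSpeech.Engine.CHECK_VOICE_DATA_PASS) {
            // All supported voices are installed; safe to synthesize.
        } else if (resultCode == TextToSpeech.Engine.CHECK_VOICE_DATA_MISSING_DATA) {
            // Some voices are usable, but data is missing for the languages below.
            ArrayList<String> missing = data.getStringArrayListExtra(
                    TextToSpeech.Engine.EXTRA_UNAVAILABLE_VOICES);
        } else {
            // CHECK_VOICE_DATA_FAIL: no usable voice data at all.
        }
    }
}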


@@ -0,0 +1,31 @@
/*
* Copyright (C) 2011 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.example.android.ttsengine;
import android.os.Bundle;
import android.preference.PreferenceFragment;
public class GeneralSettingsFragment extends PreferenceFragment {
static final String SHARED_PREFS_NAME = "RobotSpeakSettings";
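// WHISPER_KEY is expected to match the key of a boolean preference (for
// example a CheckBoxPreference) declared in res/xml/general_settings.xml;
// RobotSpeakTtsService reads it in getAmplitude() to lower the output volume.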
static final String WHISPER_KEY = "robot_speak_whisper";
@Override
public void onCreate(Bundle savedInstanceState) {
super.onCreate(savedInstanceState);
getPreferenceManager().setSharedPreferencesName(SHARED_PREFS_NAME);
addPreferencesFromResource(R.xml.general_settings);
}
}


@@ -0,0 +1,38 @@
/*
* Copyright (C) 2011 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.example.android.ttsengine;
import android.os.Bundle;
import android.preference.PreferenceActivity;
import java.util.List;
/*
* This class is referenced via a meta-data section in the manifest.
* A settings screen is optional, and if a given engine has no settings,
* there is no need to implement such a class.
*/
public class RobotSpeakSettings extends PreferenceActivity {
@Override
protected void onCreate(Bundle savedInstanceState) {
super.onCreate(savedInstanceState);
}
@Override
public void onBuildHeaders(List<Header> target) {
loadHeadersFromResource(R.xml.preferences_headers, target);
}
}


@@ -0,0 +1,294 @@
/*
* Copyright (C) 2011 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not
* use this file except in compliance with the License. You may obtain a copy of
* the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations under
* the License.
*/
package com.example.android.ttsengine;
import android.content.Context;
import android.content.SharedPreferences;
import android.media.AudioFormat;
import android.speech.tts.SynthesisCallback;
import android.speech.tts.SynthesisRequest;
import android.speech.tts.TextToSpeech;
import android.speech.tts.TextToSpeechService;
import android.util.Log;
import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.nio.ByteBuffer;
import java.nio.ByteOrder;
import java.util.HashMap;
import java.util.Map;
/**
* A text to speech engine that generates "speech" that a robot might understand.
* The engine supports two different "languages", each with its own frequency
* mapping.
*
* It exercises all aspects of the Text to speech engine API
* {@link android.speech.tts.TextToSpeechService}.
*/
public class RobotSpeakTtsService extends TextToSpeechService {
private static final String TAG = "ExampleTtsService";
/*
* This is the sampling rate of our output audio. This engine outputs
* audio at 16kHz, 16 bits per sample, PCM.
*/
private static final int SAMPLING_RATE_HZ = 16000;
/*
* We multiply by a factor of two since each sample contains 16 bits (2 bytes),
* so this buffer holds exactly one second of mono audio.
*/
private final byte[] mAudioBuffer = new byte[SAMPLING_RATE_HZ * 2];
private Map<Character, Integer> mFrequenciesMap;
private volatile String[] mCurrentLanguage = null;
private volatile boolean mStopRequested = false;
private SharedPreferences mSharedPrefs = null;
@Override
public void onCreate() {
super.onCreate();
mSharedPrefs = getSharedPreferences(GeneralSettingsFragment.SHARED_PREFS_NAME,
Context.MODE_PRIVATE);
// We load the default language when we start up. This isn't strictly
// required though; it could always be loaded lazily on the first call to
// onLoadLanguage or onSynthesizeText. This is a tradeoff between memory usage
// and the latency of the first call.
onLoadLanguage("eng", "usa", "");
}
@Override
public void onDestroy() {
super.onDestroy();
}
@Override
protected String[] onGetLanguage() {
// Note that mCurrentLanguage is volatile because this can be called from
// multiple threads.
return mCurrentLanguage;
}
@Override
protected int onIsLanguageAvailable(String lang, String country, String variant) {
// The robot speak synthesizer supports only English.
if ("eng".equals(lang)) {
// We support two specific robot languages, the British robot language
// and the American robot language.
if ("USA".equals(country) || "GBR".equals(country)) {
// If the engine supported a specific variant, we would have
// something like:
//
// if ("android".equals(variant)) {
// return TextToSpeech.LANG_COUNTRY_VAR_AVAILABLE;
// }
return TextToSpeech.LANG_COUNTRY_AVAILABLE;
}
// We support the language, but not the country.
return TextToSpeech.LANG_AVAILABLE;
}
return TextToSpeech.LANG_NOT_SUPPORTED;
}
/*
* Note that this method is synchronized, as is onSynthesizeText, because
* onLoadLanguage can be called from multiple threads (while onSynthesizeText
* is always called from a single thread only); synchronizing both prevents
* them from running concurrently with each other.
*/
@Override
protected synchronized int onLoadLanguage(String lang, String country, String variant) {
final int isLanguageAvailable = onIsLanguageAvailable(lang, country, variant);
if (isLanguageAvailable == TextToSpeech.LANG_NOT_SUPPORTED) {
return isLanguageAvailable;
}
String loadCountry = country;
if (isLanguageAvailable == TextToSpeech.LANG_AVAILABLE) {
loadCountry = "USA";
}
// If we've already loaded the requested language, we can return early.
if (mCurrentLanguage != null) {
if (mCurrentLanguage[0].equals(lang) && mCurrentLanguage[1].equals(loadCountry)) {
return isLanguageAvailable;
}
}
Map<Character, Integer> newFrequenciesMap = null;
try {
InputStream file = getAssets().open(lang + "-" + loadCountry + ".freq");
newFrequenciesMap = buildFrequencyMap(file);
file.close();
} catch (IOException e) {
Log.e(TAG, "Error loading data for : " + lang + "-" + country);
}
mFrequenciesMap = newFrequenciesMap;
mCurrentLanguage = new String[] { lang, loadCountry, ""};
return isLanguageAvailable;
}
@Override
protected void onStop() {
mStopRequested = true;
}
@Override
protected synchronized void onSynthesizeText(SynthesisRequest request,
SynthesisCallback callback) {
// Note that we call onLoadLanguage here since there is no guarantee
// that it has already been called for the requested language.
int load = onLoadLanguage(request.getLanguage(), request.getCountry(),
request.getVariant());
// We might get requests for a language we don't support - in which case
// we error out early before wasting too much time.
if (load == TextToSpeech.LANG_NOT_SUPPORTED) {
callback.error();
return;
}
// At this point, we have loaded the language we need for synthesis and
// it is guaranteed that we support it so we proceed with synthesis.
// We denote that we are ready to start sending audio across to the
// framework. We use a fixed sampling rate (16khz), and send data across
// in 16bit PCM mono.
callback.start(SAMPLING_RATE_HZ,
AudioFormat.ENCODING_PCM_16BIT, 1 /* Number of channels. */);
// We then scan through each character of the request string and
// generate audio for it.
final String text = request.getText().toLowerCase();
for (int i = 0; i < text.length(); ++i) {
char value = normalize(text.charAt(i));
// It is crucial to call either of callback.error() or callback.done() to ensure
// that audio / other resources are released as soon as possible.
if (!generateOneSecondOfAudio(value, callback)) {
callback.error();
return;
}
}
// Alright, we're done with our synthesis - yay!
callback.done();
}
/*
* Normalizes a given character to the range 'a' - 'z' (inclusive), leaving
* the space character untouched. Our frequency mappings contain frequencies
* for each of these characters (and a zero entry for space).
*/
private static char normalize(char input) {
if (input == ' ') {
return input;
}
if (input < 'a') {
return 'a';
}
if (input > 'z') {
return 'z';
}
return input;
}
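/*
 * Parses the frequency table shipped as an asset. Each line is expected to be
 * of the form "<character>:<frequency in Hz>", for example "a:100" (the values
 * actually shipped in the .freq assets are not shown in this change). A zero
 * frequency is added for the space character below.
 */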
private Map<Character, Integer> buildFrequencyMap(InputStream is) throws IOException {
BufferedReader br = new BufferedReader(new InputStreamReader(is));
String line = null;
Map<Character, Integer> map = new HashMap<Character, Integer>();
try {
while ((line = br.readLine()) != null) {
String[] parts = line.split(":");
if (parts.length != 2) {
throw new IOException("Invalid line encountered: " + line);
}
map.put(parts[0].charAt(0), Integer.parseInt(parts[1]));
}
map.put(' ', 0);
return map;
} finally {
is.close();
}
}
private boolean generateOneSecondOfAudio(char alphabet, SynthesisCallback cb) {
ByteBuffer buffer = ByteBuffer.wrap(mAudioBuffer).order(ByteOrder.LITTLE_ENDIAN);
// Someone called onStop, end the current synthesis and return.
// The mStopRequested variable will be reset at the beginning of the
// next synthesis.
//
// In general, a call to onStop() should make a best effort attempt
// to stop all processing for the *current* onSynthesizeText request (if
// one is active).
if (mStopRequested) {
return false;
}
if (mFrequenciesMap == null || !mFrequenciesMap.containsKey(alphabet)) {
return false;
}
final int frequency = mFrequenciesMap.get(alphabet);
if (frequency > 0) {
// This is the wavelength in samples. The frequency is chosen so that the
// waveLength is always a multiple of two and frequency divides the
// SAMPLING_RATE exactly.
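// For example, with SAMPLING_RATE_HZ = 16000 and an illustrative frequency of
// 400Hz (not necessarily a value from the .freq assets), waveLength is 40
// samples and times is 400: four hundred cycles of 20 "low" samples followed
// by 20 "high" samples, i.e. exactly one second of audio.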
final int waveLength = SAMPLING_RATE_HZ / frequency;
final int times = SAMPLING_RATE_HZ / waveLength;
for (int j = 0; j < times; ++j) {
// For a square wave, half of the samples will be at minus the amplitude
// and the other half at plus the amplitude (see getAmplitude()).
for (int i = 0; i < waveLength / 2; ++i) {
buffer.putShort((short)(getAmplitude() * -1));
}
for (int i = 0; i < waveLength / 2; ++i) {
buffer.putShort(getAmplitude());
}
}
} else {
// Play a second of silence.
for (int i = 0; i < mAudioBuffer.length / 2; ++i) {
buffer.putShort((short) 0);
}
}
// Get the maximum allowed size of data we can send across in audioAvailable.
final int maxBufferSize = cb.getMaxBufferSize();
int offset = 0;
while (offset < mAudioBuffer.length) {
int bytesToWrite = Math.min(maxBufferSize, mAudioBuffer.length - offset);
cb.audioAvailable(mAudioBuffer, offset, bytesToWrite);
offset += bytesToWrite;
}
return true;
}
private short getAmplitude() {
boolean whisper = mSharedPrefs.getBoolean(GeneralSettingsFragment.WHISPER_KEY, false);
return (short) (whisper ? 2048 : 8192);
}
}
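For completeness, here is a minimal sketch of how an application might select and drive this engine once it is installed. It is not part of this change, and it assumes a later platform level: the TextToSpeech constructor that takes an engine package name was only added in API 14.

import android.content.Context;
import android.speech.tts.TextToSpeech;
import java.util.Locale;

// Hypothetical client of RobotSpeakTtsService, not part of this change.
public class RobotSpeakClient implements TextToSpeech.OnInitListener {
    private final TextToSpeech mTts;

    public RobotSpeakClient(Context context) {
        // The engine-selecting constructor is only available on API 14 and above.
        mTts = new TextToSpeech(context, this, "com.example.android.ttsengine");
    }

    @Override
    public void onInit(int status) {
        if (status == TextToSpeech.SUCCESS) {
            // Locale.UK corresponds to the eng/GBR ISO3 codes this engine checks for.
            mTts.setLanguage(Locale.UK);
            mTts.speak("hello robot", TextToSpeech.QUEUE_FLUSH, null);
        }
    }

    public void shutdown() {
        mTts.shutdown();
    }
}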