| /* |
| * Copyright (C) 2013 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); you may not |
| * use this file except in compliance with the License. You may obtain a copy of |
| * the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT |
| * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the |
| * License for the specific language governing permissions and limitations under |
| * the License. |
| */ |
| |
| package android.speech.tts; |
| |
| import android.app.Activity; |
| import android.app.Application; |
| import android.content.ComponentName; |
| import android.content.Context; |
| import android.content.Intent; |
| import android.content.ServiceConnection; |
| import android.media.AudioManager; |
| import android.net.Uri; |
| import android.os.AsyncTask; |
| import android.os.Handler; |
| import android.os.IBinder; |
| import android.os.Looper; |
| import android.os.Message; |
| import android.os.ParcelFileDescriptor; |
| import android.os.RemoteException; |
| import android.speech.tts.ITextToSpeechCallback; |
| import android.speech.tts.ITextToSpeechService; |
| import android.util.Log; |
| import android.util.Pair; |
| |
| import java.io.File; |
| import java.io.FileNotFoundException; |
| import java.io.IOException; |
| import java.util.Collections; |
| import java.util.HashMap; |
| import java.util.List; |
| import java.util.concurrent.atomic.AtomicInteger; |
| |
| /** |
| * Synthesizes speech from text for immediate playback or to create a sound |
| * file. |
| * <p> |
| * This is an updated version of the speech synthesis client that supersedes |
| * {@link android.speech.tts.TextToSpeech}. |
| * <p> |
| * A TextToSpeechClient instance can only be used to synthesize text once it has |
| * connected to the service. The TextToSpeechClient instance will start establishing |
| * the connection after a call to the {@link #connect()} method. This is usually done in |
| * {@link Application#onCreate()} or {@link Activity#onCreate}. When the connection |
| * is established, the instance will call back using the |
| * {@link TextToSpeechClient.ConnectionCallbacks} interface. Only after a |
| * successful callback is the client usable. |
| * <p> |
| * After successful connection, the list of all available voices can be obtained |
| * by calling the {@link TextToSpeechClient#getEngineStatus()} method. The client can |
| * choose a voice using some custom heuristic and build a {@link RequestConfig} object |
| * using {@link RequestConfig.Builder}, or can use one of the common heuristics found |
| * in ({@link RequestConfigHelper}. |
| * <p> |
| * When you are done using the TextToSpeechClient instance, call the |
| * {@link #disconnect()} method to release the connection. |
| * <p> |
| * In the rare case of a change to the set of available voices, the service will call to the |
| * {@link ConnectionCallbacks#onEngineStatusChange} with new set of available voices as argument. |
| * In response, the client HAVE to recreate all {@link RequestConfig} instances in use. |
| */ |
| public class TextToSpeechClient { |
| private static final String TAG = TextToSpeechClient.class.getSimpleName(); |
| |
| private final Object mLock = new Object(); |
| private final TtsEngines mEnginesHelper; |
| private final Context mContext; |
| |
| // Guarded by mLock |
| private Connection mServiceConnection; |
| private final RequestCallbacks mDefaultRequestCallbacks; |
| private final ConnectionCallbacks mConnectionCallbacks; |
| private EngineStatus mEngineStatus; |
| private String mRequestedEngine; |
| private boolean mFallbackToDefault; |
| private HashMap<String, Pair<UtteranceId, RequestCallbacks>> mCallbacks; |
| // Guarded by mLock |
| |
| private InternalHandler mMainHandler = new InternalHandler(); |
| |
| /** Common voices parameters */ |
| public static final class Params { |
| private Params() {} |
| |
| /** |
| * Maximum allowed time for a single request attempt, in milliseconds, before synthesis |
| * fails (or fallback request starts, if requested using |
| * {@link #FALLBACK_VOICE_NAME}). |
| */ |
| public static final String NETWORK_TIMEOUT_MS = "networkTimeoutMs"; |
| |
| /** |
| * Number of network request retries that are attempted in case of failure |
| */ |
| public static final String NETWORK_RETRIES_COUNT = "networkRetriesCount"; |
| |
| /** |
| * Should synthesizer report sub-utterance progress on synthesis. Only applicable |
| * for the {@link TextToSpeechClient#queueSpeak} method. |
| */ |
| public static final String TRACK_SUBUTTERANCE_PROGRESS = "trackSubutteranceProgress"; |
| |
| /** |
| * If a voice exposes this parameter then it supports the fallback request feature. |
| * |
| * If it is set to a valid name of some other voice ({@link VoiceInfo#getName()}) then |
| * in case of request failure (due to network problems or missing data), fallback request |
| * will be attempted. Request will be done using the voice referenced by this parameter. |
| * If it is the case, the client will be informed by a callback to the {@link |
| * RequestCallbacks#onSynthesisFallback(UtteranceId)}. |
| */ |
| public static final String FALLBACK_VOICE_NAME = "fallbackVoiceName"; |
| |
| /** |
| * Audio parameter for specifying a linear multiplier to the speaking speed of the voice. |
| * The value is a float. Values below zero decrease speed of the synthesized speech |
| * values above one increase it. If the value of this parameter is equal to zero, |
| * then it will be replaced by a settings-configurable default before it reaches |
| * TTS service. |
| */ |
| public static final String SPEECH_SPEED = "speechSpeed"; |
| |
| /** |
| * Audio parameter for controlling the pitch of the output. The Value is a positive float, |
| * with default of {@code 1.0}. The value is used to scale the primary frequency linearly. |
| * Lower values lower the tone of the synthesized voice, greater values increase it. |
| */ |
| public static final String SPEECH_PITCH = "speechPitch"; |
| |
| /** |
| * Audio parameter for controlling output volume. Value is a float with scale of 0 to 1 |
| */ |
| public static final String AUDIO_PARAM_VOLUME = TextToSpeech.Engine.KEY_PARAM_VOLUME; |
| |
| /** |
| * Audio parameter for controlling output pan. |
| * Value is a float ranging from -1 to +1 where -1 maps to a hard-left pan, |
| * 0 to center (the default behavior), and +1 to hard-right. |
| */ |
| public static final String AUDIO_PARAM_PAN = TextToSpeech.Engine.KEY_PARAM_PAN; |
| |
| /** |
| * Audio parameter for specifying the audio stream type to be used when speaking text |
| * or playing back a file. The value should be one of the STREAM_ constants |
| * defined in {@link AudioManager}. |
| */ |
| public static final String AUDIO_PARAM_STREAM = TextToSpeech.Engine.KEY_PARAM_STREAM; |
| } |
| |
| /** |
| * Result codes for TTS operations. |
| */ |
| public static final class Status { |
| private Status() {} |
| |
| /** |
| * Denotes a successful operation. |
| */ |
| public static final int SUCCESS = 0; |
| |
| /** |
| * Denotes a stop requested by a client. It's used only on the service side of the API, |
| * client should never expect to see this result code. |
| */ |
| public static final int STOPPED = 100; |
| |
| /** |
| * Denotes a generic failure. |
| */ |
| public static final int ERROR_UNKNOWN = -1; |
| |
| /** |
| * Denotes a failure of a TTS engine to synthesize the given input. |
| */ |
| public static final int ERROR_SYNTHESIS = 10; |
| |
| /** |
| * Denotes a failure of a TTS service. |
| */ |
| public static final int ERROR_SERVICE = 11; |
| |
| /** |
| * Denotes a failure related to the output (audio device or a file). |
| */ |
| public static final int ERROR_OUTPUT = 12; |
| |
| /** |
| * Denotes a failure caused by a network connectivity problems. |
| */ |
| public static final int ERROR_NETWORK = 13; |
| |
| /** |
| * Denotes a failure caused by network timeout. |
| */ |
| public static final int ERROR_NETWORK_TIMEOUT = 14; |
| |
| /** |
| * Denotes a failure caused by an invalid request. |
| */ |
| public static final int ERROR_INVALID_REQUEST = 15; |
| |
| /** |
| * Denotes a failure related to passing a non-unique utterance id. |
| */ |
| public static final int ERROR_NON_UNIQUE_UTTERANCE_ID = 16; |
| |
| /** |
| * Denotes a failure related to missing data. The TTS implementation may download |
| * the missing data, and if so, request will succeed in future. This error can only happen |
| * for voices with {@link VoiceInfo#FEATURE_MAY_AUTOINSTALL} feature. |
| * Note: the recommended way to avoid this error is to create a request with the fallback |
| * voice. |
| */ |
| public static final int ERROR_DOWNLOADING_ADDITIONAL_DATA = 17; |
| } |
| |
| /** |
| * Set of callbacks for the events related to the progress of a synthesis request |
| * through the synthesis queue. Each synthesis request is associated with a call to |
| * {@link #queueSpeak} or {@link #queueSynthesizeToFile}. |
| * |
| * The callbacks specified in this method will NOT be called on UI thread. |
| */ |
| public static abstract class RequestCallbacks { |
| /** |
| * Called after synthesis of utterance successfully starts. |
| */ |
| public void onSynthesisStart(UtteranceId utteranceId) {} |
| |
| /** |
| * Called after synthesis successfully finishes. |
| * @param utteranceId |
| * Unique identifier of synthesized utterance. |
| */ |
| public void onSynthesisSuccess(UtteranceId utteranceId) {} |
| |
| /** |
| * Called after synthesis was stopped in middle of synthesis process. |
| * @param utteranceId |
| * Unique identifier of synthesized utterance. |
| */ |
| public void onSynthesisStop(UtteranceId utteranceId) {} |
| |
| /** |
| * Called when requested synthesis failed and fallback synthesis is about to be attempted. |
| * |
| * Requires voice with available {@link TextToSpeechClient.Params#FALLBACK_VOICE_NAME} |
| * parameter, and request with this parameter enabled. |
| * |
| * This callback will be followed by callback to the {@link #onSynthesisStart}, |
| * {@link #onSynthesisFailure} or {@link #onSynthesisSuccess} that depends on the |
| * fallback outcome. |
| * |
| * For more fallback feature reference, look at the |
| * {@link TextToSpeechClient.Params#FALLBACK_VOICE_NAME}. |
| * |
| * @param utteranceId |
| * Unique identifier of synthesized utterance. |
| */ |
| public void onSynthesisFallback(UtteranceId utteranceId) {} |
| |
| /** |
| * Called after synthesis of utterance fails. |
| * |
| * It may be called instead or after a {@link #onSynthesisStart} callback. |
| * |
| * @param utteranceId |
| * Unique identifier of synthesized utterance. |
| * @param errorCode |
| * One of the values from {@link Status}. |
| */ |
| public void onSynthesisFailure(UtteranceId utteranceId, int errorCode) {} |
| |
| /** |
| * Called during synthesis to mark synthesis progress. |
| * |
| * Requires voice with available |
| * {@link TextToSpeechClient.Params#TRACK_SUBUTTERANCE_PROGRESS} parameter, and |
| * request with this parameter enabled. |
| * |
| * @param utteranceId |
| * Unique identifier of synthesized utterance. |
| * @param charIndex |
| * String index (java char offset) of recently synthesized character. |
| * @param msFromStart |
| * Miliseconds from the start of the synthesis. |
| */ |
| public void onSynthesisProgress(UtteranceId utteranceId, int charIndex, |
| int msFromStart) {} |
| } |
| |
| /** |
| * Interface definition of callbacks that are called when the client is |
| * connected or disconnected from the TTS service. |
| * |
| * The callbacks specified in this method will be called on the UI thread. |
| */ |
| public static interface ConnectionCallbacks { |
| /** |
| * After calling {@link TextToSpeechClient#connect()}, this method will be invoked |
| * asynchronously when the connect request has successfully completed. |
| * |
| * Clients are strongly encouraged to call {@link TextToSpeechClient#getEngineStatus()} |
| * and create {@link RequestConfig} objects used in subsequent synthesis requests. |
| */ |
| public void onConnectionSuccess(); |
| |
| /** |
| * After calling {@link TextToSpeechClient#connect()}, this method may be invoked |
| * asynchronously when the connect request has failed to complete. |
| * |
| * It may be also invoked synchronously, from the body of |
| * {@link TextToSpeechClient#connect()} method. |
| */ |
| public void onConnectionFailure(); |
| |
| /** |
| * Called when the connection to the service is lost. This can happen if there is a problem |
| * with the speech service (e.g. a crash or resource problem causes it to be killed by the |
| * system). When called, all requests have been canceled and no outstanding listeners will |
| * be executed. Applications should disable UI components that require the service. |
| * |
| * When the service is working again, the client will receive a callback to the |
| * {@link #onConnectionSuccess()} method. |
| */ |
| public void onServiceDisconnected(); |
| |
| /** |
| * After receiving {@link #onConnectionSuccess()} callback, this method may be invoked |
| * if engine status obtained from {@link TextToSpeechClient#getEngineStatus()}) changes. |
| * It usually means that some voices were removed, changed or added. |
| * |
| * Clients are required to recreate {@link RequestConfig} objects used in subsequent |
| * synthesis requests. |
| */ |
| public void onEngineStatusChange(EngineStatus newEngineStatus); |
| } |
| |
| /** State of voices as provided by engine and user. */ |
| public static final class EngineStatus { |
| /** All available voices. */ |
| private final List<VoiceInfo> mVoices; |
| |
| /** Name of the TTS engine package */ |
| private final String mPackageName; |
| |
| private EngineStatus(String packageName, List<VoiceInfo> voices) { |
| this.mVoices = Collections.unmodifiableList(voices); |
| this.mPackageName = packageName; |
| } |
| |
| /** |
| * Get an immutable list of all Voices exposed by the TTS engine. |
| */ |
| public List<VoiceInfo> getVoices() { |
| return mVoices; |
| } |
| |
| /** |
| * Get name of the TTS engine package currently in use. |
| */ |
| public String getEnginePackage() { |
| return mPackageName; |
| } |
| } |
| |
| /** Unique synthesis request identifier. */ |
| public static class UtteranceId { |
| /** Unique identifier */ |
| private final int id; |
| |
| /** Unique identifier generator */ |
| private static final AtomicInteger ID_GENERATOR = new AtomicInteger(); |
| |
| /** |
| * Create new, unique UtteranceId instance. |
| */ |
| public UtteranceId() { |
| id = ID_GENERATOR.getAndIncrement(); |
| } |
| |
| /** |
| * Returns a unique string associated with an instance of this object. |
| * |
| * This string will be used to identify the synthesis request/utterance inside the |
| * TTS service. |
| */ |
| public final String toUniqueString() { |
| return "UID" + id; |
| } |
| } |
| |
| /** |
| * Create TextToSpeech service client. |
| * |
| * Will connect to the default TTS service. In order to be usable, {@link #connect()} need |
| * to be called first and successful connection callback need to be received. |
| * |
| * @param context |
| * The context this instance is running in. |
| * @param engine |
| * Package name of requested TTS engine. If it's null, then default engine will |
| * be selected regardless of {@code fallbackToDefaultEngine} parameter value. |
| * @param fallbackToDefaultEngine |
| * If requested engine is not available, should we fallback to the default engine? |
| * @param defaultRequestCallbacks |
| * Default request callbacks, it will be used for all synthesis requests without |
| * supplied RequestCallbacks instance. Can't be null. |
| * @param connectionCallbacks |
| * Callbacks for connecting and disconnecting from the service. Can't be null. |
| */ |
| public TextToSpeechClient(Context context, |
| String engine, boolean fallbackToDefaultEngine, |
| RequestCallbacks defaultRequestCallbacks, |
| ConnectionCallbacks connectionCallbacks) { |
| if (context == null) |
| throw new IllegalArgumentException("context can't be null"); |
| if (defaultRequestCallbacks == null) |
| throw new IllegalArgumentException("defaultRequestCallbacks can't be null"); |
| if (connectionCallbacks == null) |
| throw new IllegalArgumentException("connectionCallbacks can't be null"); |
| mContext = context; |
| mEnginesHelper = new TtsEngines(mContext); |
| mCallbacks = new HashMap<String, Pair<UtteranceId, RequestCallbacks>>(); |
| mDefaultRequestCallbacks = defaultRequestCallbacks; |
| mConnectionCallbacks = connectionCallbacks; |
| |
| mRequestedEngine = engine; |
| mFallbackToDefault = fallbackToDefaultEngine; |
| } |
| |
| /** |
| * Create TextToSpeech service client. Will connect to the default TTS |
| * service. In order to be usable, {@link #connect()} need to be called |
| * first and successful connection callback need to be received. |
| * |
| * @param context Context this instance is running in. |
| * @param defaultRequestCallbacks Default request callbacks, it |
| * will be used for all synthesis requests without supplied |
| * RequestCallbacks instance. Can't be null. |
| * @param connectionCallbacks Callbacks for connecting and disconnecting |
| * from the service. Can't be null. |
| */ |
| public TextToSpeechClient(Context context, RequestCallbacks defaultRequestCallbacks, |
| ConnectionCallbacks connectionCallbacks) { |
| this(context, null, true, defaultRequestCallbacks, connectionCallbacks); |
| } |
| |
| |
| private boolean initTts(String requestedEngine, boolean fallbackToDefaultEngine) { |
| // Step 1: Try connecting to the engine that was requested. |
| if (requestedEngine != null) { |
| if (mEnginesHelper.isEngineInstalled(requestedEngine)) { |
| if ((mServiceConnection = connectToEngine(requestedEngine)) != null) { |
| return true; |
| } else if (!fallbackToDefaultEngine) { |
| Log.w(TAG, "Couldn't connect to requested engine: " + requestedEngine); |
| return false; |
| } |
| } else if (!fallbackToDefaultEngine) { |
| Log.w(TAG, "Requested engine not installed: " + requestedEngine); |
| return false; |
| } |
| } |
| |
| // Step 2: Try connecting to the user's default engine. |
| final String defaultEngine = mEnginesHelper.getDefaultEngine(); |
| if (defaultEngine != null && !defaultEngine.equals(requestedEngine)) { |
| if ((mServiceConnection = connectToEngine(defaultEngine)) != null) { |
| return true; |
| } |
| } |
| |
| // Step 3: Try connecting to the highest ranked engine in the |
| // system. |
| final String highestRanked = mEnginesHelper.getHighestRankedEngineName(); |
| if (highestRanked != null && !highestRanked.equals(requestedEngine) && |
| !highestRanked.equals(defaultEngine)) { |
| if ((mServiceConnection = connectToEngine(highestRanked)) != null) { |
| return true; |
| } |
| } |
| |
| Log.w(TAG, "Couldn't find working TTS engine"); |
| return false; |
| } |
| |
| private Connection connectToEngine(String engine) { |
| Connection connection = new Connection(engine); |
| Intent intent = new Intent(TextToSpeech.Engine.INTENT_ACTION_TTS_SERVICE); |
| intent.setPackage(engine); |
| boolean bound = mContext.bindService(intent, connection, Context.BIND_AUTO_CREATE); |
| if (!bound) { |
| Log.e(TAG, "Failed to bind to " + engine); |
| return null; |
| } else { |
| Log.i(TAG, "Successfully bound to " + engine); |
| return connection; |
| } |
| } |
| |
| /** |
| * Connects the client to TTS service. This method returns immediately, and connects to the |
| * service in the background. |
| * |
| * After connection initializes successfully, {@link ConnectionCallbacks#onConnectionSuccess()} |
| * is called. On a failure {@link ConnectionCallbacks#onConnectionFailure} is called. |
| * |
| * Both of those callback may be called asynchronously on the main thread, |
| * {@link ConnectionCallbacks#onConnectionFailure} may be called synchronously, before |
| * this method returns. |
| */ |
| public void connect() { |
| synchronized (mLock) { |
| if (mServiceConnection != null) { |
| return; |
| } |
| if(!initTts(mRequestedEngine, mFallbackToDefault)) { |
| mConnectionCallbacks.onConnectionFailure(); |
| } |
| } |
| } |
| |
| /** |
| * Checks if the client is currently connected to the service, so that |
| * requests to other methods will succeed. |
| */ |
| public boolean isConnected() { |
| synchronized (mLock) { |
| return mServiceConnection != null && mServiceConnection.isEstablished(); |
| } |
| } |
| |
| /** |
| * Closes the connection to TextToSpeech service. No calls can be made on this object after |
| * calling this method. |
| * It is good practice to call this method in the onDestroy() method of an Activity |
| * so the TextToSpeech engine can be cleanly stopped. |
| */ |
| public void disconnect() { |
| synchronized (mLock) { |
| if (mServiceConnection != null) { |
| mServiceConnection.disconnect(); |
| mServiceConnection = null; |
| mCallbacks.clear(); |
| } |
| } |
| } |
| |
| /** |
| * Register callback. |
| * |
| * @param utteranceId Non-null UtteranceId instance. |
| * @param callback Non-null callbacks for the request |
| * @return Status.SUCCESS or error code in case of invalid arguments. |
| */ |
| private int addCallback(UtteranceId utteranceId, RequestCallbacks callback) { |
| synchronized (mLock) { |
| if (utteranceId == null || callback == null) { |
| return Status.ERROR_INVALID_REQUEST; |
| } |
| if (mCallbacks.put(utteranceId.toUniqueString(), |
| new Pair<UtteranceId, RequestCallbacks>(utteranceId, callback)) != null) { |
| return Status.ERROR_NON_UNIQUE_UTTERANCE_ID; |
| } |
| return Status.SUCCESS; |
| } |
| } |
| |
| /** |
| * Remove and return callback. |
| * |
| * @param utteranceIdStr Unique string obtained from {@link UtteranceId#toUniqueString}. |
| */ |
| private Pair<UtteranceId, RequestCallbacks> removeCallback(String utteranceIdStr) { |
| synchronized (mLock) { |
| return mCallbacks.remove(utteranceIdStr); |
| } |
| } |
| |
| /** |
| * Get callback and utterance id. |
| * |
| * @param utteranceIdStr Unique string obtained from {@link UtteranceId#toUniqueString}. |
| */ |
| private Pair<UtteranceId, RequestCallbacks> getCallback(String utteranceIdStr) { |
| synchronized (mLock) { |
| return mCallbacks.get(utteranceIdStr); |
| } |
| } |
| |
| /** |
| * Remove callback and call {@link RequestCallbacks#onSynthesisFailure} with passed |
| * error code. |
| * |
| * @param utteranceIdStr Unique string obtained from {@link UtteranceId#toUniqueString}. |
| * @param errorCode argument to {@link RequestCallbacks#onSynthesisFailure} call. |
| */ |
| private void removeCallbackAndErr(String utteranceIdStr, int errorCode) { |
| synchronized (mLock) { |
| Pair<UtteranceId, RequestCallbacks> c = mCallbacks.remove(utteranceIdStr); |
| c.second.onSynthesisFailure(c.first, errorCode); |
| } |
| } |
| |
| /** |
| * Retrieve TTS engine status {@link EngineStatus}. Requires connected client. |
| */ |
| public EngineStatus getEngineStatus() { |
| synchronized (mLock) { |
| return mEngineStatus; |
| } |
| } |
| |
| /** |
| * Query TTS engine about available voices and defaults. |
| * |
| * @return EngineStatus is connected or null if client is disconnected. |
| */ |
| private EngineStatus requestEngineStatus(ITextToSpeechService service) |
| throws RemoteException { |
| List<VoiceInfo> voices = service.getVoicesInfo(); |
| if (voices == null) { |
| Log.e(TAG, "Requested engine doesn't support TTS V2 API"); |
| return null; |
| } |
| |
| return new EngineStatus(mServiceConnection.getEngineName(), voices); |
| } |
| |
| private class Connection implements ServiceConnection { |
| private final String mEngineName; |
| |
| private ITextToSpeechService mService; |
| |
| private boolean mEstablished; |
| |
| private PrepareConnectionAsyncTask mSetupConnectionAsyncTask; |
| |
| public Connection(String engineName) { |
| this.mEngineName = engineName; |
| } |
| |
| private final ITextToSpeechCallback.Stub mCallback = new ITextToSpeechCallback.Stub() { |
| |
| @Override |
| public void onStart(String utteranceIdStr) { |
| synchronized (mLock) { |
| Pair<UtteranceId, RequestCallbacks> callbacks = getCallback(utteranceIdStr); |
| callbacks.second.onSynthesisStart(callbacks.first); |
| } |
| } |
| |
| public void onStop(String utteranceIdStr) { |
| synchronized (mLock) { |
| Pair<UtteranceId, RequestCallbacks> callbacks = removeCallback(utteranceIdStr); |
| callbacks.second.onSynthesisStop(callbacks.first); |
| } |
| } |
| |
| @Override |
| public void onSuccess(String utteranceIdStr) { |
| synchronized (mLock) { |
| Pair<UtteranceId, RequestCallbacks> callbacks = removeCallback(utteranceIdStr); |
| callbacks.second.onSynthesisSuccess(callbacks.first); |
| } |
| } |
| |
| public void onFallback(String utteranceIdStr) { |
| synchronized (mLock) { |
| Pair<UtteranceId, RequestCallbacks> callbacks = getCallback( |
| utteranceIdStr); |
| callbacks.second.onSynthesisFallback(callbacks.first); |
| } |
| }; |
| |
| @Override |
| public void onError(String utteranceIdStr, int errorCode) { |
| removeCallbackAndErr(utteranceIdStr, errorCode); |
| } |
| |
| @Override |
| public void onVoicesInfoChange(List<VoiceInfo> voicesInfo) { |
| synchronized (mLock) { |
| mEngineStatus = new EngineStatus(mServiceConnection.getEngineName(), |
| voicesInfo); |
| mMainHandler.obtainMessage(InternalHandler.WHAT_ENGINE_STATUS_CHANGED, |
| mEngineStatus).sendToTarget(); |
| } |
| } |
| }; |
| |
| private class PrepareConnectionAsyncTask extends AsyncTask<Void, Void, EngineStatus> { |
| |
| private final ComponentName mName; |
| |
| public PrepareConnectionAsyncTask(ComponentName name) { |
| mName = name; |
| } |
| |
| @Override |
| protected EngineStatus doInBackground(Void... params) { |
| synchronized(mLock) { |
| if (isCancelled()) { |
| return null; |
| } |
| try { |
| mService.setCallback(getCallerIdentity(), mCallback); |
| return requestEngineStatus(mService); |
| } catch (RemoteException re) { |
| Log.e(TAG, "Error setting up the TTS service"); |
| return null; |
| } |
| } |
| } |
| |
| @Override |
| protected void onPostExecute(EngineStatus result) { |
| synchronized(mLock) { |
| if (mSetupConnectionAsyncTask == this) { |
| mSetupConnectionAsyncTask = null; |
| } |
| if (result == null) { |
| Log.e(TAG, "Setup task failed"); |
| disconnect(); |
| mConnectionCallbacks.onConnectionFailure(); |
| return; |
| } |
| |
| mEngineStatus = result; |
| mEstablished = true; |
| } |
| mConnectionCallbacks.onConnectionSuccess(); |
| } |
| } |
| |
| @Override |
| public void onServiceConnected(ComponentName name, IBinder service) { |
| Log.i(TAG, "Connected to " + name); |
| |
| synchronized(mLock) { |
| mEstablished = false; |
| mService = ITextToSpeechService.Stub.asInterface(service); |
| startSetupConnectionTask(name); |
| } |
| } |
| |
| @Override |
| public void onServiceDisconnected(ComponentName name) { |
| Log.i(TAG, "Asked to disconnect from " + name); |
| |
| synchronized(mLock) { |
| mEstablished = false; |
| mService = null; |
| stopSetupConnectionTask(); |
| } |
| mMainHandler.obtainMessage(InternalHandler.WHAT_SERVICE_DISCONNECTED).sendToTarget(); |
| } |
| |
| private void startSetupConnectionTask(ComponentName name) { |
| stopSetupConnectionTask(); |
| mSetupConnectionAsyncTask = new PrepareConnectionAsyncTask(name); |
| mSetupConnectionAsyncTask.execute(); |
| } |
| |
| private boolean stopSetupConnectionTask() { |
| boolean result = false; |
| if (mSetupConnectionAsyncTask != null) { |
| result = mSetupConnectionAsyncTask.cancel(false); |
| mSetupConnectionAsyncTask = null; |
| } |
| return result; |
| } |
| |
| IBinder getCallerIdentity() { |
| return mCallback; |
| } |
| |
| boolean isEstablished() { |
| return mService != null && mEstablished; |
| } |
| |
| <T> ActionResult<T> runAction(Action<T> action) { |
| synchronized (mLock) { |
| try { |
| return new ActionResult<T>(true, action.run(mService)); |
| } catch (Exception ex) { |
| Log.e(TAG, action.getName() + " failed", ex); |
| disconnect(); |
| return new ActionResult<T>(false); |
| } |
| } |
| } |
| |
| void disconnect() { |
| mContext.unbindService(this); |
| stopSetupConnectionTask(); |
| mService = null; |
| mEstablished = false; |
| if (mServiceConnection == this) { |
| mServiceConnection = null; |
| } |
| } |
| |
| String getEngineName() { |
| return mEngineName; |
| } |
| } |
| |
| private abstract class Action<T> { |
| private final String mName; |
| |
| public Action(String name) { |
| mName = name; |
| } |
| |
| public String getName() {return mName;} |
| abstract T run(ITextToSpeechService service) throws RemoteException; |
| } |
| |
| private class ActionResult<T> { |
| boolean mSuccess; |
| T mResult; |
| |
| ActionResult(boolean success) { |
| mSuccess = success; |
| } |
| |
| ActionResult(boolean success, T result) { |
| mSuccess = success; |
| mResult = result; |
| } |
| } |
| |
| private IBinder getCallerIdentity() { |
| if (mServiceConnection != null) { |
| return mServiceConnection.getCallerIdentity(); |
| } |
| return null; |
| } |
| |
| private <T> ActionResult<T> runAction(Action<T> action) { |
| synchronized (mLock) { |
| if (mServiceConnection == null) { |
| Log.w(TAG, action.getName() + " failed: not bound to TTS engine"); |
| return new ActionResult<T>(false); |
| } |
| if (!mServiceConnection.isEstablished()) { |
| Log.w(TAG, action.getName() + " failed: not fully bound to TTS engine"); |
| return new ActionResult<T>(false); |
| } |
| return mServiceConnection.runAction(action); |
| } |
| } |
| |
| private static final String ACTION_STOP_NAME = "stop"; |
| |
| /** |
| * Interrupts the current utterance spoken (whether played or rendered to file) and discards |
| * other utterances in the queue. |
| */ |
| public void stop() { |
| runAction(new Action<Void>(ACTION_STOP_NAME) { |
| @Override |
| public Void run(ITextToSpeechService service) throws RemoteException { |
| if (service.stop(getCallerIdentity()) != Status.SUCCESS) { |
| Log.e(TAG, "Stop failed"); |
| } |
| mCallbacks.clear(); |
| return null; |
| } |
| }); |
| } |
| |
| private static final String ACTION_QUEUE_SPEAK_NAME = "queueSpeak"; |
| |
| /** |
| * Speaks the string using the specified queuing strategy and the current |
| * voice. This method is asynchronous, i.e. the method just adds the request |
| * to the queue of TTS requests and then returns. The synthesis might not |
| * have finished (or even started!) at the time when this method returns. |
| * |
| * @param utterance The string of text to be spoken. No longer than |
| * 1000 characters. |
| * @param utteranceId Unique identificator used to track the synthesis progress |
| * in {@link RequestCallbacks}. |
| * @param config Synthesis request configuration. Can't be null. Has to contain a |
| * voice. |
| * @param callbacks Synthesis request callbacks. If null, the default request |
| * callbacks object will be used. |
| */ |
| public void queueSpeak(final String utterance, final UtteranceId utteranceId, |
| final RequestConfig config, |
| final RequestCallbacks callbacks) { |
| queueSpeak(createMarkupFromString(utterance), utteranceId, config, callbacks); |
| } |
| |
| /** |
| * Speaks the {@link Markup} (which can be constructed with {@link Utterance}) using |
| * the specified queuing strategy and the current voice. This method is |
| * asynchronous, i.e. the method just adds the request to the queue of TTS |
| * requests and then returns. The synthesis might not have finished (or even |
| * started!) at the time when this method returns. |
| * |
| * @param markup The Markup to be spoken. The written equivalent of the spoken |
| * text should be no longer than 1000 characters. |
| * @param utteranceId Unique identificator used to track the synthesis progress |
| * in {@link RequestCallbacks}. |
| * @param config Synthesis request configuration. Can't be null. Has to contain a |
| * voice. |
| * @param callbacks Synthesis request callbacks. If null, the default request |
| * callbacks object will be used. |
| */ |
| public void queueSpeak(final Markup markup, |
| final UtteranceId utteranceId, |
| final RequestConfig config, |
| final RequestCallbacks callbacks) { |
| runAction(new Action<Void>(ACTION_QUEUE_SPEAK_NAME) { |
| @Override |
| public Void run(ITextToSpeechService service) throws RemoteException { |
| RequestCallbacks c = mDefaultRequestCallbacks; |
| if (callbacks != null) { |
| c = callbacks; |
| } |
| int addCallbackStatus = addCallback(utteranceId, c); |
| if (addCallbackStatus != Status.SUCCESS) { |
| c.onSynthesisFailure(utteranceId, Status.ERROR_INVALID_REQUEST); |
| return null; |
| } |
| |
| int queueResult = service.speakV2( |
| getCallerIdentity(), |
| new SynthesisRequestV2(markup, utteranceId.toUniqueString(), config)); |
| if (queueResult != Status.SUCCESS) { |
| removeCallbackAndErr(utteranceId.toUniqueString(), queueResult); |
| } |
| return null; |
| } |
| }); |
| } |
| |
| private static final String ACTION_QUEUE_SYNTHESIZE_TO_FILE = "queueSynthesizeToFile"; |
| |
| /** |
| * Synthesizes the given text to a file using the specified parameters. This |
| * method is asynchronous, i.e. the method just adds the request to the |
| * queue of TTS requests and then returns. The synthesis might not have |
| * finished (or even started!) at the time when this method returns. |
| * |
| * @param utterance The text that should be synthesized. No longer than |
| * 1000 characters. |
| * @param utteranceId Unique identificator used to track the synthesis progress |
| * in {@link RequestCallbacks}. |
| * @param outputFile File to write the generated audio data to. |
| * @param config Synthesis request configuration. Can't be null. Have to contain a |
| * voice. |
| * @param callbacks Synthesis request callbacks. If null, the default request |
| * callbacks object will be used. |
| */ |
| public void queueSynthesizeToFile(final String utterance, final UtteranceId utteranceId, |
| final File outputFile, final RequestConfig config, |
| final RequestCallbacks callbacks) { |
| queueSynthesizeToFile(createMarkupFromString(utterance), utteranceId, outputFile, config, callbacks); |
| } |
| |
| /** |
| * Synthesizes the given {@link Markup} (can be constructed with {@link Utterance}) |
| * to a file using the specified parameters. This method is asynchronous, i.e. the |
| * method just adds the request to the queue of TTS requests and then returns. The |
| * synthesis might not have finished (or even started!) at the time when this method |
| * returns. |
| * |
| * @param markup The Markup that should be synthesized. The written equivalent of |
| * the spoken text should be no longer than 1000 characters. |
| * @param utteranceId Unique identificator used to track the synthesis progress |
| * in {@link RequestCallbacks}. |
| * @param outputFile File to write the generated audio data to. |
| * @param config Synthesis request configuration. Can't be null. Have to contain a |
| * voice. |
| * @param callbacks Synthesis request callbacks. If null, the default request |
| * callbacks object will be used. |
| */ |
| public void queueSynthesizeToFile( |
| final Markup markup, |
| final UtteranceId utteranceId, |
| final File outputFile, final RequestConfig config, |
| final RequestCallbacks callbacks) { |
| runAction(new Action<Void>(ACTION_QUEUE_SYNTHESIZE_TO_FILE) { |
| @Override |
| public Void run(ITextToSpeechService service) throws RemoteException { |
| RequestCallbacks c = mDefaultRequestCallbacks; |
| if (callbacks != null) { |
| c = callbacks; |
| } |
| int addCallbackStatus = addCallback(utteranceId, c); |
| if (addCallbackStatus != Status.SUCCESS) { |
| c.onSynthesisFailure(utteranceId, Status.ERROR_INVALID_REQUEST); |
| return null; |
| } |
| |
| ParcelFileDescriptor fileDescriptor = null; |
| try { |
| if (outputFile.exists() && !outputFile.canWrite()) { |
| Log.e(TAG, "No permissions to write to " + outputFile); |
| removeCallbackAndErr(utteranceId.toUniqueString(), Status.ERROR_OUTPUT); |
| return null; |
| } |
| fileDescriptor = ParcelFileDescriptor.open(outputFile, |
| ParcelFileDescriptor.MODE_WRITE_ONLY | |
| ParcelFileDescriptor.MODE_CREATE | |
| ParcelFileDescriptor.MODE_TRUNCATE); |
| |
| int queueResult = service.synthesizeToFileDescriptorV2(getCallerIdentity(), |
| fileDescriptor, |
| new SynthesisRequestV2(markup, utteranceId.toUniqueString(), config)); |
| fileDescriptor.close(); |
| if (queueResult != Status.SUCCESS) { |
| removeCallbackAndErr(utteranceId.toUniqueString(), queueResult); |
| } |
| } catch (FileNotFoundException e) { |
| Log.e(TAG, "Opening file " + outputFile + " failed", e); |
| removeCallbackAndErr(utteranceId.toUniqueString(), Status.ERROR_OUTPUT); |
| } catch (IOException e) { |
| Log.e(TAG, "Closing file " + outputFile + " failed", e); |
| removeCallbackAndErr(utteranceId.toUniqueString(), Status.ERROR_OUTPUT); |
| } |
| return null; |
| } |
| }); |
| } |
| |
| private static Markup createMarkupFromString(String str) { |
| return new Utterance() |
| .append(new Utterance.TtsText(str)) |
| .setNoWarningOnFallback(true) |
| .createMarkup(); |
| } |
| |
| private static final String ACTION_QUEUE_SILENCE_NAME = "queueSilence"; |
| |
| /** |
| * Plays silence for the specified amount of time. This method is asynchronous, |
| * i.e. the method just adds the request to the queue of TTS requests and then |
| * returns. The synthesis might not have finished (or even started!) at the time |
| * when this method returns. |
| * |
| * @param durationInMs The duration of the silence in milliseconds. |
| * @param utteranceId Unique identificator used to track the synthesis progress |
| * in {@link RequestCallbacks}. |
| * @param callbacks Synthesis request callbacks. If null, default request |
| * callbacks object will be used. |
| */ |
| public void queueSilence(final long durationInMs, final UtteranceId utteranceId, |
| final RequestCallbacks callbacks) { |
| runAction(new Action<Void>(ACTION_QUEUE_SILENCE_NAME) { |
| @Override |
| public Void run(ITextToSpeechService service) throws RemoteException { |
| RequestCallbacks c = mDefaultRequestCallbacks; |
| if (callbacks != null) { |
| c = callbacks; |
| } |
| int addCallbackStatus = addCallback(utteranceId, c); |
| if (addCallbackStatus != Status.SUCCESS) { |
| c.onSynthesisFailure(utteranceId, Status.ERROR_INVALID_REQUEST); |
| } |
| |
| int queueResult = service.playSilence(getCallerIdentity(), durationInMs, |
| TextToSpeech.QUEUE_ADD, utteranceId.toUniqueString()); |
| |
| if (queueResult != Status.SUCCESS) { |
| removeCallbackAndErr(utteranceId.toUniqueString(), queueResult); |
| } |
| return null; |
| } |
| }); |
| } |
| |
| |
| private static final String ACTION_QUEUE_AUDIO_NAME = "queueAudio"; |
| |
| /** |
| * Plays the audio resource using the specified parameters. |
| * This method is asynchronous, i.e. the method just adds the request to the queue of TTS |
| * requests and then returns. The synthesis might not have finished (or even started!) at the |
| * time when this method returns. |
| * |
| * @param audioUrl The audio resource that should be played |
| * @param utteranceId Unique identificator used to track synthesis progress |
| * in {@link RequestCallbacks}. |
| * @param config Synthesis request configuration. Can't be null. Doesn't have to contain a |
| * voice (only system parameters are used). |
| * @param callbacks Synthesis request callbacks. If null, default request |
| * callbacks object will be used. |
| */ |
| public void queueAudio(final Uri audioUrl, final UtteranceId utteranceId, |
| final RequestConfig config, final RequestCallbacks callbacks) { |
| runAction(new Action<Void>(ACTION_QUEUE_AUDIO_NAME) { |
| @Override |
| public Void run(ITextToSpeechService service) throws RemoteException { |
| RequestCallbacks c = mDefaultRequestCallbacks; |
| if (callbacks != null) { |
| c = callbacks; |
| } |
| int addCallbackStatus = addCallback(utteranceId, c); |
| if (addCallbackStatus != Status.SUCCESS) { |
| c.onSynthesisFailure(utteranceId, Status.ERROR_INVALID_REQUEST); |
| } |
| |
| int queueResult = service.playAudioV2(getCallerIdentity(), audioUrl, |
| utteranceId.toUniqueString(), config.getVoiceParams()); |
| |
| if (queueResult != Status.SUCCESS) { |
| removeCallbackAndErr(utteranceId.toUniqueString(), queueResult); |
| } |
| return null; |
| } |
| }); |
| } |
| |
| private static final String ACTION_IS_SPEAKING_NAME = "isSpeaking"; |
| |
| /** |
| * Checks whether the TTS engine is busy speaking. Note that a speech item is |
| * considered complete once it's audio data has been sent to the audio mixer, or |
| * written to a file. There might be a finite lag between this point, and when |
| * the audio hardware completes playback. |
| * |
| * @return {@code true} if the TTS engine is speaking. |
| */ |
| public boolean isSpeaking() { |
| ActionResult<Boolean> result = runAction(new Action<Boolean>(ACTION_IS_SPEAKING_NAME) { |
| @Override |
| public Boolean run(ITextToSpeechService service) throws RemoteException { |
| return service.isSpeaking(); |
| } |
| }); |
| if (!result.mSuccess) { |
| return false; // We can't really say, return false |
| } |
| return result.mResult; |
| } |
| |
| |
| class InternalHandler extends Handler { |
| final static int WHAT_ENGINE_STATUS_CHANGED = 1; |
| final static int WHAT_SERVICE_DISCONNECTED = 2; |
| |
| @Override |
| public void handleMessage(Message msg) { |
| switch (msg.what) { |
| case WHAT_ENGINE_STATUS_CHANGED: |
| mConnectionCallbacks.onEngineStatusChange((EngineStatus) msg.obj); |
| return; |
| case WHAT_SERVICE_DISCONNECTED: |
| mConnectionCallbacks.onServiceDisconnected(); |
| return; |
| } |
| } |
| } |
| } |