1 /*
2  * Copyright (C) 2010 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License"); you may not
5  * use this file except in compliance with the License. You may obtain a copy of
6  * the License at
7  *
8  * http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
12  * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
13  * License for the specific language governing permissions and limitations under
14  * the License.
15  */
16 
17 package android.speech;
18 
19 import android.annotation.SdkConstant;
20 import android.annotation.SdkConstant.SdkConstantType;
21 import android.app.Service;
22 import android.content.Intent;
23 import android.content.PermissionChecker;
24 import android.os.Binder;
25 import android.os.Bundle;
26 import android.os.Handler;
27 import android.os.IBinder;
28 import android.os.Message;
29 import android.os.RemoteException;
30 import android.util.Log;
31 
32 import java.lang.ref.WeakReference;
33 
34 /**
35  * This class provides a base class for recognition service implementations. This class should be
36  * extended only in case you wish to implement a new speech recognizer. Please note that the
37  * implementation of this service is stateless.
38  */
39 public abstract class RecognitionService extends Service {
40     /**
41      * The {@link Intent} that must be declared as handled by the service.
42      */
43     @SdkConstant(SdkConstantType.SERVICE_ACTION)
44     public static final String SERVICE_INTERFACE = "android.speech.RecognitionService";
45 
46     /**
47      * Name under which a RecognitionService component publishes information about itself.
48      * This meta-data should reference an XML resource containing a
49      * <code>&lt;{@link android.R.styleable#RecognitionService recognition-service}&gt;</code> tag.
50      */
51     public static final String SERVICE_META_DATA = "android.speech";
52 
53     /** Log messages identifier */
54     private static final String TAG = "RecognitionService";
55 
56     /** Debugging flag */
57     private static final boolean DBG = false;
58 
59     /** Binder of the recognition service */
60     private RecognitionServiceBinder mBinder = new RecognitionServiceBinder(this);
61 
62     /**
63      * The current callback of an application that invoked the
64      * {@link RecognitionService#onStartListening(Intent, Callback)} method
65      */
66     private Callback mCurrentCallback = null;
67 
68     private static final int MSG_START_LISTENING = 1;
69 
70     private static final int MSG_STOP_LISTENING = 2;
71 
72     private static final int MSG_CANCEL = 3;
73 
74     private static final int MSG_RESET = 4;
75 
76     private final Handler mHandler = new Handler() {
77         @Override
78         public void handleMessage(Message msg) {
79             switch (msg.what) {
80                 case MSG_START_LISTENING:
81                     StartListeningArgs args = (StartListeningArgs) msg.obj;
82                     dispatchStartListening(args.mIntent, args.mListener, args.mCallingUid);
83                     break;
84                 case MSG_STOP_LISTENING:
85                     dispatchStopListening((IRecognitionListener) msg.obj);
86                     break;
87                 case MSG_CANCEL:
88                     dispatchCancel((IRecognitionListener) msg.obj);
89                     break;
90                 case MSG_RESET:
91                     dispatchClearCallback();
92                     break;
93             }
94         }
95     };
96 
dispatchStartListening(Intent intent, final IRecognitionListener listener, int callingUid)97     private void dispatchStartListening(Intent intent, final IRecognitionListener listener,
98             int callingUid) {
99         if (mCurrentCallback == null) {
100             if (DBG) Log.d(TAG, "created new mCurrentCallback, listener = " + listener.asBinder());
101             try {
102                 listener.asBinder().linkToDeath(new IBinder.DeathRecipient() {
103                     @Override
104                     public void binderDied() {
105                         mHandler.sendMessage(mHandler.obtainMessage(MSG_CANCEL, listener));
106                     }
107                 }, 0);
108             } catch (RemoteException re) {
109                 Log.e(TAG, "dead listener on startListening");
110                 return;
111             }
112             mCurrentCallback = new Callback(listener, callingUid);
113             RecognitionService.this.onStartListening(intent, mCurrentCallback);
114         } else {
115             try {
116                 listener.onError(SpeechRecognizer.ERROR_RECOGNIZER_BUSY);
117             } catch (RemoteException e) {
118                 Log.d(TAG, "onError call from startListening failed");
119             }
120             Log.i(TAG, "concurrent startListening received - ignoring this call");
121         }
122     }
123 
dispatchStopListening(IRecognitionListener listener)124     private void dispatchStopListening(IRecognitionListener listener) {
125         try {
126             if (mCurrentCallback == null) {
127                 listener.onError(SpeechRecognizer.ERROR_CLIENT);
128                 Log.w(TAG, "stopListening called with no preceding startListening - ignoring");
129             } else if (mCurrentCallback.mListener.asBinder() != listener.asBinder()) {
130                 listener.onError(SpeechRecognizer.ERROR_RECOGNIZER_BUSY);
131                 Log.w(TAG, "stopListening called by other caller than startListening - ignoring");
132             } else { // the correct state
133                 RecognitionService.this.onStopListening(mCurrentCallback);
134             }
135         } catch (RemoteException e) { // occurs if onError fails
136             Log.d(TAG, "onError call from stopListening failed");
137         }
138     }
139 
dispatchCancel(IRecognitionListener listener)140     private void dispatchCancel(IRecognitionListener listener) {
141         if (mCurrentCallback == null) {
142             if (DBG) Log.d(TAG, "cancel called with no preceding startListening - ignoring");
143         } else if (mCurrentCallback.mListener.asBinder() != listener.asBinder()) {
144             Log.w(TAG, "cancel called by client who did not call startListening - ignoring");
145         } else { // the correct state
146             RecognitionService.this.onCancel(mCurrentCallback);
147             mCurrentCallback = null;
148             if (DBG) Log.d(TAG, "canceling - setting mCurrentCallback to null");
149         }
150     }
151 
dispatchClearCallback()152     private void dispatchClearCallback() {
153         mCurrentCallback = null;
154     }
155 
156     private class StartListeningArgs {
157         public final Intent mIntent;
158 
159         public final IRecognitionListener mListener;
160         public final int mCallingUid;
161 
StartListeningArgs(Intent intent, IRecognitionListener listener, int callingUid)162         public StartListeningArgs(Intent intent, IRecognitionListener listener, int callingUid) {
163             this.mIntent = intent;
164             this.mListener = listener;
165             this.mCallingUid = callingUid;
166         }
167     }
168 
169     /**
170      * Checks whether the caller has sufficient permissions
171      *
172      * @param listener to send the error message to in case of error
173      * @return {@code true} if the caller has enough permissions, {@code false} otherwise
174      */
checkPermissions(IRecognitionListener listener)175     private boolean checkPermissions(IRecognitionListener listener) {
176         if (DBG) Log.d(TAG, "checkPermissions");
177         if (PermissionChecker.checkCallingOrSelfPermission(this,
178                 android.Manifest.permission.RECORD_AUDIO) == PermissionChecker.PERMISSION_GRANTED) {
179             return true;
180         }
181         try {
182             Log.e(TAG, "call for recognition service without RECORD_AUDIO permissions");
183             listener.onError(SpeechRecognizer.ERROR_INSUFFICIENT_PERMISSIONS);
184         } catch (RemoteException re) {
185             Log.e(TAG, "sending ERROR_INSUFFICIENT_PERMISSIONS message failed", re);
186         }
187         return false;
188     }
189 
190     /**
191      * Notifies the service that it should start listening for speech.
192      *
193      * @param recognizerIntent contains parameters for the recognition to be performed. The intent
194      *        may also contain optional extras, see {@link RecognizerIntent}. If these values are
195      *        not set explicitly, default values should be used by the recognizer.
196      * @param listener that will receive the service's callbacks
197      */
onStartListening(Intent recognizerIntent, Callback listener)198     protected abstract void onStartListening(Intent recognizerIntent, Callback listener);
199 
200     /**
201      * Notifies the service that it should cancel the speech recognition.
202      */
onCancel(Callback listener)203     protected abstract void onCancel(Callback listener);
204 
205     /**
206      * Notifies the service that it should stop listening for speech. Speech captured so far should
207      * be recognized as if the user had stopped speaking at this point. This method is only called
208      * if the application calls it explicitly.
209      */
onStopListening(Callback listener)210     protected abstract void onStopListening(Callback listener);
211 
212     @Override
onBind(final Intent intent)213     public final IBinder onBind(final Intent intent) {
214         if (DBG) Log.d(TAG, "onBind, intent=" + intent);
215         return mBinder;
216     }
217 
218     @Override
onDestroy()219     public void onDestroy() {
220         if (DBG) Log.d(TAG, "onDestroy");
221         mCurrentCallback = null;
222         mBinder.clearReference();
223         super.onDestroy();
224     }
225 
226     /**
227      * This class receives callbacks from the speech recognition service and forwards them to the
228      * user. An instance of this class is passed to the
229      * {@link RecognitionService#onStartListening(Intent, Callback)} method. Recognizers may call
230      * these methods on any thread.
231      */
232     public class Callback {
233         private final IRecognitionListener mListener;
234         private final int mCallingUid;
235 
Callback(IRecognitionListener listener, int callingUid)236         private Callback(IRecognitionListener listener, int callingUid) {
237             mListener = listener;
238             mCallingUid = callingUid;
239         }
240 
241         /**
242          * The service should call this method when the user has started to speak.
243          */
beginningOfSpeech()244         public void beginningOfSpeech() throws RemoteException {
245             if (DBG) Log.d(TAG, "beginningOfSpeech");
246             mListener.onBeginningOfSpeech();
247         }
248 
249         /**
250          * The service should call this method when sound has been received. The purpose of this
251          * function is to allow giving feedback to the user regarding the captured audio.
252          *
253          * @param buffer a buffer containing a sequence of big-endian 16-bit integers representing a
254          *        single channel audio stream. The sample rate is implementation dependent.
255          */
bufferReceived(byte[] buffer)256         public void bufferReceived(byte[] buffer) throws RemoteException {
257             mListener.onBufferReceived(buffer);
258         }
259 
260         /**
261          * The service should call this method after the user stops speaking.
262          */
endOfSpeech()263         public void endOfSpeech() throws RemoteException {
264             mListener.onEndOfSpeech();
265         }
266 
267         /**
268          * The service should call this method when a network or recognition error occurred.
269          *
270          * @param error code is defined in {@link SpeechRecognizer}
271          */
error(int error)272         public void error(int error) throws RemoteException {
273             Message.obtain(mHandler, MSG_RESET).sendToTarget();
274             mListener.onError(error);
275         }
276 
277         /**
278          * The service should call this method when partial recognition results are available. This
279          * method can be called at any time between {@link #beginningOfSpeech()} and
280          * {@link #results(Bundle)} when partial results are ready. This method may be called zero,
281          * one or multiple times for each call to {@link SpeechRecognizer#startListening(Intent)},
282          * depending on the speech recognition service implementation.
283          *
284          * @param partialResults the returned results. To retrieve the results in
285          *        ArrayList&lt;String&gt; format use {@link Bundle#getStringArrayList(String)} with
286          *        {@link SpeechRecognizer#RESULTS_RECOGNITION} as a parameter
287          */
partialResults(Bundle partialResults)288         public void partialResults(Bundle partialResults) throws RemoteException {
289             mListener.onPartialResults(partialResults);
290         }
291 
292         /**
293          * The service should call this method when the endpointer is ready for the user to start
294          * speaking.
295          *
296          * @param params parameters set by the recognition service. Reserved for future use.
297          */
readyForSpeech(Bundle params)298         public void readyForSpeech(Bundle params) throws RemoteException {
299             mListener.onReadyForSpeech(params);
300         }
301 
302         /**
303          * The service should call this method when recognition results are ready.
304          *
305          * @param results the recognition results. To retrieve the results in {@code
306          *        ArrayList<String>} format use {@link Bundle#getStringArrayList(String)} with
307          *        {@link SpeechRecognizer#RESULTS_RECOGNITION} as a parameter
308          */
results(Bundle results)309         public void results(Bundle results) throws RemoteException {
310             Message.obtain(mHandler, MSG_RESET).sendToTarget();
311             mListener.onResults(results);
312         }
313 
314         /**
315          * The service should call this method when the sound level in the audio stream has changed.
316          * There is no guarantee that this method will be called.
317          *
318          * @param rmsdB the new RMS dB value
319          */
rmsChanged(float rmsdB)320         public void rmsChanged(float rmsdB) throws RemoteException {
321             mListener.onRmsChanged(rmsdB);
322         }
323 
324         /**
325          * Return the Linux uid assigned to the process that sent you the current transaction that
326          * is being processed. This is obtained from {@link Binder#getCallingUid()}.
327          */
getCallingUid()328         public int getCallingUid() {
329             return mCallingUid;
330         }
331     }
332 
333     /** Binder of the recognition service */
334     private static final class RecognitionServiceBinder extends IRecognitionService.Stub {
335         private final WeakReference<RecognitionService> mServiceRef;
336 
RecognitionServiceBinder(RecognitionService service)337         public RecognitionServiceBinder(RecognitionService service) {
338             mServiceRef = new WeakReference<RecognitionService>(service);
339         }
340 
341         @Override
startListening(Intent recognizerIntent, IRecognitionListener listener)342         public void startListening(Intent recognizerIntent, IRecognitionListener listener) {
343             if (DBG) Log.d(TAG, "startListening called by:" + listener.asBinder());
344             final RecognitionService service = mServiceRef.get();
345             if (service != null && service.checkPermissions(listener)) {
346                 service.mHandler.sendMessage(Message.obtain(service.mHandler,
347                         MSG_START_LISTENING, service.new StartListeningArgs(
348                                 recognizerIntent, listener, Binder.getCallingUid())));
349             }
350         }
351 
352         @Override
stopListening(IRecognitionListener listener)353         public void stopListening(IRecognitionListener listener) {
354             if (DBG) Log.d(TAG, "stopListening called by:" + listener.asBinder());
355             final RecognitionService service = mServiceRef.get();
356             if (service != null && service.checkPermissions(listener)) {
357                 service.mHandler.sendMessage(Message.obtain(service.mHandler,
358                         MSG_STOP_LISTENING, listener));
359             }
360         }
361 
362         @Override
cancel(IRecognitionListener listener)363         public void cancel(IRecognitionListener listener) {
364             if (DBG) Log.d(TAG, "cancel called by:" + listener.asBinder());
365             final RecognitionService service = mServiceRef.get();
366             if (service != null && service.checkPermissions(listener)) {
367                 service.mHandler.sendMessage(Message.obtain(service.mHandler,
368                         MSG_CANCEL, listener));
369             }
370         }
371 
clearReference()372         public void clearReference() {
373             mServiceRef.clear();
374         }
375     }
376 }
377