src/starboard/speech_recognizer.h - cobalt - Git at Google

 // Copyright 2017 The Cobalt Authors. All Rights Reserved.
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //     http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.

 // Module Overview: Starboard speech recognizer module
 //
 // Defines a streaming speech recognizer API. It provides access to the platform
 // speech recognition service.
 //
 // Note that there can be only one speech recognizer. Attempting to create a
 // second speech recognizer without destroying the first one will result in
 // undefined behavior.
 //
 // |SbSpeechRecognizerCreate|, |SbSpeechRecognizerStart|,
 // |SbSpeechRecognizerStop|, |SbSpeechRecognizerCancel| and
 // |SbSpeechRecognizerDestroy| should be called from a single thread. Callbacks
 // defined in |SbSpeechRecognizerHandler| will happen on another thread, so
 // calls back into the SbSpeechRecognizer from the callback thread are
 // disallowed.

 #ifndef STARBOARD_SPEECH_RECOGNIZER_H_
 #define STARBOARD_SPEECH_RECOGNIZER_H_

 #include "starboard/configuration.h"
 #include "starboard/export.h"
 #include "starboard/types.h"

 #if SB_API_VERSION >= 12 || SB_HAS(SPEECH_RECOGNIZER) && SB_API_VERSION >= 5

 #ifdef __cplusplus
 extern "C" {
 #endif

 // An opaque handle to an implementation-private structure that represents a
 // speech recognizer.
 typedef struct SbSpeechRecognizerPrivate* SbSpeechRecognizer;

 // Well-defined value for an invalid speech recognizer handle.
 #define kSbSpeechRecognizerInvalid ((SbSpeechRecognizer)NULL)

 // Indicates whether the given speech recognizer is valid.
 static SB_C_INLINE bool SbSpeechRecognizerIsValid(
     SbSpeechRecognizer recognizer) {
   return recognizer != kSbSpeechRecognizerInvalid;
 }

 // Indicates what has gone wrong with the recognition.
 typedef enum SbSpeechRecognizerError {
   // No speech was detected. Speech timed out.
   kSbNoSpeechError,
   // Speech input was aborted somehow.
   kSbAborted,
   // Audio capture failed.
   kSbAudioCaptureError,
   // Some network communication that was required to complete the recognition
   // failed.
   kSbNetworkError,
   // The implementation is not allowing any speech input to occur for reasons of
   // security, privacy or user preference.
   kSbNotAllowed,
   // The implementation is not allowing the application requested speech
   // service, but would allow some speech service, to be used either because the
   // implementation doesn't support the selected one or because of reasons of
   // security, privacy or user preference.
   kSbServiceNotAllowed,
   // There was an error in the speech recognition grammar or semantic tags, or
   // the grammar format or semantic tag format is supported.
   kSbBadGrammar,
   // The language was not supported.
   kSbLanguageNotSupported,
 } SbSpeechRecognizerError;

 // The recognition response that is received from the recognizer.
 typedef struct SbSpeechResult {
   // The raw words that the user spoke.
   char* transcript;
   // A numeric estimate between 0 and 1 of how confident the recognition system
   // is that the recognition is correct. A higher number means the system is
   // more confident. NaN represents an unavailable confidence score.
   float confidence;
 } SbSpeechResult;

 typedef struct SbSpeechConfiguration {
   // When the continuous value is set to false, the implementation MUST
   // return no more than one final result in response to starting recognition.
   // When the continuous attribute is set to true, the implementation MUST
   // return zero or more final results representing multiple consecutive
   // recognitions in response to starting recognition. This attribute setting
   // does not affect interim results.
   bool continuous;
   // Controls whether interim results are returned. When set to true, interim
   // results SHOULD be returned. When set to false, interim results MUST NOT be
   // returned. This value setting does not affect final results.
   bool interim_results;
   // This sets the maximum number of SbSpeechResult in
   // |SbSpeechRecognizerOnResults| callback.
   int max_alternatives;
 } SbSpeechConfiguration;

 // A function to notify that the user has started to speak or stops speaking.
 // |detected|: true if the user has started to speak, and false if the user
 // stops speaking.
 typedef void (*SbSpeechRecognizerSpeechDetectedFunction)(void* context,
                                                          bool detected);

 // A function to notify that a speech recognition error occurred.
 // |error|: The occurred speech recognition error.
 typedef void (*SbSpeechRecognizerErrorFunction)(void* context,
                                                 SbSpeechRecognizerError error);

 // A function to notify that the recognition results are ready.
 // |results|: the list of recognition results.
 // |results_size|: the number of |results|.
 // |is_final|: indicates if the |results| is final.
 typedef void (*SbSpeechRecognizerResultsFunction)(void* context,
                                                   SbSpeechResult* results,
                                                   int results_size,
                                                   bool is_final);

 // Allows receiving notifications from the device when recognition related
 // events occur.
 //
 // The void* context is passed to every function.
 struct SbSpeechRecognizerHandler {
   // Function to notify the beginning/end of the speech.
   SbSpeechRecognizerSpeechDetectedFunction on_speech_detected;

   // Function to notify the speech error.
   SbSpeechRecognizerErrorFunction on_error;

   // Function to notify that the recognition results are available.
   SbSpeechRecognizerResultsFunction on_results;

   // This is passed to handler functions as first argument.
   void* context;
 };

 #if SB_API_VERSION >= 12
 // Returns whether the platform supports SbSpeechRecognizer.
 SB_EXPORT bool SbSpeechRecognizerIsSupported();
 #endif

 // Creates a speech recognizer with a speech recognizer handler.
 //
 // If the system has a speech recognition service available, this function
 // returns the newly created handle.
 //
 // If no speech recognition service is available on the device, this function
 // returns |kSbSpeechRecognizerInvalid|.
 //
 // |SbSpeechRecognizerCreate| does not expect the passed
 // SbSpeechRecognizerHandler structure to live after |SbSpeechRecognizerCreate|
 // is called, so the implementation must copy the contents if necessary.
 SB_EXPORT SbSpeechRecognizer
 SbSpeechRecognizerCreate(const SbSpeechRecognizerHandler* handler);

 // Starts listening to audio and recognizing speech with the specified speech
 // configuration. If |SbSpeechRecognizerStart| is called on an already
 // started speech recognizer, the implementation MUST ignore the call and return
 // false.
 //
 // Returns whether the speech recognizer is started successfully.
 SB_EXPORT bool SbSpeechRecognizerStart(
     SbSpeechRecognizer recognizer,
     const SbSpeechConfiguration* configuration);

 // Stops listening to audio and returns a result using just the audio that it
 // has already received. Once |SbSpeechRecognizerStop| is called, the
 // implementation MUST NOT collect additional audio and MUST NOT continue to
 // listen to the user. This is important for privacy reasons. If
 // |SbSpeechRecognizerStop| is called on a speech recognizer which is already
 // stopped or being stopped, the implementation MUST ignore the call.
 SB_EXPORT void SbSpeechRecognizerStop(SbSpeechRecognizer recognizer);

 // Cancels speech recognition. The speech recognizer stops listening to
 // audio and does not return any information. When |SbSpeechRecognizerCancel| is
 // called, the implementation MUST NOT collect additional audio, MUST NOT
 // continue to listen to the user, and MUST stop recognizing. This is important
 // for privacy reasons. If |SbSpeechRecognizerCancel| is called on a speech
 // recognizer which is already stopped or cancelled, the implementation MUST
 // ignore the call.
 SB_EXPORT void SbSpeechRecognizerCancel(SbSpeechRecognizer recognizer);

 // Destroys the given speech recognizer. If the speech recognizer is in the
 // started state, it is first stopped and then destroyed.
 SB_EXPORT void SbSpeechRecognizerDestroy(SbSpeechRecognizer recognizer);

 #ifdef __cplusplus
 }  // extern "C"
 #endif

 #endif  // SB_API_VERSION >= 12 ||
         // SB_HAS(SPEECH_RECOGNIZER)
         // && SB_API_VERSION >= 5

 #endif  // STARBOARD_SPEECH_RECOGNIZER_H_
	// Copyright 2017 The Cobalt Authors. All Rights Reserved.
	//
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.

	// Module Overview: Starboard speech recognizer module
	//
	// Defines a streaming speech recognizer API. It provides access to the platform
	// speech recognition service.
	//
	// Note that there can be only one speech recognizer. Attempting to create a
	// second speech recognizer without destroying the first one will result in
	// undefined behavior.
	//
	// \|SbSpeechRecognizerCreate\|, \|SbSpeechRecognizerStart\|,
	// \|SbSpeechRecognizerStop\|, \|SbSpeechRecognizerCancel\| and
	// \|SbSpeechRecognizerDestroy\| should be called from a single thread. Callbacks
	// defined in \|SbSpeechRecognizerHandler\| will happen on another thread, so
	// calls back into the SbSpeechRecognizer from the callback thread are
	// disallowed.

	#ifndef STARBOARD_SPEECH_RECOGNIZER_H_
	#define STARBOARD_SPEECH_RECOGNIZER_H_

	#include "starboard/configuration.h"
	#include "starboard/export.h"
	#include "starboard/types.h"

	#if SB_API_VERSION >= 12 \|\| SB_HAS(SPEECH_RECOGNIZER) && SB_API_VERSION >= 5

	#ifdef __cplusplus
	extern "C" {
	#endif

	// An opaque handle to an implementation-private structure that represents a
	// speech recognizer.
	typedef struct SbSpeechRecognizerPrivate* SbSpeechRecognizer;

	// Well-defined value for an invalid speech recognizer handle.
	#define kSbSpeechRecognizerInvalid ((SbSpeechRecognizer)NULL)

	// Indicates whether the given speech recognizer is valid.
	static SB_C_INLINE bool SbSpeechRecognizerIsValid(
	SbSpeechRecognizer recognizer) {
	return recognizer != kSbSpeechRecognizerInvalid;
	}

	// Indicates what has gone wrong with the recognition.
	typedef enum SbSpeechRecognizerError {
	// No speech was detected. Speech timed out.
	kSbNoSpeechError,
	// Speech input was aborted somehow.
	kSbAborted,
	// Audio capture failed.
	kSbAudioCaptureError,
	// Some network communication that was required to complete the recognition
	// failed.
	kSbNetworkError,
	// The implementation is not allowing any speech input to occur for reasons of
	// security, privacy or user preference.
	kSbNotAllowed,
	// The implementation is not allowing the application requested speech
	// service, but would allow some speech service, to be used either because the
	// implementation doesn't support the selected one or because of reasons of
	// security, privacy or user preference.
	kSbServiceNotAllowed,
	// There was an error in the speech recognition grammar or semantic tags, or
	// the grammar format or semantic tag format is supported.
	kSbBadGrammar,
	// The language was not supported.
	kSbLanguageNotSupported,
	} SbSpeechRecognizerError;

	// The recognition response that is received from the recognizer.
	typedef struct SbSpeechResult {
	// The raw words that the user spoke.
	char* transcript;
	// A numeric estimate between 0 and 1 of how confident the recognition system
	// is that the recognition is correct. A higher number means the system is
	// more confident. NaN represents an unavailable confidence score.
	float confidence;
	} SbSpeechResult;

	typedef struct SbSpeechConfiguration {
	// When the continuous value is set to false, the implementation MUST
	// return no more than one final result in response to starting recognition.
	// When the continuous attribute is set to true, the implementation MUST
	// return zero or more final results representing multiple consecutive
	// recognitions in response to starting recognition. This attribute setting
	// does not affect interim results.
	bool continuous;
	// Controls whether interim results are returned. When set to true, interim
	// results SHOULD be returned. When set to false, interim results MUST NOT be
	// returned. This value setting does not affect final results.
	bool interim_results;
	// This sets the maximum number of SbSpeechResult in
	// \|SbSpeechRecognizerOnResults\| callback.
	int max_alternatives;
	} SbSpeechConfiguration;

	// A function to notify that the user has started to speak or stops speaking.
	// \|detected\|: true if the user has started to speak, and false if the user
	// stops speaking.
	typedef void (SbSpeechRecognizerSpeechDetectedFunction)(void context,
	bool detected);

	// A function to notify that a speech recognition error occurred.
	// \|error\|: The occurred speech recognition error.
	typedef void (SbSpeechRecognizerErrorFunction)(void context,
	SbSpeechRecognizerError error);

	// A function to notify that the recognition results are ready.
	// \|results\|: the list of recognition results.
	// \|results_size\|: the number of \|results\|.
	// \|is_final\|: indicates if the \|results\| is final.
	typedef void (SbSpeechRecognizerResultsFunction)(void context,
	SbSpeechResult* results,
	int results_size,
	bool is_final);

	// Allows receiving notifications from the device when recognition related
	// events occur.
	//
	// The void* context is passed to every function.
	struct SbSpeechRecognizerHandler {
	// Function to notify the beginning/end of the speech.
	SbSpeechRecognizerSpeechDetectedFunction on_speech_detected;

	// Function to notify the speech error.
	SbSpeechRecognizerErrorFunction on_error;

	// Function to notify that the recognition results are available.
	SbSpeechRecognizerResultsFunction on_results;

	// This is passed to handler functions as first argument.
	void* context;
	};

	#if SB_API_VERSION >= 12
	// Returns whether the platform supports SbSpeechRecognizer.
	SB_EXPORT bool SbSpeechRecognizerIsSupported();
	#endif

	// Creates a speech recognizer with a speech recognizer handler.
	//
	// If the system has a speech recognition service available, this function
	// returns the newly created handle.
	//
	// If no speech recognition service is available on the device, this function
	// returns \|kSbSpeechRecognizerInvalid\|.
	//
	// \|SbSpeechRecognizerCreate\| does not expect the passed
	// SbSpeechRecognizerHandler structure to live after \|SbSpeechRecognizerCreate\|
	// is called, so the implementation must copy the contents if necessary.
	SB_EXPORT SbSpeechRecognizer
	SbSpeechRecognizerCreate(const SbSpeechRecognizerHandler* handler);

	// Starts listening to audio and recognizing speech with the specified speech
	// configuration. If \|SbSpeechRecognizerStart\| is called on an already
	// started speech recognizer, the implementation MUST ignore the call and return
	// false.
	//
	// Returns whether the speech recognizer is started successfully.
	SB_EXPORT bool SbSpeechRecognizerStart(
	SbSpeechRecognizer recognizer,
	const SbSpeechConfiguration* configuration);

	// Stops listening to audio and returns a result using just the audio that it
	// has already received. Once \|SbSpeechRecognizerStop\| is called, the
	// implementation MUST NOT collect additional audio and MUST NOT continue to
	// listen to the user. This is important for privacy reasons. If
	// \|SbSpeechRecognizerStop\| is called on a speech recognizer which is already
	// stopped or being stopped, the implementation MUST ignore the call.
	SB_EXPORT void SbSpeechRecognizerStop(SbSpeechRecognizer recognizer);

	// Cancels speech recognition. The speech recognizer stops listening to
	// audio and does not return any information. When \|SbSpeechRecognizerCancel\| is
	// called, the implementation MUST NOT collect additional audio, MUST NOT
	// continue to listen to the user, and MUST stop recognizing. This is important
	// for privacy reasons. If \|SbSpeechRecognizerCancel\| is called on a speech
	// recognizer which is already stopped or cancelled, the implementation MUST
	// ignore the call.
	SB_EXPORT void SbSpeechRecognizerCancel(SbSpeechRecognizer recognizer);

	// Destroys the given speech recognizer. If the speech recognizer is in the
	// started state, it is first stopped and then destroyed.
	SB_EXPORT void SbSpeechRecognizerDestroy(SbSpeechRecognizer recognizer);

	#ifdef __cplusplus
	} // extern "C"
	#endif

	#endif // SB_API_VERSION >= 12 \|\|
	// SB_HAS(SPEECH_RECOGNIZER)
	// && SB_API_VERSION >= 5

	#endif // STARBOARD_SPEECH_RECOGNIZER_H_