// chrome/browser/speech/extension_api/tts_extension_api.cc - chromium/src.git - Git at Google

 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "chrome/browser/speech/extension_api/tts_extension_api.h"

 #include <stddef.h>

 #include <memory>
 #include <string>
 #include <utility>

 #include "base/lazy_instance.h"
 #include "base/metrics/histogram_macros.h"
 #include "base/metrics/user_metrics.h"
 #include "base/values.h"
 #include "build/chromeos_buildflags.h"
 #include "chrome/browser/profiles/profile.h"
 #include "chrome/browser/speech/extension_api/tts_engine_extension_api.h"
 #include "chrome/browser/speech/extension_api/tts_extension_api_constants.h"
 #include "content/public/browser/tts_controller.h"
 #include "extensions/browser/event_router.h"
 #include "extensions/browser/extension_function_registry.h"
 #include "extensions/browser/extension_host.h"
 #include "extensions/browser/process_manager.h"
 #include "third_party/blink/public/mojom/speech/speech_synthesis.mojom.h"
 #include "ui/base/l10n/l10n_util.h"

 #if BUILDFLAG(IS_CHROMEOS_ASH)
 #include "chrome/browser/speech/extension_api/tts_engine_extension_observer_chromeos.h"
 #include "chrome/common/extensions/extension_constants.h"
 #endif  // BUILDFLAG(IS_CHROMEOS_ASH)

 namespace constants = tts_extension_api_constants;

 #if BUILDFLAG(IS_CHROMEOS_ASH)
 namespace {

 // ChromeOS source that triggered text-to-speech utterance.
 //
 // These values are logged to UMA. Entries should not be renumbered and
 // numeric values should never be reused. Please keep in sync with
 // "TextToSpeechSource" in src/tools/metrics/histograms/enums.xml.
 enum class UMATextToSpeechSource {
   // Recorded when the caller's source URL host matches neither of the
   // extension IDs checked in TtsSpeakFunction::Run().
   kOther = 0,
   // Recorded when the source URL host equals
   // extension_misc::kChromeVoxExtensionId.
   kChromeVox = 1,
   // Recorded when the source URL host equals
   // extension_misc::kSelectToSpeakExtensionId.
   kSelectToSpeak = 2,

   // Alias of the highest real entry. NOTE(review): presumably consumed by
   // UMA_HISTOGRAM_ENUMERATION as the histogram bound - update it whenever a
   // new entry is appended.
   kMaxValue = kSelectToSpeak,
 };

 }  // namespace
 #endif  // BUILDFLAG(IS_CHROMEOS_ASH)

 namespace events {
 // Event name passed to extensions::Event when TtsExtensionEventHandler
 // dispatches a TTS event to the extension that requested the utterance.
 const char kOnEvent[] = "tts.onEvent";
 }  // namespace events

 // Returns the extension-API name constant for |event_type|.
 //
 // Every known content::TtsEventType maps to its matching kEventType* string
 // from tts_extension_api_constants. Any other value trips NOTREACHED() and
 // yields the error name.
 const char* TtsEventTypeToString(content::TtsEventType event_type) {
   // Start from the error name: it is both the TTS_EVENT_ERROR mapping and the
   // value returned for unexpected enum values.
   const char* event_name = constants::kEventTypeError;
   switch (event_type) {
     case content::TTS_EVENT_START:
       event_name = constants::kEventTypeStart;
       break;
     case content::TTS_EVENT_END:
       event_name = constants::kEventTypeEnd;
       break;
     case content::TTS_EVENT_WORD:
       event_name = constants::kEventTypeWord;
       break;
     case content::TTS_EVENT_SENTENCE:
       event_name = constants::kEventTypeSentence;
       break;
     case content::TTS_EVENT_MARKER:
       event_name = constants::kEventTypeMarker;
       break;
     case content::TTS_EVENT_INTERRUPTED:
       event_name = constants::kEventTypeInterrupted;
       break;
     case content::TTS_EVENT_CANCELLED:
       event_name = constants::kEventTypeCancelled;
       break;
     case content::TTS_EVENT_ERROR:
       // Already holds the error name.
       break;
     case content::TTS_EVENT_PAUSE:
       event_name = constants::kEventTypePause;
       break;
     case content::TTS_EVENT_RESUME:
       event_name = constants::kEventTypeResume;
       break;
     default:
       NOTREACHED();
       break;
   }
   return event_name;
 }

 // Parses an extension-API event-type name into a content::TtsEventType.
 //
 // |str| is compared against each kEventType* constant in turn. A string that
 // matches none of them trips NOTREACHED() and is reported as TTS_EVENT_ERROR.
 content::TtsEventType TtsEventTypeFromString(const std::string& str) {
   struct EventTypeName {
     const char* name;
     content::TtsEventType type;
   };
   // Checked in this order; the first matching name wins.
   static const EventTypeName kEventTypeNames[] = {
       {constants::kEventTypeStart, content::TTS_EVENT_START},
       {constants::kEventTypeEnd, content::TTS_EVENT_END},
       {constants::kEventTypeWord, content::TTS_EVENT_WORD},
       {constants::kEventTypeSentence, content::TTS_EVENT_SENTENCE},
       {constants::kEventTypeMarker, content::TTS_EVENT_MARKER},
       {constants::kEventTypeInterrupted, content::TTS_EVENT_INTERRUPTED},
       {constants::kEventTypeCancelled, content::TTS_EVENT_CANCELLED},
       {constants::kEventTypeError, content::TTS_EVENT_ERROR},
       {constants::kEventTypePause, content::TTS_EVENT_PAUSE},
       {constants::kEventTypeResume, content::TTS_EVENT_RESUME},
   };

   for (const EventTypeName& entry : kEventTypeNames) {
     if (str == entry.name)
       return entry.type;
   }

   NOTREACHED();
   return content::TTS_EVENT_ERROR;
 }

 namespace extensions {

 // Event delegate that relays TTS events for a single utterance back to the
 // extension that requested it.
 //
 // TtsSpeakFunction::Run() allocates one instance per utterance with a raw
 // |new| and hands it to the utterance as its event delegate. Nothing else
 // owns the handler: OnTtsEvent() deletes |this| as soon as the utterance
 // reports IsFinished().
 class TtsExtensionEventHandler : public content::UtteranceEventDelegate {
  public:
   // |src_extension_id| is the ID of the extension that should receive the
   // dispatched events.
   explicit TtsExtensionEventHandler(const std::string& src_extension_id);

   // content::UtteranceEventDelegate implementation. May delete |this|; do not
   // touch the handler after calling it.
   void OnTtsEvent(content::TtsUtterance* utterance,
                   content::TtsEventType event_type,
                   int char_index,
                   int length,
                   const std::string& error_message) override;

  private:
   // The extension ID of the extension that called speak() and should
   // receive events.
   std::string src_extension_id_;
 };

 // Remembers which extension should receive events for the utterance this
 // handler is attached to.
 TtsExtensionEventHandler::TtsExtensionEventHandler(
     const std::string& src_extension_id)
     : src_extension_id_(src_extension_id) {}

 // Forwards a TTS event for |utterance| to the extension that requested it.
 //
 // Nothing is dispatched when the utterance has a negative source ID, or when
 // the utterance lists desired event types and |event_type| is not among them.
 // Otherwise a "tts.onEvent" extension event is sent whose single argument is
 // a dictionary describing the event. |char_index| and |length| are included
 // only when non-negative; |error_message| only for TTS_EVENT_ERROR.
 //
 // In every case the handler deletes itself once the utterance reports that it
 // is finished, so |this| must not be used after this call returns.
 void TtsExtensionEventHandler::OnTtsEvent(content::TtsUtterance* utterance,
                                           content::TtsEventType event_type,
                                           int char_index,
                                           int length,
                                           const std::string& error_message) {
   // Decide up front whether this event should reach the extension.
   bool should_dispatch = utterance->GetSrcId() >= 0;
   if (should_dispatch) {
     const std::set<content::TtsEventType>& wanted_types =
         utterance->GetDesiredEventTypes();
     // An empty set means the caller did not ask for filtering.
     should_dispatch =
         wanted_types.empty() || wanted_types.count(event_type) != 0;
   }

   if (should_dispatch) {
     const char* const type_name = TtsEventTypeToString(event_type);

     // Build the dictionary handed to the extension's event listener.
     auto details = std::make_unique<base::DictionaryValue>();
     if (char_index >= 0)
       details->SetInteger(constants::kCharIndexKey, char_index);
     if (length >= 0)
       details->SetInteger(constants::kLengthKey, length);
     details->SetString(constants::kEventTypeKey, type_name);
     if (event_type == content::TTS_EVENT_ERROR)
       details->SetString(constants::kErrorMessageKey, error_message);
     details->SetInteger(constants::kSrcIdKey, utterance->GetSrcId());
     details->SetBoolean(constants::kIsFinalEventKey, utterance->IsFinished());

     auto arguments = std::make_unique<base::ListValue>();
     arguments->Append(std::move(details));

     auto event = std::make_unique<extensions::Event>(
         ::extensions::events::TTS_ON_EVENT, ::events::kOnEvent,
         std::move(arguments), utterance->GetBrowserContext());
     event->event_url = utterance->GetSrcUrl();

     extensions::EventRouter* const router =
         extensions::EventRouter::Get(utterance->GetBrowserContext());
     router->DispatchEventToExtension(src_extension_id_, std::move(event));
   }

   // The handler owns itself; a finished utterance sends no further events.
   if (utterance->IsFinished())
     delete this;
 }

 // Extension function that validates a speak request and queues the utterance.
 //
 // Arguments: a required string at index 0 (the text to speak) and an optional
 // dictionary of options at index 1. Options of the wrong type fail
 // EXTENSION_FUNCTION_VALIDATE; out-of-range values produce an error response:
 //   - text.size() greater than 32768        -> kErrorUtteranceTooLong
 //   - lang rejected by IsValidLocaleSyntax() -> kErrorInvalidLang
 //   - rate outside [0.1, 10.0]               -> kErrorInvalidRate
 //   - pitch outside [0.0, 2.0]               -> kErrorInvalidPitch
 //   - volume outside [0.0, 1.0]              -> kErrorInvalidVolume
 //
 // Once validation succeeds the success response is sent immediately, and only
 // then is the utterance built and handed to the TtsController, so the callback
 // response precedes any TTS events.
 ExtensionFunction::ResponseAction TtsSpeakFunction::Run() {
   // Largest utterance text accepted, as measured by std::string::size().
   constexpr size_t kMaxUtteranceLength = 32768;

   std::string text;
   EXTENSION_FUNCTION_VALIDATE(args_->GetString(0, &text));
   if (text.size() > kMaxUtteranceLength) {
     return RespondNow(Error(constants::kErrorUtteranceTooLong));
   }

   // Work on a private copy of the caller's options (or an empty dictionary
   // when none were supplied); it is passed to the utterance via SetOptions().
   auto options = std::make_unique<base::DictionaryValue>();
   if (args_->GetSize() >= 2) {
     base::DictionaryValue* temp_options = nullptr;
     if (args_->GetDictionary(1, &temp_options))
       options.reset(temp_options->DeepCopy());
   }

   std::string voice_name;
   if (options->FindKey(constants::kVoiceNameKey)) {
     EXTENSION_FUNCTION_VALIDATE(
         options->GetString(constants::kVoiceNameKey, &voice_name));
   }

   std::string lang;
   if (options->FindKey(constants::kLangKey)) {
     EXTENSION_FUNCTION_VALIDATE(
         options->GetString(constants::kLangKey, &lang));
   }
   if (!lang.empty() && !l10n_util::IsValidLocaleSyntax(lang)) {
     return RespondNow(Error(constants::kErrorInvalidLang));
   }

   // TODO(katie): Remove this after M73. This is just used to track how the
   // gender deprecation is progressing.
   std::string gender_str;
   if (options->FindKey(constants::kGenderKey)) {
     EXTENSION_FUNCTION_VALIDATE(
         options->GetString(constants::kGenderKey, &gender_str));
   }
   UMA_HISTOGRAM_BOOLEAN("TextToSpeech.Utterance.HasGender",
                         !gender_str.empty());

   // Rate, pitch and volume keep the "not set" sentinel unless the caller
   // supplied a value, in which case the value must fall inside its range.
   double rate = blink::mojom::kSpeechSynthesisDoublePrefNotSet;
   if (options->FindKey(constants::kRateKey)) {
     EXTENSION_FUNCTION_VALIDATE(
         options->GetDouble(constants::kRateKey, &rate));
     if (rate < 0.1 || rate > 10.0) {
       return RespondNow(Error(constants::kErrorInvalidRate));
     }
   }

   double pitch = blink::mojom::kSpeechSynthesisDoublePrefNotSet;
   if (options->FindKey(constants::kPitchKey)) {
     EXTENSION_FUNCTION_VALIDATE(
         options->GetDouble(constants::kPitchKey, &pitch));
     if (pitch < 0.0 || pitch > 2.0) {
       return RespondNow(Error(constants::kErrorInvalidPitch));
     }
   }

   double volume = blink::mojom::kSpeechSynthesisDoublePrefNotSet;
   if (options->FindKey(constants::kVolumeKey)) {
     EXTENSION_FUNCTION_VALIDATE(
         options->GetDouble(constants::kVolumeKey, &volume));
     if (volume < 0.0 || volume > 1.0) {
       return RespondNow(Error(constants::kErrorInvalidVolume));
     }
   }

   bool can_enqueue = false;
   if (options->FindKey(constants::kEnqueueKey)) {
     EXTENSION_FUNCTION_VALIDATE(
         options->GetBoolean(constants::kEnqueueKey, &can_enqueue));
   }

   // Converts every string entry of |names| to its TtsEventType. Entries that
   // are not strings are skipped.
   const auto to_event_types = [](const base::ListValue& names) {
     std::set<content::TtsEventType> event_types;
     for (size_t i = 0; i < names.GetSize(); ++i) {
       std::string event_type;
       if (names.GetString(i, &event_type))
         event_types.insert(TtsEventTypeFromString(event_type));
     }
     return event_types;
   };

   std::set<content::TtsEventType> required_event_types;
   if (options->FindKey(constants::kRequiredEventTypesKey)) {
     base::ListValue* list = nullptr;
     EXTENSION_FUNCTION_VALIDATE(
         options->GetList(constants::kRequiredEventTypesKey, &list));
     required_event_types = to_event_types(*list);
   }

   std::set<content::TtsEventType> desired_event_types;
   if (options->FindKey(constants::kDesiredEventTypesKey)) {
     base::ListValue* list = nullptr;
     EXTENSION_FUNCTION_VALIDATE(
         options->GetList(constants::kDesiredEventTypesKey, &list));
     desired_event_types = to_event_types(*list);
   }

   std::string voice_extension_id;
   if (options->FindKey(constants::kExtensionIdKey)) {
     EXTENSION_FUNCTION_VALIDATE(
         options->GetString(constants::kExtensionIdKey, &voice_extension_id));
   }

   // A negative source ID makes TtsExtensionEventHandler suppress all events
   // for the utterance, so -1 is the default when the caller gave none.
   int src_id = -1;
   if (options->FindKey(constants::kSrcIdKey)) {
     EXTENSION_FUNCTION_VALIDATE(
         options->GetInteger(constants::kSrcIdKey, &src_id));
   }

 #if BUILDFLAG(IS_CHROMEOS_ASH)
   // Record which component asked for speech, keyed off the source URL host.
   UMATextToSpeechSource source = UMATextToSpeechSource::kOther;
   const std::string host = source_url().host();
   if (host == extension_misc::kSelectToSpeakExtensionId) {
     source = UMATextToSpeechSource::kSelectToSpeak;
   } else if (host == extension_misc::kChromeVoxExtensionId) {
     source = UMATextToSpeechSource::kChromeVox;
   }
   UMA_HISTOGRAM_ENUMERATION("TextToSpeech.Utterance.Source", source);
 #endif  // BUILDFLAG(IS_CHROMEOS_ASH)

   // If we got this far, the arguments were all in the valid format, so
   // send the success response to the callback now - this ensures that
   // the callback response always arrives before events, which makes
   // the behavior more predictable and easier to write unit tests for too.
   Respond(NoArguments());

   // Prefer creating the utterance from the extension's background host
   // contents; fall back to the browser context when there is none.
   std::unique_ptr<content::TtsUtterance> utterance;
   if (extension()) {
     extensions::ExtensionHost* host =
         extensions::ProcessManager::Get(browser_context())
             ->GetBackgroundHostForExtension(extension()->id());

     if (host && host->host_contents())
       utterance = content::TtsUtterance::Create(host->host_contents());
   }

   if (!utterance)
     utterance = content::TtsUtterance::Create(browser_context());

   utterance->SetText(text);
   utterance->SetVoiceName(voice_name);
   utterance->SetSrcId(src_id);
   utterance->SetSrcUrl(source_url());
   utterance->SetLang(lang);
   utterance->SetContinuousParameters(rate, pitch, volume);
   utterance->SetShouldClearQueue(!can_enqueue);
   utterance->SetRequiredEventTypes(required_event_types);
   utterance->SetDesiredEventTypes(desired_event_types);
   utterance->SetEngineId(voice_extension_id);
   utterance->SetOptions(options.get());
   // The handler is intentionally a raw allocation: it deletes itself from
   // OnTtsEvent() once the utterance is finished.
   if (extension())
     utterance->SetEventDelegate(new TtsExtensionEventHandler(extension_id()));

   content::TtsController* controller = content::TtsController::GetInstance();
   controller->SpeakOrEnqueue(std::move(utterance));
   return AlreadyResponded();
 }

 // Passes the caller's source URL to TtsController::Stop() and then responds
 // with no arguments.
 ExtensionFunction::ResponseAction TtsStopSpeakingFunction::Run() {
   content::TtsController* const controller =
       content::TtsController::GetInstance();
   controller->Stop(source_url());
   return RespondNow(NoArguments());
 }

 // Calls TtsController::Pause() and then responds with no arguments.
 ExtensionFunction::ResponseAction TtsPauseFunction::Run() {
   content::TtsController* const controller =
       content::TtsController::GetInstance();
   controller->Pause();
   return RespondNow(NoArguments());
 }

 // Calls TtsController::Resume() and then responds with no arguments.
 ExtensionFunction::ResponseAction TtsResumeFunction::Run() {
   content::TtsController* const controller =
       content::TtsController::GetInstance();
   controller->Resume();
   return RespondNow(NoArguments());
 }

 // Responds with a single value: the result of TtsController::IsSpeaking().
 ExtensionFunction::ResponseAction TtsIsSpeakingFunction::Run() {
   const bool is_speaking =
       content::TtsController::GetInstance()->IsSpeaking();
   return RespondNow(OneArgument(base::Value(is_speaking)));
 }

 // Responds with a list describing every voice the TtsController reports for
 // this browser context.
 //
 // Each list entry is a dictionary holding the voice name, the remote flag and
 // the list of supported event-type names; the language and engine extension
 // ID are included only when non-empty.
 ExtensionFunction::ResponseAction TtsGetVoicesFunction::Run() {
   std::vector<content::VoiceData> available_voices;
   content::TtsController::GetInstance()->GetVoices(browser_context(),
                                                    &available_voices);

   auto voice_list = std::make_unique<base::ListValue>();
   for (const content::VoiceData& voice : available_voices) {
     auto voice_dict = std::make_unique<base::DictionaryValue>();
     voice_dict->SetString(constants::kVoiceNameKey, voice.name);
     voice_dict->SetBoolean(constants::kRemoteKey, voice.remote);
     if (!voice.lang.empty())
       voice_dict->SetString(constants::kLangKey, voice.lang);
     if (!voice.engine_id.empty())
       voice_dict->SetString(constants::kExtensionIdKey, voice.engine_id);

     // Translate the voice's supported events into their API names.
     auto supported_events = std::make_unique<base::ListValue>();
     for (const content::TtsEventType event_type : voice.events) {
       const char* event_name = TtsEventTypeToString(event_type);
       supported_events->AppendString(event_name);
     }
     voice_dict->Set(constants::kEventTypesKey, std::move(supported_events));

     voice_list->Append(std::move(voice_dict));
   }

   return RespondNow(
       OneArgument(base::Value::FromUniquePtrValue(std::move(voice_list))));
 }

 // Registers the TTS and TTS-engine extension functions with the global
 // ExtensionFunctionRegistry. On ChromeOS Ash builds it additionally requests
 // the TtsEngineExtensionObserverChromeOS instance for |context|'s profile.
 TtsAPI::TtsAPI(content::BrowserContext* context) {
   ExtensionFunctionRegistry& functions =
       ExtensionFunctionRegistry::GetInstance();

   // Engine-side functions (ExtensionTtsEngine*).
   functions.RegisterFunction<ExtensionTtsEngineUpdateVoicesFunction>();
   functions.RegisterFunction<ExtensionTtsEngineSendTtsEventFunction>();
   functions.RegisterFunction<ExtensionTtsEngineSendTtsAudioFunction>();

   // Functions implemented in this file.
   functions.RegisterFunction<TtsGetVoicesFunction>();
   functions.RegisterFunction<TtsIsSpeakingFunction>();
   functions.RegisterFunction<TtsSpeakFunction>();
   functions.RegisterFunction<TtsStopSpeakingFunction>();
   functions.RegisterFunction<TtsPauseFunction>();
   functions.RegisterFunction<TtsResumeFunction>();

 #if BUILDFLAG(IS_CHROMEOS_ASH)
   // Ensure we're observing newly added engines for the given context.
   TtsEngineExtensionObserverChromeOS::GetInstance(
       Profile::FromBrowserContext(context));
 #endif  // BUILDFLAG(IS_CHROMEOS_ASH)
 }

 // Nothing to release beyond what the members clean up themselves.
 TtsAPI::~TtsAPI() = default;

 // File-local, lazily constructed BrowserContextKeyedAPIFactory for TtsAPI.
 // Declared with the DestructorAtExit LazyInstance variant.
 static base::LazyInstance<
     BrowserContextKeyedAPIFactory<TtsAPI>>::DestructorAtExit g_factory =
     LAZY_INSTANCE_INITIALIZER;

 // Returns a pointer to the factory held by |g_factory|.
 BrowserContextKeyedAPIFactory<TtsAPI>* TtsAPI::GetFactoryInstance() {
   return g_factory.Pointer();
 }

 }  // namespace extensions
	// Copyright (c) 2012 The Chromium Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#include "chrome/browser/speech/extension_api/tts_extension_api.h"

	#include <stddef.h>

	#include <memory>
	#include <string>
	#include <utility>

	#include "base/lazy_instance.h"
	#include "base/metrics/histogram_macros.h"
	#include "base/metrics/user_metrics.h"
	#include "base/values.h"
	#include "build/chromeos_buildflags.h"
	#include "chrome/browser/profiles/profile.h"
	#include "chrome/browser/speech/extension_api/tts_engine_extension_api.h"
	#include "chrome/browser/speech/extension_api/tts_extension_api_constants.h"
	#include "content/public/browser/tts_controller.h"
	#include "extensions/browser/event_router.h"
	#include "extensions/browser/extension_function_registry.h"
	#include "extensions/browser/extension_host.h"
	#include "extensions/browser/process_manager.h"
	#include "third_party/blink/public/mojom/speech/speech_synthesis.mojom.h"
	#include "ui/base/l10n/l10n_util.h"

	#if BUILDFLAG(IS_CHROMEOS_ASH)
	#include "chrome/browser/speech/extension_api/tts_engine_extension_observer_chromeos.h"
	#include "chrome/common/extensions/extension_constants.h"
	#endif // BUILDFLAG(IS_CHROMEOS_ASH)

	namespace constants = tts_extension_api_constants;

	#if BUILDFLAG(IS_CHROMEOS_ASH)
	namespace {

	// ChromeOS source that triggered text-to-speech utterance.
	//
	// These values are logged to UMA. Entries should not be renumbered and
	// numeric values should never be reused. Please keep in sync with
	// "TextToSpeechSource" in src/tools/metrics/histograms/enums.xml.
	enum class UMATextToSpeechSource {
	// Recorded when the caller's source URL host matches neither of the
	// extension IDs checked in TtsSpeakFunction::Run().
	kOther = 0,
	// Recorded when the source URL host equals
	// extension_misc::kChromeVoxExtensionId.
	kChromeVox = 1,
	// Recorded when the source URL host equals
	// extension_misc::kSelectToSpeakExtensionId.
	kSelectToSpeak = 2,

	// Alias of the highest real entry. NOTE(review): presumably consumed by
	// UMA_HISTOGRAM_ENUMERATION as the histogram bound - update it whenever a
	// new entry is appended.
	kMaxValue = kSelectToSpeak,
	};

	} // namespace
	#endif // BUILDFLAG(IS_CHROMEOS_ASH)

	namespace events {
	// Event name passed to extensions::Event when TtsExtensionEventHandler
	// dispatches a TTS event to the extension that requested the utterance.
	const char kOnEvent[] = "tts.onEvent";
	} // namespace events

	// Returns the extension-API name constant for |event_type|.
	//
	// Every known content::TtsEventType maps to its matching kEventType* string
	// from tts_extension_api_constants. Any other value trips NOTREACHED() and
	// yields the error name.
	const char* TtsEventTypeToString(content::TtsEventType event_type) {
	  // Start from the error name: it is both the TTS_EVENT_ERROR mapping and the
	  // value returned for unexpected enum values.
	  const char* event_name = constants::kEventTypeError;
	  switch (event_type) {
	    case content::TTS_EVENT_START:
	      event_name = constants::kEventTypeStart;
	      break;
	    case content::TTS_EVENT_END:
	      event_name = constants::kEventTypeEnd;
	      break;
	    case content::TTS_EVENT_WORD:
	      event_name = constants::kEventTypeWord;
	      break;
	    case content::TTS_EVENT_SENTENCE:
	      event_name = constants::kEventTypeSentence;
	      break;
	    case content::TTS_EVENT_MARKER:
	      event_name = constants::kEventTypeMarker;
	      break;
	    case content::TTS_EVENT_INTERRUPTED:
	      event_name = constants::kEventTypeInterrupted;
	      break;
	    case content::TTS_EVENT_CANCELLED:
	      event_name = constants::kEventTypeCancelled;
	      break;
	    case content::TTS_EVENT_ERROR:
	      // Already holds the error name.
	      break;
	    case content::TTS_EVENT_PAUSE:
	      event_name = constants::kEventTypePause;
	      break;
	    case content::TTS_EVENT_RESUME:
	      event_name = constants::kEventTypeResume;
	      break;
	    default:
	      NOTREACHED();
	      break;
	  }
	  return event_name;
	}

	// Parses an extension-API event-type name into a content::TtsEventType.
	//
	// |str| is compared against each kEventType* constant in turn. A string that
	// matches none of them trips NOTREACHED() and is reported as TTS_EVENT_ERROR.
	content::TtsEventType TtsEventTypeFromString(const std::string& str) {
	  struct EventTypeName {
	    const char* name;
	    content::TtsEventType type;
	  };
	  // Checked in this order; the first matching name wins.
	  static const EventTypeName kEventTypeNames[] = {
	      {constants::kEventTypeStart, content::TTS_EVENT_START},
	      {constants::kEventTypeEnd, content::TTS_EVENT_END},
	      {constants::kEventTypeWord, content::TTS_EVENT_WORD},
	      {constants::kEventTypeSentence, content::TTS_EVENT_SENTENCE},
	      {constants::kEventTypeMarker, content::TTS_EVENT_MARKER},
	      {constants::kEventTypeInterrupted, content::TTS_EVENT_INTERRUPTED},
	      {constants::kEventTypeCancelled, content::TTS_EVENT_CANCELLED},
	      {constants::kEventTypeError, content::TTS_EVENT_ERROR},
	      {constants::kEventTypePause, content::TTS_EVENT_PAUSE},
	      {constants::kEventTypeResume, content::TTS_EVENT_RESUME},
	  };

	  for (const EventTypeName& entry : kEventTypeNames) {
	    if (str == entry.name)
	      return entry.type;
	  }

	  NOTREACHED();
	  return content::TTS_EVENT_ERROR;
	}

	namespace extensions {

	// Event delegate that relays TTS events for a single utterance back to the
	// extension that requested it.
	//
	// TtsSpeakFunction::Run() allocates one instance per utterance with a raw
	// |new| and hands it to the utterance as its event delegate. Nothing else
	// owns the handler: OnTtsEvent() deletes |this| as soon as the utterance
	// reports IsFinished().
	class TtsExtensionEventHandler : public content::UtteranceEventDelegate {
	public:
	// |src_extension_id| is the ID of the extension that should receive the
	// dispatched events.
	explicit TtsExtensionEventHandler(const std::string& src_extension_id);

	// content::UtteranceEventDelegate implementation. May delete |this|; do not
	// touch the handler after calling it.
	void OnTtsEvent(content::TtsUtterance* utterance,
	content::TtsEventType event_type,
	int char_index,
	int length,
	const std::string& error_message) override;

	private:
	// The extension ID of the extension that called speak() and should
	// receive events.
	std::string src_extension_id_;
	};

	// Remembers which extension should receive events for the utterance this
	// handler is attached to.
	TtsExtensionEventHandler::TtsExtensionEventHandler(
	    const std::string& src_extension_id)
	    : src_extension_id_(src_extension_id) {}

	// Forwards a TTS event for |utterance| to the extension that requested it.
	//
	// Nothing is dispatched when the utterance has a negative source ID, or when
	// the utterance lists desired event types and |event_type| is not among them.
	// Otherwise a "tts.onEvent" extension event is sent whose single argument is
	// a dictionary describing the event. |char_index| and |length| are included
	// only when non-negative; |error_message| only for TTS_EVENT_ERROR.
	//
	// In every case the handler deletes itself once the utterance reports that it
	// is finished, so |this| must not be used after this call returns.
	void TtsExtensionEventHandler::OnTtsEvent(content::TtsUtterance* utterance,
	                                          content::TtsEventType event_type,
	                                          int char_index,
	                                          int length,
	                                          const std::string& error_message) {
	  // Decide up front whether this event should reach the extension.
	  bool should_dispatch = utterance->GetSrcId() >= 0;
	  if (should_dispatch) {
	    const std::set<content::TtsEventType>& wanted_types =
	        utterance->GetDesiredEventTypes();
	    // An empty set means the caller did not ask for filtering.
	    should_dispatch =
	        wanted_types.empty() || wanted_types.count(event_type) != 0;
	  }

	  if (should_dispatch) {
	    const char* const type_name = TtsEventTypeToString(event_type);

	    // Build the dictionary handed to the extension's event listener.
	    auto details = std::make_unique<base::DictionaryValue>();
	    if (char_index >= 0)
	      details->SetInteger(constants::kCharIndexKey, char_index);
	    if (length >= 0)
	      details->SetInteger(constants::kLengthKey, length);
	    details->SetString(constants::kEventTypeKey, type_name);
	    if (event_type == content::TTS_EVENT_ERROR)
	      details->SetString(constants::kErrorMessageKey, error_message);
	    details->SetInteger(constants::kSrcIdKey, utterance->GetSrcId());
	    details->SetBoolean(constants::kIsFinalEventKey, utterance->IsFinished());

	    auto arguments = std::make_unique<base::ListValue>();
	    arguments->Append(std::move(details));

	    auto event = std::make_unique<extensions::Event>(
	        ::extensions::events::TTS_ON_EVENT, ::events::kOnEvent,
	        std::move(arguments), utterance->GetBrowserContext());
	    event->event_url = utterance->GetSrcUrl();

	    extensions::EventRouter* const router =
	        extensions::EventRouter::Get(utterance->GetBrowserContext());
	    router->DispatchEventToExtension(src_extension_id_, std::move(event));
	  }

	  // The handler owns itself; a finished utterance sends no further events.
	  if (utterance->IsFinished())
	    delete this;
	}

	// Extension function that validates a speak request and queues the utterance.
	//
	// Arguments: a required string at index 0 (the text to speak) and an optional
	// dictionary of options at index 1. Options of the wrong type fail
	// EXTENSION_FUNCTION_VALIDATE; out-of-range values produce an error response:
	//   - text.size() greater than 32768        -> kErrorUtteranceTooLong
	//   - lang rejected by IsValidLocaleSyntax() -> kErrorInvalidLang
	//   - rate outside [0.1, 10.0]               -> kErrorInvalidRate
	//   - pitch outside [0.0, 2.0]               -> kErrorInvalidPitch
	//   - volume outside [0.0, 1.0]              -> kErrorInvalidVolume
	//
	// Once validation succeeds the success response is sent immediately, and only
	// then is the utterance built and handed to the TtsController, so the callback
	// response precedes any TTS events.
	ExtensionFunction::ResponseAction TtsSpeakFunction::Run() {
	  // Largest utterance text accepted, as measured by std::string::size().
	  constexpr size_t kMaxUtteranceLength = 32768;

	  std::string text;
	  EXTENSION_FUNCTION_VALIDATE(args_->GetString(0, &text));
	  if (text.size() > kMaxUtteranceLength) {
	    return RespondNow(Error(constants::kErrorUtteranceTooLong));
	  }

	  // Work on a private copy of the caller's options (or an empty dictionary
	  // when none were supplied); it is passed to the utterance via SetOptions().
	  auto options = std::make_unique<base::DictionaryValue>();
	  if (args_->GetSize() >= 2) {
	    base::DictionaryValue* temp_options = nullptr;
	    if (args_->GetDictionary(1, &temp_options))
	      options.reset(temp_options->DeepCopy());
	  }

	  std::string voice_name;
	  if (options->FindKey(constants::kVoiceNameKey)) {
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetString(constants::kVoiceNameKey, &voice_name));
	  }

	  std::string lang;
	  if (options->FindKey(constants::kLangKey)) {
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetString(constants::kLangKey, &lang));
	  }
	  if (!lang.empty() && !l10n_util::IsValidLocaleSyntax(lang)) {
	    return RespondNow(Error(constants::kErrorInvalidLang));
	  }

	  // TODO(katie): Remove this after M73. This is just used to track how the
	  // gender deprecation is progressing.
	  std::string gender_str;
	  if (options->FindKey(constants::kGenderKey)) {
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetString(constants::kGenderKey, &gender_str));
	  }
	  UMA_HISTOGRAM_BOOLEAN("TextToSpeech.Utterance.HasGender",
	                        !gender_str.empty());

	  // Rate, pitch and volume keep the "not set" sentinel unless the caller
	  // supplied a value, in which case the value must fall inside its range.
	  double rate = blink::mojom::kSpeechSynthesisDoublePrefNotSet;
	  if (options->FindKey(constants::kRateKey)) {
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetDouble(constants::kRateKey, &rate));
	    if (rate < 0.1 || rate > 10.0) {
	      return RespondNow(Error(constants::kErrorInvalidRate));
	    }
	  }

	  double pitch = blink::mojom::kSpeechSynthesisDoublePrefNotSet;
	  if (options->FindKey(constants::kPitchKey)) {
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetDouble(constants::kPitchKey, &pitch));
	    if (pitch < 0.0 || pitch > 2.0) {
	      return RespondNow(Error(constants::kErrorInvalidPitch));
	    }
	  }

	  double volume = blink::mojom::kSpeechSynthesisDoublePrefNotSet;
	  if (options->FindKey(constants::kVolumeKey)) {
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetDouble(constants::kVolumeKey, &volume));
	    if (volume < 0.0 || volume > 1.0) {
	      return RespondNow(Error(constants::kErrorInvalidVolume));
	    }
	  }

	  bool can_enqueue = false;
	  if (options->FindKey(constants::kEnqueueKey)) {
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetBoolean(constants::kEnqueueKey, &can_enqueue));
	  }

	  // Converts every string entry of |names| to its TtsEventType. Entries that
	  // are not strings are skipped.
	  const auto to_event_types = [](const base::ListValue& names) {
	    std::set<content::TtsEventType> event_types;
	    for (size_t i = 0; i < names.GetSize(); ++i) {
	      std::string event_type;
	      if (names.GetString(i, &event_type))
	        event_types.insert(TtsEventTypeFromString(event_type));
	    }
	    return event_types;
	  };

	  std::set<content::TtsEventType> required_event_types;
	  if (options->FindKey(constants::kRequiredEventTypesKey)) {
	    base::ListValue* list = nullptr;
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetList(constants::kRequiredEventTypesKey, &list));
	    required_event_types = to_event_types(*list);
	  }

	  std::set<content::TtsEventType> desired_event_types;
	  if (options->FindKey(constants::kDesiredEventTypesKey)) {
	    base::ListValue* list = nullptr;
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetList(constants::kDesiredEventTypesKey, &list));
	    desired_event_types = to_event_types(*list);
	  }

	  std::string voice_extension_id;
	  if (options->FindKey(constants::kExtensionIdKey)) {
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetString(constants::kExtensionIdKey, &voice_extension_id));
	  }

	  // A negative source ID makes TtsExtensionEventHandler suppress all events
	  // for the utterance, so -1 is the default when the caller gave none.
	  int src_id = -1;
	  if (options->FindKey(constants::kSrcIdKey)) {
	    EXTENSION_FUNCTION_VALIDATE(
	        options->GetInteger(constants::kSrcIdKey, &src_id));
	  }

	#if BUILDFLAG(IS_CHROMEOS_ASH)
	  // Record which component asked for speech, keyed off the source URL host.
	  UMATextToSpeechSource source = UMATextToSpeechSource::kOther;
	  const std::string host = source_url().host();
	  if (host == extension_misc::kSelectToSpeakExtensionId) {
	    source = UMATextToSpeechSource::kSelectToSpeak;
	  } else if (host == extension_misc::kChromeVoxExtensionId) {
	    source = UMATextToSpeechSource::kChromeVox;
	  }
	  UMA_HISTOGRAM_ENUMERATION("TextToSpeech.Utterance.Source", source);
	#endif  // BUILDFLAG(IS_CHROMEOS_ASH)

	  // If we got this far, the arguments were all in the valid format, so
	  // send the success response to the callback now - this ensures that
	  // the callback response always arrives before events, which makes
	  // the behavior more predictable and easier to write unit tests for too.
	  Respond(NoArguments());

	  // Prefer creating the utterance from the extension's background host
	  // contents; fall back to the browser context when there is none.
	  std::unique_ptr<content::TtsUtterance> utterance;
	  if (extension()) {
	    extensions::ExtensionHost* host =
	        extensions::ProcessManager::Get(browser_context())
	            ->GetBackgroundHostForExtension(extension()->id());

	    if (host && host->host_contents())
	      utterance = content::TtsUtterance::Create(host->host_contents());
	  }

	  if (!utterance)
	    utterance = content::TtsUtterance::Create(browser_context());

	  utterance->SetText(text);
	  utterance->SetVoiceName(voice_name);
	  utterance->SetSrcId(src_id);
	  utterance->SetSrcUrl(source_url());
	  utterance->SetLang(lang);
	  utterance->SetContinuousParameters(rate, pitch, volume);
	  utterance->SetShouldClearQueue(!can_enqueue);
	  utterance->SetRequiredEventTypes(required_event_types);
	  utterance->SetDesiredEventTypes(desired_event_types);
	  utterance->SetEngineId(voice_extension_id);
	  utterance->SetOptions(options.get());
	  // The handler is intentionally a raw allocation: it deletes itself from
	  // OnTtsEvent() once the utterance is finished.
	  if (extension())
	    utterance->SetEventDelegate(new TtsExtensionEventHandler(extension_id()));

	  content::TtsController* controller = content::TtsController::GetInstance();
	  controller->SpeakOrEnqueue(std::move(utterance));
	  return AlreadyResponded();
	}

	// Passes the caller's source URL to TtsController::Stop() and then responds
	// with no arguments.
	ExtensionFunction::ResponseAction TtsStopSpeakingFunction::Run() {
	  content::TtsController* const controller =
	      content::TtsController::GetInstance();
	  controller->Stop(source_url());
	  return RespondNow(NoArguments());
	}

	// Calls TtsController::Pause() and then responds with no arguments.
	ExtensionFunction::ResponseAction TtsPauseFunction::Run() {
	  content::TtsController* const controller =
	      content::TtsController::GetInstance();
	  controller->Pause();
	  return RespondNow(NoArguments());
	}

	// Calls TtsController::Resume() and then responds with no arguments.
	ExtensionFunction::ResponseAction TtsResumeFunction::Run() {
	  content::TtsController* const controller =
	      content::TtsController::GetInstance();
	  controller->Resume();
	  return RespondNow(NoArguments());
	}

	// Responds with a single value: the result of TtsController::IsSpeaking().
	ExtensionFunction::ResponseAction TtsIsSpeakingFunction::Run() {
	  const bool is_speaking =
	      content::TtsController::GetInstance()->IsSpeaking();
	  return RespondNow(OneArgument(base::Value(is_speaking)));
	}

	// Responds with a list describing every voice the TtsController reports for
	// this browser context.
	//
	// Each list entry is a dictionary holding the voice name, the remote flag and
	// the list of supported event-type names; the language and engine extension
	// ID are included only when non-empty.
	ExtensionFunction::ResponseAction TtsGetVoicesFunction::Run() {
	  std::vector<content::VoiceData> available_voices;
	  content::TtsController::GetInstance()->GetVoices(browser_context(),
	                                                   &available_voices);

	  auto voice_list = std::make_unique<base::ListValue>();
	  for (const content::VoiceData& voice : available_voices) {
	    auto voice_dict = std::make_unique<base::DictionaryValue>();
	    voice_dict->SetString(constants::kVoiceNameKey, voice.name);
	    voice_dict->SetBoolean(constants::kRemoteKey, voice.remote);
	    if (!voice.lang.empty())
	      voice_dict->SetString(constants::kLangKey, voice.lang);
	    if (!voice.engine_id.empty())
	      voice_dict->SetString(constants::kExtensionIdKey, voice.engine_id);

	    // Translate the voice's supported events into their API names.
	    auto supported_events = std::make_unique<base::ListValue>();
	    for (const content::TtsEventType event_type : voice.events) {
	      const char* event_name = TtsEventTypeToString(event_type);
	      supported_events->AppendString(event_name);
	    }
	    voice_dict->Set(constants::kEventTypesKey, std::move(supported_events));

	    voice_list->Append(std::move(voice_dict));
	  }

	  return RespondNow(
	      OneArgument(base::Value::FromUniquePtrValue(std::move(voice_list))));
	}

	// Registers the TTS and TTS-engine extension functions with the global
	// ExtensionFunctionRegistry. On ChromeOS Ash builds it additionally requests
	// the TtsEngineExtensionObserverChromeOS instance for |context|'s profile.
	TtsAPI::TtsAPI(content::BrowserContext* context) {
	  ExtensionFunctionRegistry& functions =
	      ExtensionFunctionRegistry::GetInstance();

	  // Engine-side functions (ExtensionTtsEngine*).
	  functions.RegisterFunction<ExtensionTtsEngineUpdateVoicesFunction>();
	  functions.RegisterFunction<ExtensionTtsEngineSendTtsEventFunction>();
	  functions.RegisterFunction<ExtensionTtsEngineSendTtsAudioFunction>();

	  // Functions implemented in this file.
	  functions.RegisterFunction<TtsGetVoicesFunction>();
	  functions.RegisterFunction<TtsIsSpeakingFunction>();
	  functions.RegisterFunction<TtsSpeakFunction>();
	  functions.RegisterFunction<TtsStopSpeakingFunction>();
	  functions.RegisterFunction<TtsPauseFunction>();
	  functions.RegisterFunction<TtsResumeFunction>();

	#if BUILDFLAG(IS_CHROMEOS_ASH)
	  // Ensure we're observing newly added engines for the given context.
	  TtsEngineExtensionObserverChromeOS::GetInstance(
	      Profile::FromBrowserContext(context));
	#endif  // BUILDFLAG(IS_CHROMEOS_ASH)
	}

	// Nothing to release beyond what the members clean up themselves.
	TtsAPI::~TtsAPI() = default;

	// File-local, lazily constructed BrowserContextKeyedAPIFactory for TtsAPI.
	// Declared with the DestructorAtExit LazyInstance variant.
	static base::LazyInstance<
	BrowserContextKeyedAPIFactory<TtsAPI>>::DestructorAtExit g_factory =
	LAZY_INSTANCE_INITIALIZER;

	// Returns a pointer to the factory held by |g_factory|.
	BrowserContextKeyedAPIFactory<TtsAPI>* TtsAPI::GetFactoryInstance() {
	return g_factory.Pointer();
	}

	} // namespace extensions