// SpeechRecognitionServer.cpp [plain text]
#include "config.h"
#include "SpeechRecognitionServer.h"
#include "UserMediaProcessManager.h"
#include "WebProcessProxy.h"
#include "WebSpeechRecognitionConnectionMessages.h"
#include <WebCore/SpeechRecognitionRequestInfo.h>
#include <WebCore/SpeechRecognitionUpdate.h>
#define MESSAGE_CHECK(assertion) MESSAGE_CHECK_BASE(assertion, messageSenderConnection())
namespace WebKit {
// Constructs a server that talks to its client over |connection|.
//
// connection        - stored in m_connection and returned by messageSenderConnection().
// identifier        - stored in m_identifier; used as the message destination ID and
//                     passed to WebProcessProxy::muteCaptureInPagesExcept() when a
//                     request starts capturing.
// permissionChecker - callable invoked for every new request before recognition begins.
// checkIfEnabled    - callable queried at start time; its result is forwarded to the
//                     recognizer as the "mock device captures enabled" flag.
// function          - (MEDIA_STREAM builds only) factory that yields the audio source,
//                     or an error, for a request.
//
// All callables are moved into the corresponding members; nothing else happens here.
SpeechRecognitionServer::SpeechRecognitionServer(Ref<IPC::Connection>&& connection, SpeechRecognitionServerIdentifier identifier, SpeechRecognitionPermissionChecker&& permissionChecker, SpeechRecognitionCheckIfMockSpeechRecognitionEnabled&& checkIfEnabled
#if ENABLE(MEDIA_STREAM)
, RealtimeMediaSourceCreateFunction&& function
#endif
)
: m_connection(WTFMove(connection))
, m_identifier(identifier)
, m_permissionChecker(WTFMove(permissionChecker))
, m_checkIfMockSpeechRecognitionEnabled(WTFMove(checkIfEnabled))
#if ENABLE(MEDIA_STREAM)
, m_realtimeMediaSourceCreateFunction(WTFMove(function))
#endif
{
}
// Handles a start message: records a new request for |clientIdentifier| and
// kicks off the permission check for it. Recognition itself only begins once
// the permission callback reports no error (see requestPermissionForRequest()).
void SpeechRecognitionServer::start(WebCore::SpeechRecognitionConnectionClientIdentifier clientIdentifier, String&& lang, bool continuous, bool interimResults, uint64_t maxAlternatives, WebCore::ClientOrigin&& origin, WebCore::FrameIdentifier frameIdentifier)
{
    MESSAGE_CHECK(clientIdentifier);
    // A client is expected to have at most one tracked request at a time.
    ASSERT(!m_requests.contains(clientIdentifier));

    WebCore::SpeechRecognitionRequestInfo info { clientIdentifier, WTFMove(lang), continuous, interimResults, maxAlternatives, WTFMove(origin), frameIdentifier };
    auto addResult = m_requests.add(clientIdentifier, makeUnique<WebCore::SpeechRecognitionRequest>(WTFMove(info)));

    // The map owns the request; hand out a reference to the stored object.
    requestPermissionForRequest(*addResult.iterator->value);
}
// Runs the permission checker for |request|. When the checker calls back:
//  - nothing happens if this server or the request has been destroyed meanwhile;
//  - on error the request is dropped and the error is reported to the client;
//  - otherwise the request proceeds to handleRequest().
void SpeechRecognitionServer::requestPermissionForRequest(WebCore::SpeechRecognitionRequest& request)
{
    auto permissionCallback = [this, weakThis = makeWeakPtr(this), weakRequest = makeWeakPtr(request)](auto error) mutable {
        // Both the server and the request may be gone by the time the checker answers.
        if (!weakThis || !weakRequest)
            return;

        // Copy the identifier first: removing the map entry below destroys the request.
        auto clientIdentifier = weakRequest->clientIdentifier();
        if (!error) {
            handleRequest(*weakRequest);
            return;
        }

        m_requests.remove(clientIdentifier);
        sendUpdate(clientIdentifier, WebCore::SpeechRecognitionUpdateType::Error, WTFMove(error));
    };

    m_permissionChecker(request.lang(), request.clientOrigin(), request.frameIdentifier(), WTFMove(permissionCallback));
}
// Begins recognition for |request|; called once the permission check reported no error.
// Steps, in order:
//  1. Create the recognizer on first use, wiring its update callback.
//  2. If another client currently owns the recognizer, tell it it was aborted and reset.
//  3. MEDIA_STREAM builds: create the audio source and start the recognizer, or report
//     an AudioCapture error if the source cannot be created.
//     Other builds: always report an AudioCapture error.
void SpeechRecognitionServer::handleRequest(WebCore::SpeechRecognitionRequest& request)
{
if (!m_recognizer) {
// The recognizer is created lazily and kept for later requests. The callback below
// receives every update the recognizer produces.
m_recognizer = makeUnique<WebCore::SpeechRecognizer>([this, weakThis = makeWeakPtr(this)](auto& update) {
if (!weakThis)
return;
auto clientIdentifier = update.clientIdentifier();
// Ignore updates for clients that are no longer tracked, for example after
// invalidate() removed the entry before aborting the recognizer.
if (!m_requests.contains(clientIdentifier))
return;
sendUpdate(update);
auto type = update.type();
// Only Error and End finish a request; every other update type is just forwarded.
if (type != WebCore::SpeechRecognitionUpdateType::Error && type != WebCore::SpeechRecognitionUpdateType::End)
return;
// NOTE(review): m_isResetting presumably guards against reset() re-entering this
// callback with another terminal update — confirm against SpeechRecognizer::reset().
if (m_isResetting)
return;
m_isResetting = true;
m_recognizer->reset();
m_requests.remove(clientIdentifier);
m_isResetting = false;
});
}
// Only one client is served at a time: a client that currently owns the recognizer is
// pre-empted with an Aborted error before the new request starts.
// NOTE(review): this path does not remove the pre-empted client's entry from m_requests
// itself; whether it gets removed depends on what reset() reports to the callback above
// — TODO confirm.
if (auto currentClientIdentifier = m_recognizer->currentClientIdentifier()) {
auto error = WebCore::SpeechRecognitionError { WebCore::SpeechRecognitionErrorType::Aborted, "Another request is started"_s };
sendUpdate(*currentClientIdentifier, WebCore::SpeechRecognitionUpdateType::Error, error);
m_recognizer->reset();
}
// Copied up front because the failure paths below remove (and thereby destroy) the request.
auto clientIdentifier = request.clientIdentifier();
#if ENABLE(MEDIA_STREAM)
auto sourceOrError = m_realtimeMediaSourceCreateFunction();
if (!sourceOrError) {
// No audio source: drop the request and surface the factory's error message.
m_requests.remove(clientIdentifier);
sendUpdate(WebCore::SpeechRecognitionUpdate::createError(clientIdentifier, WebCore::SpeechRecognitionError { WebCore::SpeechRecognitionErrorType::AudioCapture, sourceOrError.errorMessage }));
return;
}
// Mute capture everywhere except the page identified by m_identifier before starting.
WebProcessProxy::muteCaptureInPagesExcept(m_identifier);
bool mockDeviceCapturesEnabled = m_checkIfMockSpeechRecognitionEnabled();
m_recognizer->start(clientIdentifier, sourceOrError.source(), mockDeviceCapturesEnabled, request.lang(), request.continuous(), request.interimResults(), request.maxAlternatives());
#else
// Without MEDIA_STREAM there is no way to capture audio, so every request fails here.
m_requests.remove(clientIdentifier);
sendUpdate(clientIdentifier, WebCore::SpeechRecognitionUpdateType::Error, WebCore::SpeechRecognitionError { WebCore::SpeechRecognitionErrorType::AudioCapture, "Audio capture is not implemented"_s });
#endif
}
// Handles a stop message for |clientIdentifier|.
// If that client currently owns the recognizer, the recognizer is asked to stop.
// Otherwise a tracked request for that client is simply dropped and an End
// update is sent directly; unknown clients are ignored.
void SpeechRecognitionServer::stop(WebCore::SpeechRecognitionConnectionClientIdentifier clientIdentifier)
{
    MESSAGE_CHECK(clientIdentifier);

    bool isActiveClient = m_recognizer && m_recognizer->currentClientIdentifier() == clientIdentifier;
    if (!isActiveClient) {
        if (m_requests.remove(clientIdentifier))
            sendUpdate(clientIdentifier, WebCore::SpeechRecognitionUpdateType::End);
        return;
    }

    m_recognizer->stop();
}
// Handles an abort message for |clientIdentifier|.
// If that client currently owns the recognizer, the recognizer is asked to abort.
// Otherwise a tracked request for that client is simply dropped and an End
// update is sent directly; unknown clients are ignored.
void SpeechRecognitionServer::abort(WebCore::SpeechRecognitionConnectionClientIdentifier clientIdentifier)
{
    MESSAGE_CHECK(clientIdentifier);

    bool isActiveClient = m_recognizer && m_recognizer->currentClientIdentifier() == clientIdentifier;
    if (!isActiveClient) {
        if (m_requests.remove(clientIdentifier))
            sendUpdate(clientIdentifier, WebCore::SpeechRecognitionUpdateType::End);
        return;
    }

    m_recognizer->abort();
}
// Forgets the request for |clientIdentifier| without sending the client anything.
// The entry is removed first, so updates the recognizer produces afterwards for
// this client are discarded by the recognizer callback's m_requests check.
void SpeechRecognitionServer::invalidate(WebCore::SpeechRecognitionConnectionClientIdentifier clientIdentifier)
{
    MESSAGE_CHECK(clientIdentifier);

    // Nothing tracked for this client: nothing to tear down.
    if (!m_requests.remove(clientIdentifier))
        return;

    if (m_recognizer && m_recognizer->currentClientIdentifier() == clientIdentifier)
        m_recognizer->abort();
}
void SpeechRecognitionServer::abortForPageIsBecomingInvisible()
{
if (!m_recognizer)
return;
auto currentClientIdentifier = m_recognizer->currentClientIdentifier();
if (!currentClientIdentifier)
return;
auto error = WebCore::SpeechRecognitionError { WebCore::SpeechRecognitionErrorType::Aborted, "Page is no longer visible"_s };
sendUpdate(*currentClientIdentifier, WebCore::SpeechRecognitionUpdateType::Error, error);
m_recognizer->reset();
}
// Builds an update of |type| for |clientIdentifier| and sends it to the client.
// |error| is dereferenced when type is Error and |result| when type is Result,
// so callers must supply the matching optional for those two types.
void SpeechRecognitionServer::sendUpdate(WebCore::SpeechRecognitionConnectionClientIdentifier clientIdentifier, WebCore::SpeechRecognitionUpdateType type, Optional<WebCore::SpeechRecognitionError> error, Optional<Vector<WebCore::SpeechRecognitionResultData>> result)
{
    // Start from a payload-free update; Error and Result replace it with one carrying data.
    auto update = WebCore::SpeechRecognitionUpdate::create(clientIdentifier, type);

    switch (type) {
    case WebCore::SpeechRecognitionUpdateType::Error:
        update = WebCore::SpeechRecognitionUpdate::createError(clientIdentifier, *error);
        break;
    case WebCore::SpeechRecognitionUpdateType::Result:
        update = WebCore::SpeechRecognitionUpdate::createResult(clientIdentifier, *result);
        break;
    default:
        break;
    }

    sendUpdate(update);
}
// Delivers |update| to the client as a
// WebSpeechRecognitionConnection::DidReceiveUpdate message.
void SpeechRecognitionServer::sendUpdate(const WebCore::SpeechRecognitionUpdate& update)
{
    auto message = Messages::WebSpeechRecognitionConnection::DidReceiveUpdate(update);
    send(WTFMove(message));
}
// Returns the connection supplied at construction; also used by MESSAGE_CHECK in this file.
IPC::Connection* SpeechRecognitionServer::messageSenderConnection() const
{
    auto* connection = m_connection.ptr();
    return connection;
}
// Returns this server's identifier as the 64-bit destination ID for outgoing messages.
uint64_t SpeechRecognitionServer::messageSenderDestinationID() const
{
    uint64_t destinationID = m_identifier.toUInt64();
    return destinationID;
}
// Mutes the recognizer's audio source, if a recognizer exists and has one.
void SpeechRecognitionServer::mute()
{
    auto* source = m_recognizer ? m_recognizer->source() : nullptr;
    if (!source)
        return;

    source->mute();
}
}
#undef MESSAGE_CHECK