gecko-dev/widget/TextRecognition.cpp
Nika Layzell ff386ec755 Bug 1781129 - Part 2: Use BigBuffer for ShmemImage, r=edgar
The ShmemImage type was previously implemented using a Shmem, however due to
the usage patterns, `BigBuffer` is probably a better fit, and allows unifying
more code in nsContentUtils.

Differential Revision: https://phabricator.services.mozilla.com/D151853
2022-08-26 16:08:05 +00:00

134 lines
4.9 KiB
C++

/* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/. */
#include "TextRecognition.h"
#include "mozilla/dom/Promise.h"
#include "mozilla/dom/ShadowRoot.h"
#include "mozilla/dom/Document.h"
#include "mozilla/dom/ContentChild.h"
#include "nsTextNode.h"
#include "imgIContainer.h"
#ifdef XP_MACOSX
# include "nsCocoaFeatures.h"
#endif
using namespace mozilla::dom;
namespace mozilla::widget {
auto TextRecognition::FindText(imgIContainer& aImage,
const nsTArray<nsCString>& aLanguages)
-> RefPtr<NativePromise> {
// TODO: Maybe decode async.
RefPtr<gfx::SourceSurface> surface = aImage.GetFrame(
imgIContainer::FRAME_CURRENT,
imgIContainer::FLAG_SYNC_DECODE | imgIContainer::FLAG_ASYNC_NOTIFY);
if (NS_WARN_IF(!surface)) {
return NativePromise::CreateAndReject("Failed to get surface"_ns, __func__);
}
RefPtr<gfx::DataSourceSurface> dataSurface = surface->GetDataSurface();
if (NS_WARN_IF(!dataSurface)) {
return NativePromise::CreateAndReject("Failed to get data surface"_ns,
__func__);
}
return FindText(*dataSurface, aLanguages);
}
auto TextRecognition::FindText(gfx::DataSourceSurface& aSurface,
const nsTArray<nsCString>& aLanguages)
-> RefPtr<NativePromise> {
if (XRE_IsContentProcess()) {
auto* contentChild = ContentChild::GetSingleton();
auto image = nsContentUtils::SurfaceToIPCImage(aSurface);
if (!image) {
return NativePromise::CreateAndReject("Failed to share data surface"_ns,
__func__);
}
auto promise = MakeRefPtr<NativePromise::Private>(__func__);
contentChild->SendFindImageText(std::move(*image), aLanguages)
->Then(
GetCurrentSerialEventTarget(), __func__,
[promise](TextRecognitionResultOrError&& aResultOrError) {
switch (aResultOrError.type()) {
case TextRecognitionResultOrError::Type::TTextRecognitionResult:
promise->Resolve(
std::move(aResultOrError.get_TextRecognitionResult()),
__func__);
break;
case TextRecognitionResultOrError::Type::TnsCString:
promise->Reject(std::move(aResultOrError.get_nsCString()),
__func__);
break;
default:
MOZ_ASSERT_UNREACHABLE("Unknown result?");
promise->Reject("Unknown error"_ns, __func__);
break;
}
},
[promise](mozilla::ipc::ResponseRejectReason) {
promise->Reject("IPC rejection"_ns, __func__);
});
return promise;
}
return DoFindText(aSurface, aLanguages);
}
void TextRecognition::FillShadow(ShadowRoot& aShadow,
const TextRecognitionResult& aResult) {
auto& doc = *aShadow.OwnerDoc();
RefPtr<Element> div = doc.CreateHTMLElement(nsGkAtoms::div);
for (const auto& quad : aResult.quads()) {
RefPtr<Element> span = doc.CreateHTMLElement(nsGkAtoms::span);
// TODO: We probably want to position them here and so on. For now, expose
// the data as attributes so that it's easy to play with the returned values
// in JS.
{
nsAutoString points;
for (const auto& point : quad.points()) {
points.AppendFloat(point.x);
points.Append(u',');
points.AppendFloat(point.y);
points.Append(u',');
}
points.Trim(",");
span->SetAttribute(u"data-points"_ns, points, IgnoreErrors());
nsAutoString confidence;
confidence.AppendFloat(quad.confidence());
span->SetAttribute(u"data-confidence"_ns, confidence, IgnoreErrors());
}
{
RefPtr<nsTextNode> text = doc.CreateTextNode(quad.string());
span->AppendChildTo(text, true, IgnoreErrors());
}
div->AppendChildTo(span, true, IgnoreErrors());
}
aShadow.AppendChildTo(div, true, IgnoreErrors());
}
#ifndef XP_MACOSX
auto TextRecognition::DoFindText(gfx::DataSourceSurface&,
const nsTArray<nsCString>&)
-> RefPtr<NativePromise> {
MOZ_RELEASE_ASSERT(XRE_IsParentProcess(),
"This should only run in the parent process");
return NativePromise::CreateAndReject("Text recognition not available"_ns,
__func__);
}
#endif
bool TextRecognition::IsSupported() {
#ifdef XP_MACOSX
// Catalina (10.15) or higher is required because of the following API:
// VNRecognizeTextRequest - macOS 10.15+
// https://developer.apple.com/documentation/vision/vnrecognizetextrequest?language=objc
return nsCocoaFeatures::OnCatalinaOrLater();
#else
return false;
#endif
}
} // namespace mozilla::widget