mirror of
https://github.com/mozilla/gecko-dev.git
synced 2024-11-30 16:22:00 +00:00
627ac90e0c
Depends on D152497 Differential Revision: https://phabricator.services.mozilla.com/D152498
325 lines
11 KiB
C++
325 lines
11 KiB
C++
/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
|
|
/* vim: set ts=8 sts=2 et sw=2 tw=80: */
|
|
/* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
|
|
|
#include "mozilla/dom/DOMParser.h"
|
|
|
|
#include "nsNetUtil.h"
|
|
#include "nsDOMString.h"
|
|
#include "MainThreadUtils.h"
|
|
#include "SystemPrincipal.h"
|
|
#include "nsIScriptGlobalObject.h"
|
|
#include "nsIStreamListener.h"
|
|
#include "nsStringStream.h"
|
|
#include "nsCRT.h"
|
|
#include "nsStreamUtils.h"
|
|
#include "nsContentUtils.h"
|
|
#include "nsDOMJSUtils.h"
|
|
#include "nsError.h"
|
|
#include "nsPIDOMWindow.h"
|
|
#include "mozilla/BasePrincipal.h"
|
|
#include "mozilla/LoadInfo.h"
|
|
#include "mozilla/NullPrincipal.h"
|
|
#include "mozilla/dom/BindingUtils.h"
|
|
#include "mozilla/dom/Document.h"
|
|
#include "mozilla/dom/ScriptSettings.h"
|
|
|
|
using namespace mozilla;
|
|
using namespace mozilla::dom;
|
|
|
|
DOMParser::DOMParser(nsIGlobalObject* aOwner, nsIPrincipal* aDocPrincipal,
|
|
nsIURI* aDocumentURI, nsIURI* aBaseURI)
|
|
: mOwner(aOwner),
|
|
mPrincipal(aDocPrincipal),
|
|
mDocumentURI(aDocumentURI),
|
|
mBaseURI(aBaseURI),
|
|
mForceEnableXULXBL(false),
|
|
mForceEnableDTD(false) {
|
|
MOZ_ASSERT(aDocPrincipal);
|
|
MOZ_ASSERT(aDocumentURI);
|
|
}
|
|
|
|
DOMParser::~DOMParser() = default;
|
|
|
|
// QueryInterface implementation for DOMParser
|
|
NS_INTERFACE_MAP_BEGIN_CYCLE_COLLECTION(DOMParser)
|
|
NS_WRAPPERCACHE_INTERFACE_MAP_ENTRY
|
|
NS_INTERFACE_MAP_ENTRY(nsISupports)
|
|
NS_INTERFACE_MAP_END
|
|
|
|
NS_IMPL_CYCLE_COLLECTION_WRAPPERCACHE(DOMParser, mOwner)
|
|
|
|
NS_IMPL_CYCLE_COLLECTING_ADDREF(DOMParser)
|
|
NS_IMPL_CYCLE_COLLECTING_RELEASE(DOMParser)
|
|
|
|
already_AddRefed<Document> DOMParser::ParseFromString(const nsAString& aStr,
|
|
SupportedType aType,
|
|
ErrorResult& aRv) {
|
|
if (aType == SupportedType::Text_html) {
|
|
nsCOMPtr<Document> document = SetUpDocument(DocumentFlavorHTML, aRv);
|
|
if (NS_WARN_IF(aRv.Failed())) {
|
|
return nullptr;
|
|
}
|
|
|
|
// Keep the XULXBL state in sync with the XML case.
|
|
if (mForceEnableXULXBL) {
|
|
document->ForceEnableXULXBL();
|
|
}
|
|
|
|
if (mForceEnableDTD) {
|
|
document->ForceSkipDTDSecurityChecks();
|
|
}
|
|
|
|
nsresult rv = nsContentUtils::ParseDocumentHTML(aStr, document, false);
|
|
if (NS_WARN_IF(NS_FAILED(rv))) {
|
|
aRv.Throw(rv);
|
|
return nullptr;
|
|
}
|
|
|
|
return document.forget();
|
|
}
|
|
|
|
nsAutoCString utf8str;
|
|
// Convert from UTF16 to UTF8 using fallible allocations
|
|
if (!AppendUTF16toUTF8(aStr, utf8str, mozilla::fallible)) {
|
|
aRv.Throw(NS_ERROR_OUT_OF_MEMORY);
|
|
return nullptr;
|
|
}
|
|
|
|
// The new stream holds a reference to the buffer
|
|
nsCOMPtr<nsIInputStream> stream;
|
|
nsresult rv = NS_NewByteInputStream(getter_AddRefs(stream), utf8str,
|
|
NS_ASSIGNMENT_DEPEND);
|
|
if (NS_WARN_IF(NS_FAILED(rv))) {
|
|
aRv.Throw(rv);
|
|
return nullptr;
|
|
}
|
|
|
|
return ParseFromStream(stream, u"UTF-8"_ns, utf8str.Length(), aType, aRv);
|
|
}
|
|
|
|
already_AddRefed<Document> DOMParser::ParseFromSafeString(const nsAString& aStr,
|
|
SupportedType aType,
|
|
ErrorResult& aRv) {
|
|
// Create the new document with the same principal as `mOwner`, even if it is
|
|
// the system principal. This will ensure that nodes from the returned
|
|
// document are in the same DocGroup as the owner global's document, allowing
|
|
// nodes to be adopted.
|
|
nsCOMPtr<nsIPrincipal> docPrincipal = mPrincipal;
|
|
if (mOwner && mOwner->PrincipalOrNull()) {
|
|
mPrincipal = mOwner->PrincipalOrNull();
|
|
}
|
|
|
|
RefPtr<Document> ret = ParseFromString(aStr, aType, aRv);
|
|
mPrincipal = docPrincipal;
|
|
return ret.forget();
|
|
}
|
|
|
|
already_AddRefed<Document> DOMParser::ParseFromBuffer(const Uint8Array& aBuf,
|
|
SupportedType aType,
|
|
ErrorResult& aRv) {
|
|
return aBuf.ProcessFixedData([&](const Span<uint8_t>& aData) {
|
|
return ParseFromBuffer(aData, aType, aRv);
|
|
});
|
|
}
|
|
|
|
already_AddRefed<Document> DOMParser::ParseFromBuffer(Span<const uint8_t> aBuf,
|
|
SupportedType aType,
|
|
ErrorResult& aRv) {
|
|
// The new stream holds a reference to the buffer
|
|
nsCOMPtr<nsIInputStream> stream;
|
|
nsresult rv = NS_NewByteInputStream(
|
|
getter_AddRefs(stream),
|
|
Span(reinterpret_cast<const char*>(aBuf.Elements()), aBuf.Length()),
|
|
NS_ASSIGNMENT_DEPEND);
|
|
if (NS_FAILED(rv)) {
|
|
aRv.Throw(rv);
|
|
return nullptr;
|
|
}
|
|
|
|
return ParseFromStream(stream, VoidString(), aBuf.Length(), aType, aRv);
|
|
}
|
|
|
|
already_AddRefed<Document> DOMParser::ParseFromStream(nsIInputStream* aStream,
|
|
const nsAString& aCharset,
|
|
int32_t aContentLength,
|
|
SupportedType aType,
|
|
ErrorResult& aRv) {
|
|
bool svg = (aType == SupportedType::Image_svg_xml);
|
|
|
|
// For now, we can only create XML documents.
|
|
// XXXsmaug Should we create an HTMLDocument (in XHTML mode)
|
|
// for "application/xhtml+xml"?
|
|
if (aType != SupportedType::Text_xml &&
|
|
aType != SupportedType::Application_xml &&
|
|
aType != SupportedType::Application_xhtml_xml && !svg) {
|
|
aRv.Throw(NS_ERROR_NOT_IMPLEMENTED);
|
|
return nullptr;
|
|
}
|
|
|
|
// Put the nsCOMPtr out here so we hold a ref to the stream as needed
|
|
nsCOMPtr<nsIInputStream> stream = aStream;
|
|
if (!NS_InputStreamIsBuffered(stream)) {
|
|
nsCOMPtr<nsIInputStream> bufferedStream;
|
|
nsresult rv = NS_NewBufferedInputStream(getter_AddRefs(bufferedStream),
|
|
stream.forget(), 4096);
|
|
if (NS_WARN_IF(NS_FAILED(rv))) {
|
|
aRv.Throw(rv);
|
|
return nullptr;
|
|
}
|
|
|
|
stream = bufferedStream;
|
|
}
|
|
|
|
nsCOMPtr<Document> document =
|
|
SetUpDocument(svg ? DocumentFlavorSVG : DocumentFlavorLegacyGuess, aRv);
|
|
if (NS_WARN_IF(aRv.Failed())) {
|
|
return nullptr;
|
|
}
|
|
|
|
// Create a fake channel
|
|
nsCOMPtr<nsIChannel> parserChannel;
|
|
NS_NewInputStreamChannel(
|
|
getter_AddRefs(parserChannel), mDocumentURI,
|
|
nullptr, // aStream
|
|
mPrincipal, nsILoadInfo::SEC_FORCE_INHERIT_PRINCIPAL,
|
|
nsIContentPolicy::TYPE_OTHER,
|
|
nsDependentCSubstring(SupportedTypeValues::GetString(aType)));
|
|
if (NS_WARN_IF(!parserChannel)) {
|
|
aRv.Throw(NS_ERROR_UNEXPECTED);
|
|
return nullptr;
|
|
}
|
|
|
|
if (!DOMStringIsNull(aCharset)) {
|
|
parserChannel->SetContentCharset(NS_ConvertUTF16toUTF8(aCharset));
|
|
}
|
|
|
|
// Tell the document to start loading
|
|
nsCOMPtr<nsIStreamListener> listener;
|
|
|
|
// Keep the XULXBL state in sync with the HTML case
|
|
if (mForceEnableXULXBL) {
|
|
document->ForceEnableXULXBL();
|
|
}
|
|
|
|
if (mForceEnableDTD) {
|
|
document->ForceSkipDTDSecurityChecks();
|
|
}
|
|
|
|
// Have to pass false for reset here, else the reset will remove
|
|
// our event listener. Should that listener addition move to later
|
|
// than this call?
|
|
nsresult rv =
|
|
document->StartDocumentLoad(kLoadAsData, parserChannel, nullptr, nullptr,
|
|
getter_AddRefs(listener), false);
|
|
|
|
if (NS_FAILED(rv) || !listener) {
|
|
aRv.Throw(NS_ERROR_FAILURE);
|
|
return nullptr;
|
|
}
|
|
|
|
// Now start pumping data to the listener
|
|
nsresult status;
|
|
|
|
rv = listener->OnStartRequest(parserChannel);
|
|
if (NS_FAILED(rv)) parserChannel->Cancel(rv);
|
|
parserChannel->GetStatus(&status);
|
|
|
|
if (NS_SUCCEEDED(rv) && NS_SUCCEEDED(status)) {
|
|
rv = listener->OnDataAvailable(parserChannel, stream, 0, aContentLength);
|
|
if (NS_FAILED(rv)) parserChannel->Cancel(rv);
|
|
parserChannel->GetStatus(&status);
|
|
}
|
|
|
|
rv = listener->OnStopRequest(parserChannel, status);
|
|
// Failure returned from OnStopRequest does not affect the final status of
|
|
// the channel, so we do not need to call Cancel(rv) as we do above.
|
|
|
|
if (NS_FAILED(rv)) {
|
|
aRv.Throw(NS_ERROR_FAILURE);
|
|
return nullptr;
|
|
}
|
|
|
|
return document.forget();
|
|
}
|
|
|
|
/*static */
|
|
already_AddRefed<DOMParser> DOMParser::Constructor(const GlobalObject& aOwner,
|
|
ErrorResult& rv) {
|
|
MOZ_ASSERT(NS_IsMainThread());
|
|
nsCOMPtr<nsIPrincipal> docPrincipal = aOwner.GetSubjectPrincipal();
|
|
nsCOMPtr<nsIURI> documentURI;
|
|
nsIURI* baseURI = nullptr;
|
|
if (docPrincipal->IsSystemPrincipal()) {
|
|
docPrincipal = NullPrincipal::Create(OriginAttributes());
|
|
documentURI = docPrincipal->GetURI();
|
|
} else {
|
|
// Grab document and base URIs off the window our constructor was
|
|
// called on. Error out if anything untoward happens.
|
|
nsCOMPtr<nsPIDOMWindowInner> window =
|
|
do_QueryInterface(aOwner.GetAsSupports());
|
|
if (!window) {
|
|
rv.Throw(NS_ERROR_UNEXPECTED);
|
|
return nullptr;
|
|
}
|
|
|
|
baseURI = window->GetDocBaseURI();
|
|
documentURI = window->GetDocumentURI();
|
|
}
|
|
|
|
if (!documentURI) {
|
|
rv.Throw(NS_ERROR_UNEXPECTED);
|
|
return nullptr;
|
|
}
|
|
|
|
nsCOMPtr<nsIGlobalObject> global = do_QueryInterface(aOwner.GetAsSupports());
|
|
MOZ_ASSERT(global);
|
|
RefPtr<DOMParser> domParser =
|
|
new DOMParser(global, docPrincipal, documentURI, baseURI);
|
|
return domParser.forget();
|
|
}
|
|
|
|
// static
|
|
already_AddRefed<DOMParser> DOMParser::CreateWithoutGlobal(ErrorResult& aRv) {
|
|
nsCOMPtr<nsIPrincipal> docPrincipal =
|
|
NullPrincipal::Create(OriginAttributes());
|
|
|
|
nsCOMPtr<nsIURI> documentURI = docPrincipal->GetURI();
|
|
if (!documentURI) {
|
|
aRv.Throw(NS_ERROR_UNEXPECTED);
|
|
return nullptr;
|
|
}
|
|
|
|
RefPtr<DOMParser> domParser =
|
|
new DOMParser(nullptr, docPrincipal, documentURI, nullptr);
|
|
return domParser.forget();
|
|
}
|
|
|
|
already_AddRefed<Document> DOMParser::SetUpDocument(DocumentFlavor aFlavor,
|
|
ErrorResult& aRv) {
|
|
// We should really just use mOwner here, but Document gets confused
|
|
// if we pass it a scriptHandlingObject that doesn't QI to
|
|
// nsIScriptGlobalObject, and test_isequalnode.js (an xpcshell test without
|
|
// a window global) breaks. The correct solution is just to wean Document off
|
|
// of nsIScriptGlobalObject, but that's a yak to shave another day.
|
|
nsCOMPtr<nsIScriptGlobalObject> scriptHandlingObject =
|
|
do_QueryInterface(mOwner);
|
|
|
|
// Try to inherit a style backend.
|
|
NS_ASSERTION(mPrincipal, "Must have principal by now");
|
|
NS_ASSERTION(mDocumentURI, "Must have document URI by now");
|
|
|
|
nsCOMPtr<Document> doc;
|
|
nsresult rv = NS_NewDOMDocument(getter_AddRefs(doc), u""_ns, u""_ns, nullptr,
|
|
mDocumentURI, mBaseURI, mPrincipal, true,
|
|
scriptHandlingObject, aFlavor);
|
|
if (NS_WARN_IF(NS_FAILED(rv))) {
|
|
aRv.Throw(rv);
|
|
return nullptr;
|
|
}
|
|
|
|
return doc.forget();
|
|
}
|