From 36d22d82aa202bb199967e9512281e9a53db42c9 Mon Sep 17 00:00:00 2001 From: Daniel Baumann Date: Sun, 7 Apr 2024 21:33:14 +0200 Subject: Adding upstream version 115.7.0esr. Signed-off-by: Daniel Baumann --- parser/html/nsParserUtils.cpp | 127 ++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 127 insertions(+) create mode 100644 parser/html/nsParserUtils.cpp (limited to 'parser/html/nsParserUtils.cpp') diff --git a/parser/html/nsParserUtils.cpp b/parser/html/nsParserUtils.cpp new file mode 100644 index 0000000000..74b86febe8 --- /dev/null +++ b/parser/html/nsParserUtils.cpp @@ -0,0 +1,127 @@ +/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ +/* This Source Code Form is subject to the terms of the Mozilla Public + * License, v. 2.0. If a copy of the MPL was not distributed with this + * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ + +#include "nsParserUtils.h" +#include "mozilla/NullPrincipal.h" +#include "mozilla/UniquePtr.h" +#include "mozilla/dom/DocumentFragment.h" +#include "mozilla/dom/Element.h" +#include "mozilla/dom/ScriptLoader.h" +#include "nsAttrName.h" +#include "nsCOMPtr.h" +#include "nsContentCID.h" +#include "nsContentUtils.h" +#include "nsEscape.h" +#include "nsHTMLParts.h" +#include "nsHtml5Module.h" +#include "nsIContent.h" +#include "nsIContentSink.h" +#include "nsIDTD.h" +#include "mozilla/dom/Document.h" +#include "nsIDocumentEncoder.h" +#include "nsIFragmentContentSink.h" +#include "nsIParser.h" +#include "nsNetCID.h" +#include "nsNetUtil.h" +#include "nsString.h" +#include "nsTreeSanitizer.h" +#include "nsXPCOM.h" + +#define XHTML_DIV_TAG u"div xmlns=\"http://www.w3.org/1999/xhtml\"" + +using namespace mozilla::dom; + +NS_IMPL_ISUPPORTS(nsParserUtils, nsIParserUtils) + +NS_IMETHODIMP +nsParserUtils::ConvertToPlainText(const nsAString& aFromStr, uint32_t aFlags, + uint32_t aWrapCol, nsAString& aToStr) { + return nsContentUtils::ConvertToPlainText(aFromStr, aToStr, aFlags, aWrapCol); +} + +template +static nsresult SanitizeWith(const nsAString& aInput, nsAString& aOutput, + Callable aDoSanitize) { + RefPtr document = nsContentUtils::CreateInertHTMLDocument(nullptr); + if (!document) { + return NS_ERROR_FAILURE; + } + + nsresult rv = nsContentUtils::ParseDocumentHTML(aInput, document, false); + NS_ENSURE_SUCCESS(rv, rv); + + aDoSanitize(document.get()); + + nsCOMPtr encoder = do_createDocumentEncoder("text/html"); + encoder->NativeInit(document, u"text/html"_ns, + nsIDocumentEncoder::OutputDontRewriteEncodingDeclaration | + nsIDocumentEncoder::OutputNoScriptContent | + nsIDocumentEncoder::OutputEncodeBasicEntities | + nsIDocumentEncoder::OutputLFLineBreak | + nsIDocumentEncoder::OutputRaw); + return encoder->EncodeToString(aOutput); +} + +NS_IMETHODIMP +nsParserUtils::Sanitize(const nsAString& aFromStr, uint32_t aFlags, + nsAString& aToStr) { + return SanitizeWith(aFromStr, aToStr, [&](Document* aDocument) { + nsTreeSanitizer sanitizer(aFlags); + sanitizer.Sanitize(aDocument); + }); +} + +NS_IMETHODIMP +nsParserUtils::RemoveConditionalCSS(const nsAString& aFromStr, + nsAString& aToStr) { + return SanitizeWith(aFromStr, aToStr, [](Document* aDocument) { + nsTreeSanitizer::RemoveConditionalCSSFromSubtree(aDocument); + }); +} + +NS_IMETHODIMP +nsParserUtils::ParseFragment(const nsAString& aFragment, uint32_t aFlags, + bool aIsXML, nsIURI* aBaseURI, + Element* aContextElement, + DocumentFragment** aReturn) { + NS_ENSURE_ARG(aContextElement); + *aReturn = nullptr; + + RefPtr document = aContextElement->OwnerDoc(); + + nsAutoScriptBlockerSuppressNodeRemoved autoBlocker; + + // stop scripts + RefPtr loader = document->ScriptLoader(); + bool scripts_enabled = loader->GetEnabled(); + if (scripts_enabled) { + loader->SetEnabled(false); + } + + // Wrap things in a div or body for parsing, but it won't show up in + // the fragment. + nsresult rv = NS_OK; + AutoTArray tagStack; + RefPtr fragment; + if (aIsXML) { + // XHTML + tagStack.AppendElement(nsLiteralString(XHTML_DIV_TAG)); + rv = nsContentUtils::ParseFragmentXML(aFragment, document, tagStack, true, + aFlags, getter_AddRefs(fragment)); + } else { + fragment = new (document->NodeInfoManager()) + DocumentFragment(document->NodeInfoManager()); + rv = nsContentUtils::ParseFragmentHTML(aFragment, fragment, nsGkAtoms::body, + kNameSpaceID_XHTML, false, true, + aFlags); + } + + if (scripts_enabled) { + loader->SetEnabled(true); + } + + fragment.forget(aReturn); + return rv; +} -- cgit v1.2.3