2007-03-22 10:30:00 -07:00
|
|
|
/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
|
|
|
|
/* ***** BEGIN LICENSE BLOCK *****
|
|
|
|
* Version: MPL 1.1/GPL 2.0/LGPL 2.1
|
|
|
|
*
|
|
|
|
* The contents of this file are subject to the Mozilla Public License Version
|
|
|
|
* 1.1 (the "License"); you may not use this file except in compliance with
|
|
|
|
* the License. You may obtain a copy of the License at
|
|
|
|
* http://www.mozilla.org/MPL/
|
|
|
|
*
|
|
|
|
* Software distributed under the License is distributed on an "AS IS" basis,
|
|
|
|
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
|
|
|
|
* for the specific language governing rights and limitations under the
|
|
|
|
* License.
|
|
|
|
*
|
|
|
|
* The Original Code is mozilla.org code.
|
|
|
|
*
|
|
|
|
* The Initial Developer of the Original Code is Robert Sayre.
|
|
|
|
* Portions created by the Initial Developer are Copyright (C) 2006
|
|
|
|
* the Initial Developer. All Rights Reserved.
|
|
|
|
*
|
|
|
|
* Contributor(s):
|
|
|
|
*
|
|
|
|
* Alternatively, the contents of this file may be used under the terms of
|
|
|
|
* either the GNU General Public License Version 2 or later (the "GPL"), or
|
|
|
|
* the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
|
|
|
|
* in which case the provisions of the GPL or the LGPL are applicable instead
|
|
|
|
* of those above. If you wish to allow use of your version of this file only
|
|
|
|
* under the terms of either the GPL or the LGPL, and not to allow others to
|
|
|
|
* use your version of this file under the terms of the MPL, indicate your
|
|
|
|
* decision by deleting the provisions above and replace them with the notice
|
|
|
|
* and other provisions required by the GPL or the LGPL. If you do not delete
|
|
|
|
* the provisions above, a recipient may use your version of this file under
|
|
|
|
* the terms of any one of the MPL, the GPL or the LGPL.
|
|
|
|
*
|
|
|
|
* ***** END LICENSE BLOCK ***** */
|
|
|
|
|
|
|
|
#include "nsString.h"
|
|
|
|
#include "nsIComponentManager.h"
|
|
|
|
#include "nsCOMPtr.h"
|
|
|
|
#include "nsXPCOM.h"
|
|
|
|
#include "nsISupportsPrimitives.h"
|
|
|
|
#include "nsXPIDLString.h"
|
|
|
|
#include "nsScriptLoader.h"
|
|
|
|
#include "nsEscape.h"
|
|
|
|
#include "nsIParser.h"
|
|
|
|
#include "nsIDTD.h"
|
|
|
|
#include "nsNetCID.h"
|
|
|
|
#include "nsNetUtil.h"
|
|
|
|
#include "nsParserCIID.h"
|
|
|
|
#include "nsParserCIID.h"
|
|
|
|
#include "nsIContentSink.h"
|
|
|
|
#include "nsIHTMLToTextSink.h"
|
|
|
|
#include "nsIDocumentEncoder.h"
|
|
|
|
#include "nsIDOMDocumentFragment.h"
|
|
|
|
#include "nsIFragmentContentSink.h"
|
|
|
|
#include "nsIDOMDocument.h"
|
|
|
|
#include "nsIDOMNodeList.h"
|
|
|
|
#include "nsIDOMNode.h"
|
|
|
|
#include "nsIDOMElement.h"
|
|
|
|
#include "nsIDocument.h"
|
|
|
|
#include "nsIContent.h"
|
|
|
|
#include "nsAttrName.h"
|
|
|
|
#include "nsHTMLParts.h"
|
|
|
|
#include "nsContentCID.h"
|
|
|
|
#include "nsIScriptableUnescapeHTML.h"
|
|
|
|
#include "nsScriptableUnescapeHTML.h"
|
|
|
|
#include "nsAutoPtr.h"
|
2011-07-29 04:48:04 -07:00
|
|
|
#include "nsTreeSanitizer.h"
|
|
|
|
#include "nsAHtml5FragmentParser.h"
|
|
|
|
#include "nsHtml5Module.h"
|
2007-03-22 10:30:00 -07:00
|
|
|
|
|
|
|
// Tag text (without the surrounding angle brackets) for a <div> bound to the
// XHTML namespace. ParseFragment pushes it onto the tag stack that wraps XML
// fragments, optionally followed by an xml:base attribute.
#define XHTML_DIV_TAG "div xmlns=\"http://www.w3.org/1999/xhtml\""
|
|
|
|
|
|
|
|
// XPCOM nsISupports boilerplate for nsScriptableUnescapeHTML; the only
// interface named here is nsIScriptableUnescapeHTML.
NS_IMPL_ISUPPORTS1(nsScriptableUnescapeHTML, nsIScriptableUnescapeHTML)
|
|
|
|
|
|
|
|
// Class ID passed to do_CreateInstance() in this file to obtain an nsIParser.
static NS_DEFINE_CID(kCParserCID, NS_PARSER_CID);
|
|
|
|
|
|
|
|
// From /widget/HTMLConverter
|
|
|
|
//
|
|
|
|
// Takes HTML and converts it to plain text but in unicode.
|
|
|
|
//
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsScriptableUnescapeHTML::Unescape(const nsAString & aFromStr,
|
|
|
|
nsAString & aToStr)
|
|
|
|
{
|
|
|
|
// create the parser to do the conversion.
|
|
|
|
aToStr.SetLength(0);
|
|
|
|
nsresult rv;
|
|
|
|
nsCOMPtr<nsIParser> parser = do_CreateInstance(kCParserCID, &rv);
|
|
|
|
if (NS_FAILED(rv)) return rv;
|
|
|
|
|
|
|
|
// convert it!
|
|
|
|
nsCOMPtr<nsIContentSink> sink;
|
|
|
|
|
|
|
|
sink = do_CreateInstance(NS_PLAINTEXTSINK_CONTRACTID);
|
|
|
|
NS_ENSURE_TRUE(sink, NS_ERROR_FAILURE);
|
|
|
|
|
|
|
|
nsCOMPtr<nsIHTMLToTextSink> textSink(do_QueryInterface(sink));
|
|
|
|
NS_ENSURE_TRUE(textSink, NS_ERROR_FAILURE);
|
|
|
|
|
|
|
|
textSink->Initialize(&aToStr, nsIDocumentEncoder::OutputSelectionOnly
|
|
|
|
| nsIDocumentEncoder::OutputAbsoluteLinks, 0);
|
|
|
|
|
|
|
|
parser->SetContentSink(sink);
|
|
|
|
|
|
|
|
parser->Parse(aFromStr, 0, NS_LITERAL_CSTRING("text/html"),
|
|
|
|
PR_TRUE, eDTDMode_fragment);
|
|
|
|
|
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
// The feed version of nsContentUtils::CreateContextualFragment It
|
|
|
|
// creates a fragment, but doesn't go to all the effort to preserve
|
|
|
|
// context like innerHTML does, because feed DOMs shouldn't have that.
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsScriptableUnescapeHTML::ParseFragment(const nsAString &aFragment,
|
|
|
|
PRBool aIsXML,
|
|
|
|
nsIURI* aBaseURI,
|
|
|
|
nsIDOMElement* aContextElement,
|
|
|
|
nsIDOMDocumentFragment** aReturn)
|
|
|
|
{
|
|
|
|
NS_ENSURE_ARG(aContextElement);
|
|
|
|
*aReturn = nsnull;
|
|
|
|
|
|
|
|
nsresult rv;
|
|
|
|
nsCOMPtr<nsIParser> parser = do_CreateInstance(kCParserCID, &rv);
|
|
|
|
NS_ENSURE_SUCCESS(rv, rv);
|
|
|
|
|
|
|
|
nsCOMPtr<nsIDocument> document;
|
|
|
|
nsCOMPtr<nsIDOMDocument> domDocument;
|
|
|
|
nsCOMPtr<nsIDOMNode> contextNode;
|
|
|
|
contextNode = do_QueryInterface(aContextElement);
|
|
|
|
contextNode->GetOwnerDocument(getter_AddRefs(domDocument));
|
|
|
|
document = do_QueryInterface(domDocument);
|
|
|
|
NS_ENSURE_TRUE(document, NS_ERROR_NOT_AVAILABLE);
|
|
|
|
|
|
|
|
// stop scripts
|
|
|
|
nsRefPtr<nsScriptLoader> loader;
|
|
|
|
PRBool scripts_enabled = PR_FALSE;
|
|
|
|
if (document) {
|
2007-05-30 13:43:41 -07:00
|
|
|
loader = document->ScriptLoader();
|
|
|
|
scripts_enabled = loader->GetEnabled();
|
2007-03-22 10:30:00 -07:00
|
|
|
}
|
|
|
|
if (scripts_enabled) {
|
|
|
|
loader->SetEnabled(PR_FALSE);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Wrap things in a div or body for parsing, but it won't show up in
|
|
|
|
// the fragment.
|
2008-04-10 21:38:25 -07:00
|
|
|
nsAutoTArray<nsString, 2> tagStack;
|
2007-03-22 10:30:00 -07:00
|
|
|
nsCAutoString base, spec;
|
|
|
|
if (aIsXML) {
|
|
|
|
// XHTML
|
|
|
|
if (aBaseURI) {
|
|
|
|
base.Append(NS_LITERAL_CSTRING(XHTML_DIV_TAG));
|
|
|
|
base.Append(NS_LITERAL_CSTRING(" xml:base=\""));
|
|
|
|
aBaseURI->GetSpec(spec);
|
|
|
|
// nsEscapeHTML is good enough, because we only need to get
|
|
|
|
// quotes, ampersands, and angle brackets
|
|
|
|
char* escapedSpec = nsEscapeHTML(spec.get());
|
|
|
|
if (escapedSpec)
|
|
|
|
base += escapedSpec;
|
|
|
|
NS_Free(escapedSpec);
|
|
|
|
base.Append(NS_LITERAL_CSTRING("\""));
|
2007-11-12 18:01:13 -08:00
|
|
|
tagStack.AppendElement(NS_ConvertUTF8toUTF16(base));
|
2007-03-22 10:30:00 -07:00
|
|
|
} else {
|
2007-11-12 18:01:13 -08:00
|
|
|
tagStack.AppendElement(NS_LITERAL_STRING(XHTML_DIV_TAG));
|
2007-03-22 10:30:00 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (NS_SUCCEEDED(rv)) {
|
2011-07-29 04:48:04 -07:00
|
|
|
nsCOMPtr<nsIContent> fragment;
|
2007-03-22 10:30:00 -07:00
|
|
|
if (aIsXML) {
|
2011-08-01 00:48:24 -07:00
|
|
|
rv = nsContentUtils::ParseFragmentXML(aFragment,
|
|
|
|
document,
|
|
|
|
tagStack,
|
2011-08-01 00:48:28 -07:00
|
|
|
PR_TRUE,
|
2011-08-01 00:48:24 -07:00
|
|
|
aReturn);
|
|
|
|
fragment = do_QueryInterface(*aReturn);
|
2007-03-22 10:30:00 -07:00
|
|
|
} else {
|
2011-07-29 04:48:04 -07:00
|
|
|
NS_NewDocumentFragment(aReturn,
|
|
|
|
document->NodeInfoManager());
|
|
|
|
fragment = do_QueryInterface(*aReturn);
|
2011-08-01 00:48:24 -07:00
|
|
|
nsContentUtils::ParseFragmentHTML(aFragment,
|
|
|
|
fragment,
|
|
|
|
nsGkAtoms::body,
|
|
|
|
kNameSpaceID_XHTML,
|
|
|
|
PR_FALSE,
|
|
|
|
PR_TRUE);
|
2011-07-29 04:48:04 -07:00
|
|
|
// Now, set the base URI on all subtree roots.
|
|
|
|
aBaseURI->GetSpec(spec);
|
|
|
|
nsAutoString spec16;
|
|
|
|
CopyUTF8toUTF16(spec, spec16);
|
|
|
|
nsIContent* node = fragment->GetFirstChild();
|
|
|
|
while (node) {
|
|
|
|
if (node->IsElement()) {
|
|
|
|
node->SetAttr(kNameSpaceID_XML,
|
|
|
|
nsGkAtoms::base,
|
|
|
|
nsGkAtoms::xml,
|
|
|
|
spec16,
|
|
|
|
PR_FALSE);
|
|
|
|
}
|
|
|
|
node = node->GetNextSibling();
|
|
|
|
}
|
2007-03-22 10:30:00 -07:00
|
|
|
}
|
2011-07-29 04:48:04 -07:00
|
|
|
if (fragment) {
|
|
|
|
nsTreeSanitizer sanitizer(PR_FALSE, PR_FALSE);
|
|
|
|
sanitizer.Sanitize(fragment);
|
2007-03-22 10:30:00 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (scripts_enabled)
|
|
|
|
loader->SetEnabled(PR_TRUE);
|
|
|
|
|
|
|
|
return rv;
|
|
|
|
}
|