2009-06-29 02:44:22 +04:00
|
|
|
/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
|
|
|
|
/* vim: set sw=2 ts=2 et tw=79: */
|
|
|
|
/* ***** BEGIN LICENSE BLOCK *****
|
|
|
|
* Version: MPL 1.1/GPL 2.0/LGPL 2.1
|
|
|
|
*
|
|
|
|
* The contents of this file are subject to the Mozilla Public License Version
|
|
|
|
* 1.1 (the "License"); you may not use this file except in compliance with
|
|
|
|
* the License. You may obtain a copy of the License at
|
|
|
|
* http://www.mozilla.org/MPL/
|
|
|
|
*
|
|
|
|
* Software distributed under the License is distributed on an "AS IS" basis,
|
|
|
|
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
|
|
|
|
* for the specific language governing rights and limitations under the
|
|
|
|
* License.
|
|
|
|
*
|
|
|
|
* The Original Code is mozilla.org code.
|
|
|
|
*
|
|
|
|
* The Initial Developer of the Original Code is
|
|
|
|
* Netscape Communications Corporation.
|
|
|
|
* Portions created by the Initial Developer are Copyright (C) 1998
|
|
|
|
* the Initial Developer. All Rights Reserved.
|
|
|
|
*
|
|
|
|
* Contributor(s):
|
|
|
|
* Pierre Phaneuf <pp@ludusdesign.com>
|
|
|
|
* Henri Sivonen <hsivonen@iki.fi>
|
|
|
|
*
|
|
|
|
* Alternatively, the contents of this file may be used under the terms of
|
|
|
|
* either of the GNU General Public License Version 2 or later (the "GPL"),
|
|
|
|
* or the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
|
|
|
|
* in which case the provisions of the GPL or the LGPL are applicable instead
|
|
|
|
* of those above. If you wish to allow use of your version of this file only
|
|
|
|
* under the terms of either the GPL or the LGPL, and not to allow others to
|
|
|
|
* use your version of this file under the terms of the MPL, indicate your
|
|
|
|
* decision by deleting the provisions above and replace them with the notice
|
|
|
|
* and other provisions required by the GPL or the LGPL. If you do not delete
|
|
|
|
* the provisions above, a recipient may use your version of this file under
|
|
|
|
* the terms of any one of the MPL, the GPL or the LGPL.
|
|
|
|
*
|
|
|
|
* ***** END LICENSE BLOCK ***** */
|
|
|
|
|
|
|
|
#include "nsCompatibility.h"
|
|
|
|
#include "nsScriptLoader.h"
|
|
|
|
#include "nsNetUtil.h"
|
|
|
|
#include "nsIStyleSheetLinkingElement.h"
|
|
|
|
#include "nsICharsetAlias.h"
|
|
|
|
#include "nsIWebShellServices.h"
|
|
|
|
#include "nsIDocShell.h"
|
|
|
|
#include "nsEncoderDecoderUtils.h"
|
|
|
|
#include "nsContentUtils.h"
|
|
|
|
#include "nsICharsetDetector.h"
|
|
|
|
#include "nsIScriptElement.h"
|
|
|
|
#include "nsIMarkupDocumentViewer.h"
|
|
|
|
#include "nsIDocShellTreeItem.h"
|
|
|
|
#include "nsIContentViewer.h"
|
|
|
|
#include "nsIScriptGlobalObjectOwner.h"
|
|
|
|
#include "nsIScriptSecurityManager.h"
|
|
|
|
#include "nsHtml5DocumentMode.h"
|
|
|
|
#include "nsHtml5Tokenizer.h"
|
|
|
|
#include "nsHtml5UTF16Buffer.h"
|
|
|
|
#include "nsHtml5TreeBuilder.h"
|
|
|
|
#include "nsHtml5Parser.h"
|
2009-09-21 15:43:43 +04:00
|
|
|
#include "nsHtml5AtomTable.h"
|
2010-03-09 15:39:32 +03:00
|
|
|
#include "nsICharsetAlias.h"
|
|
|
|
|
|
|
|
static NS_DEFINE_CID(kCharsetAliasCID, NS_CHARSETALIAS_CID);
|
2009-06-29 02:44:22 +04:00
|
|
|
|
2009-09-18 13:21:47 +04:00
|
|
|
NS_INTERFACE_TABLE_HEAD(nsHtml5Parser)
|
2009-10-15 15:29:11 +04:00
|
|
|
NS_INTERFACE_TABLE2(nsHtml5Parser, nsIParser, nsISupportsWeakReference)
|
2009-09-18 13:21:47 +04:00
|
|
|
NS_INTERFACE_TABLE_TO_MAP_SEGUE_CYCLE_COLLECTION(nsHtml5Parser)
|
|
|
|
NS_INTERFACE_MAP_END
|
2009-06-29 02:44:22 +04:00
|
|
|
|
2009-09-18 13:21:47 +04:00
|
|
|
NS_IMPL_CYCLE_COLLECTING_ADDREF(nsHtml5Parser)
|
|
|
|
NS_IMPL_CYCLE_COLLECTING_RELEASE(nsHtml5Parser)
|
2009-06-29 02:44:22 +04:00
|
|
|
|
2009-09-18 13:21:47 +04:00
|
|
|
NS_IMPL_CYCLE_COLLECTION_CLASS(nsHtml5Parser)
|
2009-06-29 02:44:22 +04:00
|
|
|
|
2009-09-18 13:21:47 +04:00
|
|
|
NS_IMPL_CYCLE_COLLECTION_TRAVERSE_BEGIN(nsHtml5Parser)
|
|
|
|
NS_IMPL_CYCLE_COLLECTION_TRAVERSE_NSCOMPTR_AMBIGUOUS(mExecutor, nsIContentSink)
|
|
|
|
NS_IMPL_CYCLE_COLLECTION_TRAVERSE_NSCOMPTR_AMBIGUOUS(mStreamParser, nsIStreamListener)
|
2009-06-29 02:44:22 +04:00
|
|
|
NS_IMPL_CYCLE_COLLECTION_TRAVERSE_END
|
|
|
|
|
2009-09-18 13:21:47 +04:00
|
|
|
NS_IMPL_CYCLE_COLLECTION_UNLINK_BEGIN(nsHtml5Parser)
|
|
|
|
NS_IMPL_CYCLE_COLLECTION_UNLINK_NSCOMPTR(mExecutor)
|
|
|
|
NS_IMPL_CYCLE_COLLECTION_UNLINK_NSCOMPTR(mStreamParser)
|
2009-06-29 02:44:22 +04:00
|
|
|
NS_IMPL_CYCLE_COLLECTION_UNLINK_END
|
|
|
|
|
|
|
|
nsHtml5Parser::nsHtml5Parser()
|
2009-09-18 13:21:47 +04:00
|
|
|
: mFirstBuffer(new nsHtml5UTF16Buffer(0))
|
|
|
|
, mLastBuffer(mFirstBuffer)
|
|
|
|
, mExecutor(new nsHtml5TreeOpExecutor())
|
2010-02-02 10:43:18 +03:00
|
|
|
, mTreeBuilder(new nsHtml5TreeBuilder(mExecutor, nsnull))
|
2009-09-18 13:21:47 +04:00
|
|
|
, mTokenizer(new nsHtml5Tokenizer(mTreeBuilder))
|
2009-10-28 16:48:37 +03:00
|
|
|
, mRootContextLineNumber(1)
|
2009-06-29 02:44:22 +04:00
|
|
|
{
|
2009-09-21 17:18:20 +04:00
|
|
|
mAtomTable.Init(); // we aren't checking for OOM anyway...
|
|
|
|
mTokenizer->setInterner(&mAtomTable);
|
2009-06-29 02:44:22 +04:00
|
|
|
// There's a zeroing operator new for everything else
|
|
|
|
}
|
|
|
|
|
|
|
|
nsHtml5Parser::~nsHtml5Parser()
|
|
|
|
{
|
2009-09-21 17:18:20 +04:00
|
|
|
mTokenizer->end();
|
2009-10-12 17:08:04 +04:00
|
|
|
mFirstBuffer = nsnull;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(void)
|
|
|
|
nsHtml5Parser::SetContentSink(nsIContentSink* aSink)
|
|
|
|
{
|
2009-09-18 13:21:47 +04:00
|
|
|
NS_ASSERTION(aSink == static_cast<nsIContentSink*> (mExecutor),
|
2009-07-15 15:30:33 +04:00
|
|
|
"Attempt to set a foreign sink.");
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(nsIContentSink*)
|
|
|
|
nsHtml5Parser::GetContentSink(void)
|
|
|
|
{
|
2009-09-18 13:21:47 +04:00
|
|
|
return static_cast<nsIContentSink*> (mExecutor);
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(void)
|
|
|
|
nsHtml5Parser::GetCommand(nsCString& aCommand)
|
|
|
|
{
|
|
|
|
aCommand.Assign("view");
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(void)
|
|
|
|
nsHtml5Parser::SetCommand(const char* aCommand)
|
|
|
|
{
|
|
|
|
NS_ASSERTION(!strcmp(aCommand, "view"), "Parser command was not view");
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(void)
|
|
|
|
nsHtml5Parser::SetCommand(eParserCommands aParserCommand)
|
|
|
|
{
|
2009-07-15 15:30:33 +04:00
|
|
|
NS_ASSERTION(aParserCommand == eViewNormal,
|
|
|
|
"Parser command was not eViewNormal.");
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(void)
|
|
|
|
nsHtml5Parser::SetDocumentCharset(const nsACString& aCharset, PRInt32 aCharsetSource)
|
|
|
|
{
|
2009-10-12 17:08:04 +04:00
|
|
|
NS_PRECONDITION(!mExecutor->HasStarted(),
|
2009-09-18 13:21:47 +04:00
|
|
|
"Document charset set too late.");
|
|
|
|
NS_PRECONDITION(mStreamParser, "Tried to set charset on a script-only parser.");
|
|
|
|
mStreamParser->SetDocumentCharset(aCharset, aCharsetSource);
|
2010-03-09 15:39:32 +03:00
|
|
|
mExecutor->SetDocumentCharsetAndSource((nsACString&)aCharset, aCharsetSource);
|
|
|
|
mCharsetSource = aCharsetSource; // used for the document.open() case only
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(void)
|
|
|
|
nsHtml5Parser::SetParserFilter(nsIParserFilter* aFilter)
|
|
|
|
{
|
|
|
|
NS_ERROR("Attempt to set a parser filter on HTML5 parser.");
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::GetChannel(nsIChannel** aChannel)
|
|
|
|
{
|
2009-09-18 13:21:47 +04:00
|
|
|
if (mStreamParser) {
|
|
|
|
return mStreamParser->GetChannel(aChannel);
|
|
|
|
} else {
|
|
|
|
return NS_ERROR_NOT_AVAILABLE;
|
|
|
|
}
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::GetDTD(nsIDTD** aDTD)
|
|
|
|
{
|
|
|
|
*aDTD = nsnull;
|
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
|
2009-09-18 13:21:47 +04:00
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::GetStreamListener(nsIStreamListener** aListener)
|
|
|
|
{
|
2009-10-15 15:29:11 +04:00
|
|
|
NS_IF_ADDREF(*aListener = mStreamParser);
|
2009-09-18 13:21:47 +04:00
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
|
2009-06-29 02:44:22 +04:00
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::ContinueInterruptedParsing()
|
|
|
|
{
|
|
|
|
// If there are scripts executing, then the content sink is jumping the gun
|
|
|
|
// (probably due to a synchronous XMLHttpRequest) and will re-enable us
|
|
|
|
// later, see bug 460706.
|
2009-09-18 13:21:47 +04:00
|
|
|
if (mExecutor->IsScriptExecuting()) {
|
2009-06-29 02:44:22 +04:00
|
|
|
return NS_OK;
|
|
|
|
}
|
2009-10-27 11:00:22 +03:00
|
|
|
if (mExecutor->IsFlushing()) {
|
|
|
|
// A nested event loop dequeued the continue event and there aren't
|
|
|
|
// scripts executing. What's currently causing the flush is running to
|
|
|
|
// completion or there will be a script later and the script will cause
|
|
|
|
// another continue event.
|
|
|
|
return NS_OK;
|
|
|
|
}
|
2009-06-29 02:44:22 +04:00
|
|
|
// If the stream has already finished, there's a good chance
|
|
|
|
// that we might start closing things down when the parser
|
|
|
|
// is reenabled. To make sure that we're not deleted across
|
|
|
|
// the reenabling process, hold a reference to ourselves.
|
|
|
|
nsCOMPtr<nsIParser> kungFuDeathGrip(this);
|
2009-09-18 13:21:47 +04:00
|
|
|
nsRefPtr<nsHtml5StreamParser> streamKungFuDeathGrip(mStreamParser);
|
|
|
|
nsRefPtr<nsHtml5TreeOpExecutor> treeOpKungFuDeathGrip(mExecutor);
|
2009-10-27 10:44:17 +03:00
|
|
|
ParseUntilBlocked();
|
2009-06-29 02:44:22 +04:00
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(void)
|
|
|
|
nsHtml5Parser::BlockParser()
|
|
|
|
{
|
2009-09-18 13:21:47 +04:00
|
|
|
mBlocked = PR_TRUE;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(void)
|
|
|
|
nsHtml5Parser::UnblockParser()
|
|
|
|
{
|
|
|
|
mBlocked = PR_FALSE;
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(PRBool)
|
|
|
|
nsHtml5Parser::IsParserEnabled()
|
|
|
|
{
|
|
|
|
return !mBlocked;
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP_(PRBool)
|
|
|
|
nsHtml5Parser::IsComplete()
|
|
|
|
{
|
2009-09-18 13:21:47 +04:00
|
|
|
return mExecutor->IsComplete();
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::Parse(nsIURI* aURL, // legacy parameter; ignored
|
|
|
|
nsIRequestObserver* aObserver,
|
|
|
|
void* aKey,
|
|
|
|
nsDTDMode aMode) // legacy; ignored
|
|
|
|
{
|
2009-09-18 13:21:47 +04:00
|
|
|
/*
|
|
|
|
* Do NOT cause WillBuildModel to be called synchronously from here!
|
|
|
|
* The document won't be ready for it until OnStartRequest!
|
|
|
|
*/
|
2009-10-12 17:08:04 +04:00
|
|
|
NS_PRECONDITION(!mExecutor->HasStarted(),
|
2009-07-15 15:30:33 +04:00
|
|
|
"Tried to start parse without initializing the parser properly.");
|
2009-10-15 15:29:11 +04:00
|
|
|
NS_PRECONDITION(mStreamParser,
|
|
|
|
"Can't call this variant of Parse() on script-created parser");
|
2009-09-18 13:21:47 +04:00
|
|
|
mStreamParser->SetObserver(aObserver);
|
|
|
|
mExecutor->SetStreamParser(mStreamParser);
|
|
|
|
mExecutor->SetParser(this);
|
|
|
|
mRootContextKey = aKey;
|
2009-06-29 02:44:22 +04:00
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::Parse(const nsAString& aSourceBuffer,
|
|
|
|
void* aKey,
|
|
|
|
const nsACString& aContentType, // ignored
|
|
|
|
PRBool aLastCall,
|
|
|
|
nsDTDMode aMode) // ignored
|
|
|
|
{
|
2009-11-06 16:06:48 +03:00
|
|
|
NS_PRECONDITION(!mExecutor->IsFragmentMode(), "Document.write called in fragment mode!");
|
2009-09-18 13:21:47 +04:00
|
|
|
|
|
|
|
// Maintain a reference to ourselves so we don't go away
|
|
|
|
// till we're completely done. The old parser grips itself in this method.
|
|
|
|
nsCOMPtr<nsIParser> kungFuDeathGrip(this);
|
|
|
|
|
|
|
|
// Gripping the other objects just in case, since the other old grip
|
|
|
|
// required grips to these, too.
|
|
|
|
nsRefPtr<nsHtml5StreamParser> streamKungFuDeathGrip(mStreamParser);
|
|
|
|
nsRefPtr<nsHtml5TreeOpExecutor> treeOpKungFuDeathGrip(mExecutor);
|
|
|
|
|
2009-06-29 02:44:22 +04:00
|
|
|
// Return early if the parser has processed EOF
|
2009-10-12 17:08:04 +04:00
|
|
|
if (!mExecutor->HasStarted()) {
|
|
|
|
NS_ASSERTION(!mStreamParser,
|
|
|
|
"Had stream parser but document.write started life cycle.");
|
2010-03-09 15:39:32 +03:00
|
|
|
// This is the first document.write() on a document.open()ed document
|
2009-10-12 17:08:04 +04:00
|
|
|
mExecutor->SetParser(this);
|
2010-03-09 15:39:32 +03:00
|
|
|
mTokenizer->setEncodingDeclarationHandler(this);
|
2009-10-12 17:08:04 +04:00
|
|
|
mTreeBuilder->setScriptingEnabled(mExecutor->IsScriptEnabled());
|
|
|
|
mTokenizer->start();
|
|
|
|
mExecutor->Start();
|
|
|
|
/*
|
|
|
|
* If you move the following line, be very careful not to cause
|
|
|
|
* WillBuildModel to be called before the document has had its
|
|
|
|
* script global object set.
|
|
|
|
*/
|
|
|
|
mExecutor->WillBuildModel(eDTDMode_unknown);
|
|
|
|
}
|
|
|
|
if (mExecutor->IsComplete()) {
|
|
|
|
return NS_OK;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
if (aLastCall && aSourceBuffer.IsEmpty() && aKey == GetRootContextKey()) {
|
|
|
|
// document.close()
|
2009-10-27 10:44:17 +03:00
|
|
|
NS_ASSERTION(!mStreamParser,
|
|
|
|
"Had stream parser but got document.close().");
|
2009-09-21 17:18:20 +04:00
|
|
|
mDocumentClosed = PR_TRUE;
|
2009-10-27 10:44:17 +03:00
|
|
|
if (!mBlocked) {
|
|
|
|
ParseUntilBlocked();
|
|
|
|
}
|
2009-06-29 02:44:22 +04:00
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
|
2009-10-15 15:29:11 +04:00
|
|
|
NS_PRECONDITION(IsInsertionPointDefined(),
|
|
|
|
"Document.write called when insertion point not defined.");
|
|
|
|
|
2009-10-28 16:48:37 +03:00
|
|
|
NS_PRECONDITION(!(mStreamParser && !aKey), "Got a null key in a non-script-created parser");
|
|
|
|
|
2009-10-15 15:29:11 +04:00
|
|
|
if (aSourceBuffer.IsEmpty()) {
|
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
nsRefPtr<nsHtml5UTF16Buffer> buffer = new nsHtml5UTF16Buffer(aSourceBuffer.Length());
|
|
|
|
memcpy(buffer->getBuffer(), aSourceBuffer.BeginReading(), aSourceBuffer.Length() * sizeof(PRUnichar));
|
|
|
|
buffer->setEnd(aSourceBuffer.Length());
|
|
|
|
|
|
|
|
// The buffer is inserted to the stream here in case it won't be parsed
|
|
|
|
// to completion.
|
|
|
|
// The script is identified by aKey. If there's nothing in the buffer
|
|
|
|
// chain for that key, we'll insert at the head of the queue.
|
|
|
|
// When the script leaves something in the queue, a zero-length
|
|
|
|
// key-holder "buffer" is inserted in the queue. If the same script
|
|
|
|
// leaves something in the chain again, it will be inserted immediately
|
|
|
|
// before the old key holder belonging to the same script.
|
|
|
|
nsHtml5UTF16Buffer* prevSearchBuf = nsnull;
|
|
|
|
nsHtml5UTF16Buffer* searchBuf = mFirstBuffer;
|
|
|
|
if (aKey) { // after document.open, the first level of document.write has null key
|
|
|
|
while (searchBuf != mLastBuffer) {
|
|
|
|
if (searchBuf->key == aKey) {
|
|
|
|
// found a key holder
|
|
|
|
// now insert the new buffer between the previous buffer
|
|
|
|
// and the key holder.
|
|
|
|
buffer->next = searchBuf;
|
|
|
|
if (prevSearchBuf) {
|
|
|
|
prevSearchBuf->next = buffer;
|
|
|
|
} else {
|
|
|
|
mFirstBuffer = buffer;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
2009-10-15 15:29:11 +04:00
|
|
|
break;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
2009-10-15 15:29:11 +04:00
|
|
|
prevSearchBuf = searchBuf;
|
|
|
|
searchBuf = searchBuf->next;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
2010-01-18 16:39:17 +03:00
|
|
|
if (searchBuf == mLastBuffer) {
|
|
|
|
// key was not found
|
|
|
|
nsHtml5UTF16Buffer* keyHolder = new nsHtml5UTF16Buffer(aKey);
|
|
|
|
keyHolder->next = mFirstBuffer;
|
|
|
|
buffer->next = keyHolder;
|
|
|
|
mFirstBuffer = buffer;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// we have a first level document.write after document.open()
|
|
|
|
// insert immediately before mLastBuffer
|
|
|
|
while (searchBuf != mLastBuffer) {
|
|
|
|
prevSearchBuf = searchBuf;
|
|
|
|
searchBuf = searchBuf->next;
|
|
|
|
}
|
|
|
|
buffer->next = mLastBuffer;
|
|
|
|
if (prevSearchBuf) {
|
|
|
|
prevSearchBuf->next = buffer;
|
|
|
|
} else {
|
|
|
|
mFirstBuffer = buffer;
|
|
|
|
}
|
2009-10-15 15:29:11 +04:00
|
|
|
}
|
2009-06-29 02:44:22 +04:00
|
|
|
|
2009-10-15 15:29:11 +04:00
|
|
|
if (!mBlocked) {
|
|
|
|
// mExecutor->WillResume();
|
|
|
|
while (buffer->hasMore()) {
|
|
|
|
buffer->adjust(mLastWasCR);
|
|
|
|
mLastWasCR = PR_FALSE;
|
|
|
|
if (buffer->hasMore()) {
|
2009-10-28 16:48:37 +03:00
|
|
|
|
|
|
|
PRInt32 lineNumberSave;
|
|
|
|
PRBool inRootContext = (!mStreamParser && (aKey == mRootContextKey));
|
|
|
|
if (inRootContext) {
|
|
|
|
mTokenizer->setLineNumber(mRootContextLineNumber);
|
|
|
|
} else {
|
|
|
|
// we aren't the root context, so save the line number on the
|
|
|
|
// *stack* so that we can restore it.
|
|
|
|
lineNumberSave = mTokenizer->getLineNumber();
|
|
|
|
}
|
|
|
|
|
2009-10-15 15:29:11 +04:00
|
|
|
mLastWasCR = mTokenizer->tokenizeBuffer(buffer);
|
2009-10-28 16:48:37 +03:00
|
|
|
|
|
|
|
if (inRootContext) {
|
|
|
|
mRootContextLineNumber = mTokenizer->getLineNumber();
|
|
|
|
} else {
|
|
|
|
mTokenizer->setLineNumber(lineNumberSave);
|
|
|
|
}
|
|
|
|
|
2009-10-15 15:29:11 +04:00
|
|
|
if (mTreeBuilder->HasScript()) {
|
|
|
|
// No need to flush characters, because an end tag was tokenized last
|
|
|
|
mTreeBuilder->Flush(); // Move ops to the executor
|
2010-01-14 16:58:27 +03:00
|
|
|
mExecutor->Flush(PR_TRUE); // run the ops
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
2009-10-15 15:29:11 +04:00
|
|
|
if (mBlocked) {
|
|
|
|
// mExecutor->WillInterrupt();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
// Ignore suspension requests
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2009-10-15 15:29:11 +04:00
|
|
|
if (!mBlocked) { // buffer was tokenized to completion
|
2009-10-28 16:48:37 +03:00
|
|
|
NS_ASSERTION(!buffer->hasMore(), "Buffer wasn't tokenized to completion?");
|
2009-10-15 15:29:11 +04:00
|
|
|
// Scripting semantics require a forced tree builder flush here
|
|
|
|
mTreeBuilder->flushCharacters(); // Flush trailing characters
|
|
|
|
mTreeBuilder->Flush(); // Move ops to the executor
|
2010-01-14 16:58:27 +03:00
|
|
|
mExecutor->Flush(PR_TRUE); // run the ops
|
2009-10-15 15:29:11 +04:00
|
|
|
}
|
|
|
|
|
2009-06-29 02:44:22 +04:00
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* This magic value is passed to the previous method on document.close()
|
|
|
|
*/
|
|
|
|
NS_IMETHODIMP_(void *)
|
|
|
|
nsHtml5Parser::GetRootContextKey()
|
|
|
|
{
|
|
|
|
return mRootContextKey;
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::Terminate(void)
|
|
|
|
{
|
|
|
|
// We should only call DidBuildModel once, so don't do anything if this is
|
|
|
|
// the second time that Terminate has been called.
|
2009-10-12 17:08:04 +04:00
|
|
|
if (mExecutor->IsComplete()) {
|
2009-06-29 02:44:22 +04:00
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
// XXX - [ until we figure out a way to break parser-sink circularity ]
|
|
|
|
// Hack - Hold a reference until we are completely done...
|
|
|
|
nsCOMPtr<nsIParser> kungFuDeathGrip(this);
|
2009-09-18 13:21:47 +04:00
|
|
|
nsRefPtr<nsHtml5StreamParser> streamKungFuDeathGrip(mStreamParser);
|
|
|
|
nsRefPtr<nsHtml5TreeOpExecutor> treeOpKungFuDeathGrip(mExecutor);
|
2009-09-21 17:18:20 +04:00
|
|
|
if (mStreamParser) {
|
|
|
|
mStreamParser->Terminate();
|
|
|
|
}
|
2009-10-02 15:13:59 +04:00
|
|
|
return mExecutor->DidBuildModel(PR_TRUE);
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::ParseFragment(const nsAString& aSourceBuffer,
|
|
|
|
void* aKey,
|
|
|
|
nsTArray<nsString>& aTagStack,
|
|
|
|
PRBool aXMLMode,
|
|
|
|
const nsACString& aContentType,
|
|
|
|
nsDTDMode aMode)
|
|
|
|
{
|
|
|
|
return NS_ERROR_NOT_IMPLEMENTED;
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::ParseFragment(const nsAString& aSourceBuffer,
|
|
|
|
nsISupports* aTargetNode,
|
|
|
|
nsIAtom* aContextLocalName,
|
|
|
|
PRInt32 aContextNamespace,
|
|
|
|
PRBool aQuirks)
|
|
|
|
{
|
|
|
|
nsCOMPtr<nsIContent> target = do_QueryInterface(aTargetNode);
|
|
|
|
NS_ASSERTION(target, "Target did not QI to nsIContent");
|
2009-07-15 15:28:27 +04:00
|
|
|
|
|
|
|
nsIDocument* doc = target->GetOwnerDoc();
|
|
|
|
NS_ENSURE_TRUE(doc, NS_ERROR_NOT_AVAILABLE);
|
|
|
|
|
|
|
|
nsIURI* uri = doc->GetDocumentURI();
|
|
|
|
NS_ENSURE_TRUE(uri, NS_ERROR_NOT_AVAILABLE);
|
|
|
|
|
2009-09-21 15:43:43 +04:00
|
|
|
nsCOMPtr<nsISupports> container = doc->GetContainer();
|
2010-02-22 15:17:31 +03:00
|
|
|
// Can be null if owner document is synthetic
|
2009-09-21 15:43:43 +04:00
|
|
|
|
|
|
|
Initialize(doc, uri, container, nsnull);
|
2009-07-15 15:28:27 +04:00
|
|
|
|
|
|
|
// Initialize() doesn't deal with base URI
|
2009-09-18 13:21:47 +04:00
|
|
|
mExecutor->SetBaseUriFromDocument();
|
|
|
|
mExecutor->SetParser(this);
|
|
|
|
mExecutor->SetNodeInfoManager(target->GetOwnerDoc()->NodeInfoManager());
|
2009-07-15 15:28:27 +04:00
|
|
|
|
2009-09-21 15:43:43 +04:00
|
|
|
nsIContent* weakTarget = target;
|
|
|
|
mTreeBuilder->setFragmentContext(aContextLocalName, aContextNamespace, &weakTarget, aQuirks);
|
2009-11-06 16:06:48 +03:00
|
|
|
mExecutor->EnableFragmentMode();
|
2009-09-18 13:21:47 +04:00
|
|
|
|
2009-10-12 17:08:04 +04:00
|
|
|
NS_PRECONDITION(!mExecutor->HasStarted(), "Tried to start parse without initializing the parser properly.");
|
2009-09-18 13:21:47 +04:00
|
|
|
mTreeBuilder->setScriptingEnabled(mExecutor->IsScriptEnabled());
|
2009-06-29 02:44:22 +04:00
|
|
|
mTokenizer->start();
|
2009-09-21 17:18:20 +04:00
|
|
|
mExecutor->Start(); // Don't call WillBuildModel in fragment case
|
2009-06-29 02:44:22 +04:00
|
|
|
if (!aSourceBuffer.IsEmpty()) {
|
|
|
|
PRBool lastWasCR = PR_FALSE;
|
|
|
|
nsHtml5UTF16Buffer buffer(aSourceBuffer.Length());
|
|
|
|
memcpy(buffer.getBuffer(), aSourceBuffer.BeginReading(), aSourceBuffer.Length() * sizeof(PRUnichar));
|
|
|
|
buffer.setEnd(aSourceBuffer.Length());
|
|
|
|
while (buffer.hasMore()) {
|
|
|
|
buffer.adjust(lastWasCR);
|
|
|
|
lastWasCR = PR_FALSE;
|
|
|
|
if (buffer.hasMore()) {
|
|
|
|
lastWasCR = mTokenizer->tokenizeBuffer(&buffer);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
mTokenizer->eof();
|
2009-09-21 17:18:20 +04:00
|
|
|
mTreeBuilder->StreamEnded();
|
|
|
|
mTreeBuilder->Flush();
|
2010-01-14 16:58:27 +03:00
|
|
|
mExecutor->Flush(PR_TRUE);
|
2009-08-27 11:57:57 +04:00
|
|
|
mTokenizer->end();
|
2009-09-18 13:21:47 +04:00
|
|
|
mExecutor->DropParserAndPerfHint();
|
2009-09-21 17:18:20 +04:00
|
|
|
mAtomTable.Clear();
|
2009-06-29 02:44:22 +04:00
|
|
|
return NS_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::BuildModel(void)
|
|
|
|
{
|
2009-09-21 17:18:20 +04:00
|
|
|
NS_NOTREACHED("Don't call this!");
|
|
|
|
return NS_ERROR_NOT_IMPLEMENTED;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
NS_IMETHODIMP
|
|
|
|
nsHtml5Parser::CancelParsingEvents()
|
|
|
|
{
|
2009-10-27 11:00:22 +03:00
|
|
|
NS_NOTREACHED("Don't call this!");
|
|
|
|
return NS_ERROR_NOT_IMPLEMENTED;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
nsHtml5Parser::Reset()
|
|
|
|
{
|
2009-09-18 13:21:47 +04:00
|
|
|
mExecutor->Reset();
|
2009-07-15 15:30:33 +04:00
|
|
|
mLastWasCR = PR_FALSE;
|
2009-09-18 13:21:47 +04:00
|
|
|
UnblockParser();
|
2009-09-21 17:18:20 +04:00
|
|
|
mDocumentClosed = PR_FALSE;
|
2009-09-18 13:21:47 +04:00
|
|
|
mStreamParser = nsnull;
|
2009-10-28 16:48:37 +03:00
|
|
|
mRootContextLineNumber = 1;
|
2009-10-15 15:29:11 +04:00
|
|
|
mParserInsertedScriptsBeingEvaluated = 0;
|
2009-07-15 15:30:33 +04:00
|
|
|
mRootContextKey = nsnull;
|
2009-09-21 17:18:20 +04:00
|
|
|
mAtomTable.Clear(); // should be already cleared in the fragment case anyway
|
2009-07-15 15:30:33 +04:00
|
|
|
// Portable parser objects
|
2009-10-12 17:08:04 +04:00
|
|
|
mFirstBuffer->next = nsnull;
|
2009-07-15 15:30:33 +04:00
|
|
|
mFirstBuffer->setStart(0);
|
|
|
|
mFirstBuffer->setEnd(0);
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
PRBool
|
|
|
|
nsHtml5Parser::CanInterrupt()
|
|
|
|
{
|
2009-11-06 16:06:48 +03:00
|
|
|
return !mExecutor->IsFragmentMode();
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
2009-10-15 15:29:11 +04:00
|
|
|
PRBool
|
|
|
|
nsHtml5Parser::IsInsertionPointDefined()
|
|
|
|
{
|
|
|
|
return !mExecutor->IsFlushing() &&
|
|
|
|
(!mStreamParser || mParserInsertedScriptsBeingEvaluated);
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
nsHtml5Parser::BeginEvaluatingParserInsertedScript()
|
|
|
|
{
|
|
|
|
++mParserInsertedScriptsBeingEvaluated;
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
nsHtml5Parser::EndEvaluatingParserInsertedScript()
|
|
|
|
{
|
|
|
|
--mParserInsertedScriptsBeingEvaluated;
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
nsHtml5Parser::MarkAsNotScriptCreated()
|
|
|
|
{
|
|
|
|
NS_PRECONDITION(!mStreamParser, "Must not call this twice.");
|
|
|
|
mStreamParser = new nsHtml5StreamParser(mExecutor, this);
|
|
|
|
}
|
|
|
|
|
|
|
|
PRBool
|
|
|
|
nsHtml5Parser::IsScriptCreated()
|
|
|
|
{
|
|
|
|
return !mStreamParser;
|
|
|
|
}
|
|
|
|
|
2009-06-29 02:44:22 +04:00
|
|
|
/* End nsIParser */
|
|
|
|
|
|
|
|
// not from interface
|
|
|
|
void
|
2009-10-27 10:44:17 +03:00
|
|
|
nsHtml5Parser::ParseUntilBlocked()
|
2009-06-29 02:44:22 +04:00
|
|
|
{
|
2009-11-06 16:06:48 +03:00
|
|
|
NS_PRECONDITION(!mExecutor->IsFragmentMode(), "ParseUntilBlocked called in fragment mode.");
|
2009-06-29 02:44:22 +04:00
|
|
|
|
|
|
|
if (mBlocked) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2009-10-12 17:08:04 +04:00
|
|
|
if (mExecutor->IsComplete()) {
|
|
|
|
return;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
2009-10-12 17:08:04 +04:00
|
|
|
NS_ASSERTION(mExecutor->HasStarted(), "Bad life cycle.");
|
2009-06-29 02:44:22 +04:00
|
|
|
|
2009-09-18 13:21:47 +04:00
|
|
|
mExecutor->WillResume();
|
2009-06-29 02:44:22 +04:00
|
|
|
for (;;) {
|
|
|
|
if (!mFirstBuffer->hasMore()) {
|
|
|
|
if (mFirstBuffer == mLastBuffer) {
|
2009-10-12 17:08:04 +04:00
|
|
|
if (mExecutor->IsComplete()) {
|
|
|
|
// something like cache manisfests stopped the parse in mid-flight
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (mDocumentClosed) {
|
|
|
|
NS_ASSERTION(!mStreamParser,
|
|
|
|
"This should only happen with script-created parser.");
|
|
|
|
mTokenizer->eof();
|
|
|
|
mTreeBuilder->StreamEnded();
|
|
|
|
mTreeBuilder->Flush();
|
2010-01-14 16:58:27 +03:00
|
|
|
mExecutor->Flush(PR_TRUE);
|
2009-10-12 17:08:04 +04:00
|
|
|
mTokenizer->end();
|
|
|
|
return;
|
|
|
|
} else {
|
|
|
|
// never release the last buffer.
|
|
|
|
NS_ASSERTION(!mLastBuffer->getStart(),
|
|
|
|
"Sentinel buffer had its indeces changed.");
|
|
|
|
NS_ASSERTION(!mLastBuffer->getEnd(),
|
|
|
|
"Sentinel buffer had its indeces changed.");
|
|
|
|
if (mStreamParser &&
|
|
|
|
mReturnToStreamParserPermitted &&
|
|
|
|
!mExecutor->IsScriptExecuting()) {
|
2009-10-30 14:47:17 +03:00
|
|
|
mTreeBuilder->flushCharacters();
|
|
|
|
mTreeBuilder->Flush();
|
2009-10-12 17:08:04 +04:00
|
|
|
mReturnToStreamParserPermitted = PR_FALSE;
|
|
|
|
mStreamParser->ContinueAfterScripts(mTokenizer,
|
|
|
|
mTreeBuilder,
|
|
|
|
mLastWasCR);
|
|
|
|
}
|
|
|
|
return; // no more data for now but expecting more
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
mFirstBuffer = mFirstBuffer->next;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2009-10-12 17:08:04 +04:00
|
|
|
if (mBlocked || mExecutor->IsComplete()) {
|
2009-06-29 02:44:22 +04:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// now we have a non-empty buffer
|
|
|
|
mFirstBuffer->adjust(mLastWasCR);
|
|
|
|
mLastWasCR = PR_FALSE;
|
|
|
|
if (mFirstBuffer->hasMore()) {
|
2009-10-28 16:48:37 +03:00
|
|
|
PRBool inRootContext = (!mStreamParser && (mFirstBuffer->key == mRootContextKey));
|
|
|
|
if (inRootContext) {
|
|
|
|
mTokenizer->setLineNumber(mRootContextLineNumber);
|
|
|
|
}
|
2009-06-29 02:44:22 +04:00
|
|
|
mLastWasCR = mTokenizer->tokenizeBuffer(mFirstBuffer);
|
2009-10-28 16:48:37 +03:00
|
|
|
if (inRootContext) {
|
|
|
|
mRootContextLineNumber = mTokenizer->getLineNumber();
|
|
|
|
}
|
2009-09-21 17:18:20 +04:00
|
|
|
if (mTreeBuilder->HasScript()) {
|
|
|
|
mTreeBuilder->Flush();
|
2010-01-14 16:58:27 +03:00
|
|
|
mExecutor->Flush(PR_TRUE);
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
2009-09-21 17:18:20 +04:00
|
|
|
if (mBlocked) {
|
|
|
|
// mExecutor->WillInterrupt();
|
2009-06-29 02:44:22 +04:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2009-07-15 15:30:33 +04:00
|
|
|
continue;
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
nsresult
|
|
|
|
nsHtml5Parser::Initialize(nsIDocument* aDoc,
|
|
|
|
nsIURI* aURI,
|
|
|
|
nsISupports* aContainer,
|
|
|
|
nsIChannel* aChannel)
|
|
|
|
{
|
2009-09-18 13:21:47 +04:00
|
|
|
return mExecutor->Init(aDoc, aURI, aContainer, aChannel);
|
2009-06-29 02:44:22 +04:00
|
|
|
}
|
|
|
|
|
2009-09-21 17:18:20 +04:00
|
|
|
void
|
|
|
|
nsHtml5Parser::StartTokenizer(PRBool aScriptingEnabled) {
|
|
|
|
mTreeBuilder->setScriptingEnabled(aScriptingEnabled);
|
|
|
|
mTokenizer->start();
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
2009-10-28 16:48:37 +03:00
|
|
|
nsHtml5Parser::InitializeDocWriteParserState(nsAHtml5TreeBuilderState* aState, PRInt32 aLine)
|
2009-09-21 17:18:20 +04:00
|
|
|
{
|
|
|
|
mTokenizer->resetToDataState();
|
2009-10-28 16:48:37 +03:00
|
|
|
mTokenizer->setLineNumber(aLine);
|
2009-09-21 17:18:20 +04:00
|
|
|
mTreeBuilder->loadState(aState, &mAtomTable);
|
|
|
|
mLastWasCR = PR_FALSE;
|
2009-10-12 17:08:04 +04:00
|
|
|
mReturnToStreamParserPermitted = PR_TRUE;
|
2009-09-21 17:18:20 +04:00
|
|
|
}
|
2009-10-21 16:12:50 +04:00
|
|
|
|
|
|
|
void
|
|
|
|
nsHtml5Parser::ContinueAfterFailedCharsetSwitch()
|
|
|
|
{
|
|
|
|
NS_PRECONDITION(mStreamParser,
|
|
|
|
"Tried to continue after failed charset switch without a stream parser");
|
|
|
|
mStreamParser->ContinueAfterFailedCharsetSwitch();
|
|
|
|
}
|
2010-03-09 15:39:32 +03:00
|
|
|
|
|
|
|
void
|
|
|
|
nsHtml5Parser::internalEncodingDeclaration(nsString* aEncoding)
|
|
|
|
{
|
|
|
|
// Note: This handler is only installed when parsing a document.open()ed doc
|
|
|
|
// See bug 539887 and bug 255820.
|
|
|
|
if (mCharsetSource >= kCharsetFromMetaTag) { // this threshold corresponds to "confident" in the HTML5 spec
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
nsresult rv = NS_OK;
|
|
|
|
nsCOMPtr<nsICharsetAlias> calias(do_GetService(kCharsetAliasCID, &rv));
|
|
|
|
if (NS_FAILED(rv)) {
|
|
|
|
NS_NOTREACHED("Charset alias service not available.");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
nsCAutoString newEncoding;
|
|
|
|
CopyUTF16toUTF8(*aEncoding, newEncoding);
|
|
|
|
|
|
|
|
// XXX check HTML5 non-IANA aliases here
|
|
|
|
|
|
|
|
nsCAutoString preferred;
|
|
|
|
|
|
|
|
rv = calias->GetPreferred(newEncoding, preferred);
|
|
|
|
if (NS_FAILED(rv)) {
|
|
|
|
// the encoding name is bogus
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
mCharsetSource = kCharsetFromMetaTag;
|
|
|
|
mTreeBuilder->SetDocumentCharset(preferred, mCharsetSource);
|
|
|
|
}
|