2001-08-04 01:15:15 +04:00
|
|
|
/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
|
2001-09-26 04:40:45 +04:00
|
|
|
/* ***** BEGIN LICENSE BLOCK *****
|
2004-04-23 17:24:28 +04:00
|
|
|
* Version: MPL 1.1/GPL 2.0/LGPL 2.1
|
2001-08-04 01:15:15 +04:00
|
|
|
*
|
2004-04-23 17:24:28 +04:00
|
|
|
* The contents of this file are subject to the Mozilla Public License Version
|
|
|
|
* 1.1 (the "License"); you may not use this file except in compliance with
|
|
|
|
* the License. You may obtain a copy of the License at
|
|
|
|
* http://www.mozilla.org/MPL/
|
2001-09-26 04:40:45 +04:00
|
|
|
*
|
|
|
|
* Software distributed under the License is distributed on an "AS IS" basis,
|
|
|
|
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
|
|
|
|
* for the specific language governing rights and limitations under the
|
|
|
|
* License.
|
2001-08-04 01:15:15 +04:00
|
|
|
*
|
|
|
|
* The Original Code is mozilla.org code.
|
|
|
|
*
|
2004-04-23 17:24:28 +04:00
|
|
|
* The Initial Developer of the Original Code is
|
2001-09-26 04:40:45 +04:00
|
|
|
* Netscape Communications Corporation.
|
|
|
|
* Portions created by the Initial Developer are Copyright (C) 1998
|
|
|
|
* the Initial Developer. All Rights Reserved.
|
|
|
|
*
|
|
|
|
* Contributor(s):
|
|
|
|
*
|
|
|
|
* Alternatively, the contents of this file may be used under the terms of
|
2004-04-23 17:24:28 +04:00
|
|
|
* either of the GNU General Public License Version 2 or later (the "GPL"),
|
|
|
|
* or the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
|
2001-09-26 04:40:45 +04:00
|
|
|
* in which case the provisions of the GPL or the LGPL are applicable instead
|
|
|
|
* of those above. If you wish to allow use of your version of this file only
|
|
|
|
* under the terms of either the GPL or the LGPL, and not to allow others to
|
2004-04-23 17:24:28 +04:00
|
|
|
* use your version of this file under the terms of the MPL, indicate your
|
2001-09-26 04:40:45 +04:00
|
|
|
* decision by deleting the provisions above and replace them with the notice
|
|
|
|
* and other provisions required by the GPL or the LGPL. If you do not delete
|
|
|
|
* the provisions above, a recipient may use your version of this file under
|
2004-04-23 17:24:28 +04:00
|
|
|
* the terms of any one of the MPL, the GPL or the LGPL.
|
2001-08-04 01:15:15 +04:00
|
|
|
*
|
2001-09-26 04:40:45 +04:00
|
|
|
* ***** END LICENSE BLOCK ***** */
|
2001-08-04 01:15:15 +04:00
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* MODULE NOTES:
|
|
|
|
* @update gess 4/1/98
|
|
|
|
*
|
|
|
|
* This class defines the basic notion of a token
|
|
|
|
* within our system. All other tokens are derived from
|
|
|
|
* this one. It offers a few basic interfaces, but the
|
|
|
|
* most important is consume(). The consume() method gets
|
|
|
|
* called during the tokenization process when an instance
|
|
|
|
* of that particular token type gets detected in the
|
|
|
|
* input stream.
|
|
|
|
*
|
|
|
|
* CToken objects that are allocated from the heap _must_ be allocated
|
|
|
|
* using the nsTokenAllocator: the nsTokenAllocator object uses an
|
|
|
|
* arena to manage the tokens.
|
|
|
|
*
|
|
|
|
* The nsTokenAllocator object's arena implementation requires
|
|
|
|
* object size at destruction time to properly recycle the object;
|
|
|
|
* therefore, CToken::operator delete() is not public. Instead,
|
|
|
|
* heap-allocated tokens should be destroyed using the static
|
|
|
|
* Destroy() method, which accepts a token and the arena from which
|
|
|
|
* the token was allocated.
|
|
|
|
*
|
|
|
|
* Leaf classes (that are actually instantiated from the heap) must
|
|
|
|
* implement the SizeOf() method, which Destroy() uses to determine
|
|
|
|
* the size of the token in order to properly recycle it.
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
|
|
#ifndef CTOKEN__
|
|
|
|
#define CTOKEN__
|
|
|
|
|
|
|
|
#include "prtypes.h"
|
|
|
|
#include "nsString.h"
|
|
|
|
#include "nsError.h"
|
|
|
|
#include "nsFixedSizeAllocator.h"
|
|
|
|
|
|
|
|
// Parser-specific result code produced by NS_ERROR_GENERATE_SUCCESS for
// module NS_ERROR_MODULE_HTMLPARSER with code 2000.
// NOTE(review): judging by the name, this reports that scanned text turned
// out not to be an entity -- confirm at the use sites.
#define NS_HTMLTOKENS_NOT_AN_ENTITY                            \
  NS_ERROR_GENERATE_SUCCESS(NS_ERROR_MODULE_HTMLPARSER, 2000)
|
|
|
|
|
|
|
|
class nsScanner;
|
|
|
|
class nsTokenAllocator;
|
|
|
|
|
2002-12-13 03:28:47 +03:00
|
|
|
/**
 * Three-way "form" classification: well formed, malformed, or not known.
 * The numeric values below are the ones the enumerators receive implicitly
 * from their declaration order; they are only spelled out here.
 * NOTE(review): presumably describes how a container element appeared in
 * the source -- confirm against the code that uses this enum.
 */
enum eContainerInfo {
  eWellFormed  = 0,
  eMalformed   = 1,
  eFormUnknown = 2
};
|
|
|
|
|
2001-08-04 01:15:15 +04:00
|
|
|
/**
 * Drop this macro into the body of every leaf class derived from CToken.
 * It expands to a protected SizeOf() override that returns the size of the
 * class in which the macro appears.
 *
 * Note that the expansion ends with "public:", so any declarations that
 * follow the macro in the class body have public access.
 */
#define CTOKEN_IMPL_SIZEOF                                   \
  protected:                                                 \
    virtual size_t SizeOf() const { return sizeof(*this); }  \
  public:
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Token objects represent sequences of characters as they
|
|
|
|
* are consumed from the input stream (URL). While they're
|
|
|
|
* pretty general in nature, we use subclasses (found in
|
|
|
|
* nsHTMLTokens.h) to define <start>, </end>, <text>,
|
|
|
|
* <comment>, <&entity>, <newline>, and <whitespace> tokens.
|
|
|
|
*
|
|
|
|
* @update gess 3/25/98
|
|
|
|
*/
|
|
|
|
class CToken {
|
|
|
|
public:
|
|
|
|
|
|
|
|
enum eTokenOrigin {eSource,eResidualStyle};
|
|
|
|
|
|
|
|
protected:
|
|
|
|
|
|
|
|
// nsTokenAllocator should be the only class that tries to
|
|
|
|
// allocate tokens from the heap.
|
|
|
|
friend class nsTokenAllocator;
|
|
|
|
|
|
|
|
/**
|
|
|
|
*
|
|
|
|
* @update harishd 08/01/00
|
|
|
|
* @param aSize -
|
|
|
|
* @param aArena - Allocate memory from this pool.
|
|
|
|
*/
|
2002-07-03 00:25:30 +04:00
|
|
|
static void * operator new (size_t aSize,nsFixedSizeAllocator& anArena) CPP_THROW_NEW
|
2001-08-04 01:15:15 +04:00
|
|
|
{
|
|
|
|
return anArena.Alloc(aSize);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Hide operator delete; clients should use Destroy() instead.
|
|
|
|
*/
|
|
|
|
static void operator delete (void*,size_t) {}
|
|
|
|
|
2007-11-07 20:28:22 +03:00
|
|
|
protected:
|
2001-08-04 01:15:15 +04:00
|
|
|
/**
|
|
|
|
* destructor
|
|
|
|
* @update gess5/11/98
|
|
|
|
*/
|
|
|
|
virtual ~CToken();
|
|
|
|
|
2007-11-07 20:28:22 +03:00
|
|
|
private:
|
2001-08-04 01:15:15 +04:00
|
|
|
/**
|
|
|
|
* Destroy a token.
|
|
|
|
*/
|
|
|
|
static void Destroy(CToken* aToken,nsFixedSizeAllocator& aArenaPool)
|
|
|
|
{
|
|
|
|
size_t sz = aToken->SizeOf();
|
|
|
|
aToken->~CToken();
|
|
|
|
aArenaPool.Free(aToken, sz);
|
|
|
|
}
|
|
|
|
|
2007-11-07 20:28:22 +03:00
|
|
|
public:
|
2001-08-04 01:15:15 +04:00
|
|
|
/**
|
|
|
|
* Make a note on number of times you have been referenced
|
|
|
|
* @update harishd 08/02/00
|
|
|
|
*/
|
2007-11-07 20:28:22 +03:00
|
|
|
void AddRef() {
|
|
|
|
++mUseCount;
|
|
|
|
NS_LOG_ADDREF(this, mUseCount, "CToken", sizeof(*this));
|
|
|
|
}
|
2001-08-04 01:15:15 +04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Free yourself if no one is holding you.
|
|
|
|
* @update harishd 08/02/00
|
|
|
|
*/
|
|
|
|
void Release(nsFixedSizeAllocator& aArenaPool) {
|
2007-11-07 20:28:22 +03:00
|
|
|
--mUseCount;
|
|
|
|
NS_LOG_RELEASE(this, mUseCount, "CToken");
|
|
|
|
if (mUseCount==0)
|
2001-08-04 01:15:15 +04:00
|
|
|
Destroy(this, aArenaPool);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Default constructor
|
|
|
|
* @update gess7/21/98
|
|
|
|
*/
|
|
|
|
CToken(PRInt32 aTag=0);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Retrieve string value of the token
|
|
|
|
* @update gess5/11/98
|
|
|
|
* @return reference to string containing string value
|
|
|
|
*/
|
2004-11-11 07:05:51 +03:00
|
|
|
virtual const nsSubstring& GetStringValue(void) = 0;
|
2001-08-04 01:15:15 +04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Get string of full contents, suitable for debug dump.
|
|
|
|
* It should look exactly like the input source.
|
|
|
|
* @update gess5/11/98
|
|
|
|
* @return reference to string containing string value
|
|
|
|
*/
|
2002-12-13 03:28:47 +03:00
|
|
|
virtual void GetSource(nsString& anOutputString);
|
2001-08-04 01:15:15 +04:00
|
|
|
|
|
|
|
/** @update harishd 03/23/00
|
|
|
|
* @return reference to string containing string value
|
|
|
|
*/
|
2002-04-11 02:16:46 +04:00
|
|
|
virtual void AppendSourceTo(nsAString& anOutputString);
|
2001-08-04 01:15:15 +04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Sets the ordinal value of this token (not currently used)
|
|
|
|
* @update gess5/11/98
|
|
|
|
* @param value is the new ord value for this token
|
|
|
|
*/
|
2004-04-23 17:29:02 +04:00
|
|
|
void SetTypeID(PRInt32 aValue) {
|
|
|
|
mTypeID = aValue;
|
|
|
|
}
|
2001-08-04 01:15:15 +04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Getter which retrieves the current ordinal value for this token
|
|
|
|
* @update gess5/11/98
|
|
|
|
* @return current ordinal value
|
|
|
|
*/
|
|
|
|
virtual PRInt32 GetTypeID(void);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Getter which retrieves the current attribute count for this token
|
|
|
|
* @update gess5/11/98
|
|
|
|
* @return current attribute count
|
|
|
|
*/
|
|
|
|
virtual PRInt16 GetAttributeCount(void);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Causes token to consume data from given scanner.
|
|
|
|
* Note that behavior varies wildly between CToken subclasses.
|
|
|
|
* @update gess5/11/98
|
|
|
|
* @param aChar -- most recent char consumed
|
|
|
|
* @param aScanner -- input source where token should get data
|
|
|
|
* @return error code (0 means ok)
|
|
|
|
*/
|
|
|
|
virtual nsresult Consume(PRUnichar aChar,nsScanner& aScanner,PRInt32 aMode);
|
|
|
|
|
2002-12-13 01:38:40 +03:00
|
|
|
/**
|
|
|
|
* Getter which retrieves type of token
|
|
|
|
* @update gess5/11/98
|
|
|
|
* @return int containing token type
|
|
|
|
*/
|
|
|
|
virtual PRInt32 GetTokenType(void);
|
2001-08-04 01:15:15 +04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* For tokens who care, this can tell us whether the token is
|
|
|
|
* well formed or not.
|
|
|
|
*
|
|
|
|
* @update gess 8/30/00
|
|
|
|
* @return PR_FALSE; subclasses MUST override if they care.
|
|
|
|
*/
|
|
|
|
virtual PRBool IsWellFormed(void) const {return PR_FALSE;}
|
|
|
|
|
2002-04-11 02:16:46 +04:00
|
|
|
virtual PRBool IsEmpty(void) { return PR_FALSE; }
|
|
|
|
|
|
|
|
/**
|
|
|
|
* If aValue is TRUE then the token represents a short-hand tag
|
|
|
|
*/
|
|
|
|
virtual void SetEmpty(PRBool aValue) { return ; }
|
|
|
|
|
|
|
|
PRInt32 GetNewlineCount()
|
|
|
|
{
|
|
|
|
return mNewlineCount;
|
|
|
|
}
|
|
|
|
|
|
|
|
void SetNewlineCount(PRInt32 aCount)
|
|
|
|
{
|
|
|
|
mNewlineCount = aCount;
|
|
|
|
}
|
|
|
|
|
|
|
|
PRInt32 GetLineNumber()
|
|
|
|
{
|
|
|
|
return mLineNumber;
|
|
|
|
}
|
|
|
|
|
|
|
|
void SetLineNumber(PRInt32 aLineNumber)
|
|
|
|
{
|
|
|
|
mLineNumber = mLineNumber == 0 ? aLineNumber : mLineNumber;
|
|
|
|
}
|
|
|
|
|
2004-10-17 07:03:46 +04:00
|
|
|
void SetInError(PRBool aInError)
|
|
|
|
{
|
|
|
|
mInError = aInError;
|
|
|
|
}
|
|
|
|
|
|
|
|
PRBool IsInError()
|
|
|
|
{
|
|
|
|
return mInError;
|
|
|
|
}
|
|
|
|
|
2002-12-13 03:28:47 +03:00
|
|
|
void SetAttributeCount(PRInt16 aValue) { mAttrCount = aValue; }
|
|
|
|
|
2001-08-04 01:15:15 +04:00
|
|
|
/**
|
|
|
|
* perform self test.
|
|
|
|
* @update gess5/11/98
|
|
|
|
*/
|
|
|
|
virtual void SelfTest(void);
|
|
|
|
|
|
|
|
static int GetTokenCount();
|
|
|
|
|
2002-04-11 02:16:46 +04:00
|
|
|
|
2001-08-04 01:15:15 +04:00
|
|
|
|
|
|
|
protected:
|
|
|
|
/**
|
|
|
|
* Returns the size of the token object.
|
|
|
|
*/
|
|
|
|
virtual size_t SizeOf() const = 0;
|
|
|
|
|
2002-12-13 03:28:47 +03:00
|
|
|
PRInt32 mTypeID;
|
|
|
|
PRInt32 mUseCount;
|
|
|
|
PRInt32 mNewlineCount;
|
2004-10-17 07:03:46 +04:00
|
|
|
PRUint32 mLineNumber : 31;
|
|
|
|
PRUint32 mInError : 1;
|
2002-12-13 03:28:47 +03:00
|
|
|
PRInt16 mAttrCount;
|
2001-08-04 01:15:15 +04:00
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|