/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
 *
 * The contents of this file are subject to the Netscape Public
 * License Version 1.1 (the "License"); you may not use this file
 * except in compliance with the License. You may obtain a copy of
 * the License at http://www.mozilla.org/NPL/
 *
 * Software distributed under the License is distributed on an "AS
 * IS" basis, WITHOUT WARRANTY OF ANY KIND, either express or
 * implied. See the License for the specific language governing
 * rights and limitations under the License.
 *
 * The Original Code is mozilla.org code.
 *
 * The Initial Developer of the Original Code is Netscape
 * Communications Corporation. Portions created by Netscape are
 * Copyright (C) 1998 Netscape Communications Corporation. All
 * Rights Reserved.
 *
 * Contributor(s):
 *   L. David Baron <dbaron@fas.harvard.edu>
 *   Daniel Glazman <glazman@netscape.com>
 */
#include "nsCSSScanner.h"
#include "nsIInputStream.h"
#include "nsIUnicharInputStream.h"
#include "nsString.h"
#include "nsCRT.h"
#ifdef NS_DEBUG
// Assertion message used by NS_PRECONDITION checks on pointer arguments.
// Declared as pointer-to-const because it refers to a string literal.
static const char* kNullPointer = "null pointer";
#endif
// for #ifdef CSS_REPORT_PARSE_ERRORS
#include "nsCOMPtr.h"
#include "nsIServiceManager.h"
#include "nsReadableUtils.h"
#include "nsIURI.h"
#include "nsIConsoleService.h"
#include "nsIScriptError.h"
#include "nsComponentManagerUtils.h" // put this higher and gcc barfs...
1998-04-14 00:24:54 +04:00
// Don't bother collecting whitespace characters in token's mIdent buffer
#undef COLLECT_WHITESPACE
#define BUFFER_SIZE 256
static const PRUnichar CSS_ESCAPE = PRUnichar('\\');
static const PRUint8 IS_LATIN1 = 0x01;
static const PRUint8 IS_DIGIT = 0x02;
static const PRUint8 IS_HEX_DIGIT = 0x04;
static const PRUint8 IS_ALPHA = 0x08;
static const PRUint8 START_IDENT = 0x10;
static const PRUint8 IS_IDENT = 0x20;
static const PRUint8 IS_WHITESPACE = 0x40;
static PRBool gLexTableSetup = PR_FALSE;
static PRUint8 gLexTable[256];
1998-04-14 00:24:54 +04:00
static void BuildLexTable()
{
gLexTableSetup = PR_TRUE;
1998-04-14 00:24:54 +04:00
PRUint8* lt = gLexTable;
1998-04-14 00:24:54 +04:00
int i;
lt[CSS_ESCAPE] = START_IDENT;
lt['-'] |= IS_IDENT;
// XXX add in other whitespace chars
1999-05-19 03:13:27 +04:00
lt[' '] |= IS_WHITESPACE; // space
lt['\t'] |= IS_WHITESPACE; // horizontal tab
lt['\v'] |= IS_WHITESPACE; // vertical tab
lt['\r'] |= IS_WHITESPACE; // carriage return
lt['\n'] |= IS_WHITESPACE; // line feed
lt['\f'] |= IS_WHITESPACE; // form feed
1998-04-14 00:24:54 +04:00
for (i = 161; i <= 255; i++) {
lt[i] |= IS_LATIN1 | IS_IDENT | START_IDENT;
}
for (i = '0'; i <= '9'; i++) {
lt[i] |= IS_DIGIT | IS_HEX_DIGIT | IS_IDENT;
}
for (i = 'A'; i <= 'Z'; i++) {
if ((i >= 'A') && (i <= 'F')) {
lt[i] |= IS_HEX_DIGIT;
lt[i+32] |= IS_HEX_DIGIT;
}
lt[i] |= IS_ALPHA | IS_IDENT | START_IDENT;
lt[i+32] |= IS_ALPHA | IS_IDENT | START_IDENT;
}
}
// A freshly constructed token is a symbol token.
nsCSSToken::nsCSSToken()
  : mType(eCSSToken_Symbol)
{
}
// Appends a textual rendering of this token to aBuffer.
//
// Number-like tokens print mInteger when mIntegerValid is set and mNumber
// otherwise. Strings are wrapped in the quote character kept in mSymbol.
// An unknown token type triggers NS_ERROR and appends nothing.
void
nsCSSToken::AppendToString(nsString& aBuffer)
{
  switch (mType) {
    case eCSSToken_AtKeyword:
      aBuffer.Append(PRUnichar('@')); // fall through intentional
    case eCSSToken_Ident:
    case eCSSToken_WhiteSpace:
    case eCSSToken_Function:
    case eCSSToken_URL:
    case eCSSToken_InvalidURL:
    case eCSSToken_HTMLComment:
      aBuffer.Append(mIdent);
      break;
    case eCSSToken_Number:
      if (mIntegerValid) {
        aBuffer.AppendInt(mInteger, 10);
      }
      else {
        aBuffer.AppendFloat(mNumber);
      }
      break;
    case eCSSToken_Percentage:
      if (mIntegerValid) {
        aBuffer.AppendInt(mInteger, 10);
      }
      else {
        // The scanner stores a percentage as a fraction (value / 100), so
        // scale it back up to print what the author wrote.
        aBuffer.AppendFloat(mNumber * 100.0f);
      }
      aBuffer.Append(PRUnichar('%'));
      break;
    case eCSSToken_Dimension:
      if (mIntegerValid) {
        aBuffer.AppendInt(mInteger, 10);
      }
      else {
        aBuffer.AppendFloat(mNumber);
      }
      aBuffer.Append(mIdent);
      break;
    case eCSSToken_String:
      aBuffer.Append(mSymbol);
      aBuffer.Append(mIdent); // fall through intentional
    case eCSSToken_Symbol:
      aBuffer.Append(mSymbol);
      break;
    case eCSSToken_ID:
      aBuffer.Append(PRUnichar('#'));
      aBuffer.Append(mIdent);
      break;
    case eCSSToken_Includes:
      aBuffer.Append(PRUnichar('~'));
      aBuffer.Append(PRUnichar('='));
      break;
    case eCSSToken_Dashmatch:
      aBuffer.Append(PRUnichar('|'));
      aBuffer.Append(PRUnichar('='));
      break;
    // The scanner also produces the three substring-match operators, so
    // they must be printable instead of hitting the error case below.
    case eCSSToken_Beginsmatch:
      aBuffer.Append(PRUnichar('^'));
      aBuffer.Append(PRUnichar('='));
      break;
    case eCSSToken_Endsmatch:
      aBuffer.Append(PRUnichar('$'));
      aBuffer.Append(PRUnichar('='));
      break;
    case eCSSToken_Containsmatch:
      aBuffer.Append(PRUnichar('*'));
      aBuffer.Append(PRUnichar('='));
      break;
    default:
      NS_ERROR("invalid token type");
      break;
  }
}
MOZ_DECL_CTOR_COUNTER(nsCSSScanner)

// Creates a scanner with no input attached: allocates the read buffer,
// points the pushback stack at its built-in storage and starts counting
// lines at 1. The shared lexer table is built on first construction.
nsCSSScanner::nsCSSScanner()
{
  MOZ_COUNT_CTOR(nsCSSScanner);
  if (!gLexTableSetup) {
    // XXX need a monitor
    BuildLexTable();
  }
  mInput = nsnull;
  mBuffer = new PRUnichar[BUFFER_SIZE];
  mOffset = 0;
  mCount = 0;
  mPushback = mLocalPushback;
  mPushbackCount = 0;
  mPushbackSize = 4;
  mLineNumber = 1;
  mLastRead = 0;
}
// Releases the input stream, frees the read buffer, and frees the pushback
// stack if it was moved off the built-in storage.
nsCSSScanner::~nsCSSScanner()
{
  MOZ_COUNT_DTOR(nsCSSScanner);
  Close();
  if (nsnull != mBuffer) {
    delete [] mBuffer;
    mBuffer = nsnull;
  }
  // mPushback only owns heap memory once Pushback() has grown it.
  if (mLocalPushback != mPushback) {
    delete [] mPushback;
  }
}
// Attaches aInput as the stream to scan, releasing any stream attached
// earlier. The scanner holds its own reference to aInput.
//
// With CSS_REPORT_PARSE_ERRORS, aURI supplies the file name used in error
// reports ("from DOM" when aURI is null) and the column counter is reset.
void nsCSSScanner::Init(nsIUnicharInputStream* aInput, nsIURI* aURI)
{
  NS_PRECONDITION(nsnull != aInput, kNullPointer);
  Close();
  mInput = aInput;
  NS_IF_ADDREF(aInput);

#ifdef CSS_REPORT_PARSE_ERRORS
  if (aURI) {
    aURI->GetSpec(getter_Copies(mFileName));
  } else {
    mFileName = "from DOM";
  }
  mColNumber = 0;
#endif // CSS_REPORT_PARSE_ERRORS
}
#ifdef CSS_REPORT_PARSE_ERRORS
// Adds aErrorText to the pending error message. The first fragment also
// records the current line and column as the error position; later
// fragments are appended after a single space.
void nsCSSScanner::AddToError(const nsAReadableString& aErrorText)
{
  if (mError.Length()) {
    // A message is already being collected: extend it.
    mError.AppendWithConversion(" ");
    mError.Append(aErrorText);
    return;
  }
  mErrorLineNumber = mLineNumber;
  mErrorColNumber = mColNumber;
  mError = aErrorText;
}
// Discards any pending error message text.
void nsCSSScanner::ClearError()
{
  mError.Truncate();
}
void nsCSSScanner::OutputError()
{
if (!mError.Length()) return;
#ifdef DEBUG
printf("CSS Error (%s :%u.%u): %s\n",
mFileName.get(),
mErrorLineNumber,
mErrorColNumber,
NS_ConvertUCS2toUTF8(mError).get());
#endif
// Log it to the JavaScript console
nsCOMPtr<nsIConsoleService> consoleService
(do_GetService(NS_CONSOLESERVICE_CONTRACTID));
nsCOMPtr<nsIScriptError> errorObject
(do_CreateInstance(NS_SCRIPTERROR_CONTRACTID));
if (consoleService && errorObject) {
nsresult rv;
PRUnichar *error = ToNewUnicode(mError);
rv = errorObject->Init(error,
NS_ConvertASCIItoUCS2(mFileName.get()).get(),
NS_LITERAL_STRING("").get(),
mErrorLineNumber,
mErrorColNumber,
0,
"CSS Parser");
nsMemory::Free(error);
if (NS_SUCCEEDED(rv))
consoleService->LogMessage(errorObject);
}
ClearError();
}
#endif // CSS_REPORT_PARSE_ERRORS
// Returns the scanner's current line counter (starts at 1 and is advanced
// by Read() at line breaks).
PRUint32 nsCSSScanner::GetLineNumber()
{
  return mLineNumber;
}
1998-04-14 00:24:54 +04:00
void nsCSSScanner::Close()
{
NS_IF_RELEASE(mInput);
}
#ifdef CSS_REPORT_PARSE_ERRORS
// Distance between tab stops, used by Read() when it advances the column
// counter past a '\t'.
#define TAB_STOP_WIDTH 8
#endif
1998-04-14 00:24:54 +04:00
// Returns -1 on error or eof
1998-10-27 02:22:40 +03:00
PRInt32 nsCSSScanner::Read(PRInt32& aErrorCode)
1998-04-14 00:24:54 +04:00
{
PRInt32 rv;
1998-09-25 05:50:51 +04:00
if (0 < mPushbackCount) {
rv = PRInt32(mPushback[--mPushbackCount]);
1998-04-14 00:24:54 +04:00
} else {
if (mCount < 0) {
return -1;
}
if (mOffset == mCount) {
mOffset = 0;
aErrorCode = mInput->Read(mBuffer, 0, BUFFER_SIZE, (PRUint32*)&mCount);
if (NS_FAILED(aErrorCode) || mCount == 0) {
1998-07-24 00:35:43 +04:00
mCount = 0;
1998-04-14 00:24:54 +04:00
return -1;
}
}
rv = PRInt32(mBuffer[mOffset++]);
if (((rv == '\n') && (mLastRead != '\r')) || (rv == '\r')) {
mLineNumber++;
#ifdef CSS_REPORT_PARSE_ERRORS
mColNumber = 0;
#endif
}
#ifdef CSS_REPORT_PARSE_ERRORS
else if (rv == '\t') {
mColNumber = ((mColNumber - 1 + TAB_STOP_WIDTH) / TAB_STOP_WIDTH)
* TAB_STOP_WIDTH;
} else if (rv != '\n') {
mColNumber++;
}
#endif
1998-04-14 00:24:54 +04:00
}
mLastRead = rv;
//printf("Read => %x\n", rv);
1998-04-14 00:24:54 +04:00
return rv;
}
1998-10-27 02:22:40 +03:00
PRInt32 nsCSSScanner::Peek(PRInt32& aErrorCode)
1998-04-14 00:24:54 +04:00
{
1998-09-25 05:50:51 +04:00
if (0 == mPushbackCount) {
1998-10-27 02:22:40 +03:00
PRInt32 ch = Read(aErrorCode);
if (ch < 0) {
1998-04-14 00:24:54 +04:00
return -1;
}
1998-10-27 02:22:40 +03:00
mPushback[0] = PRUnichar(ch);
1998-09-25 05:50:51 +04:00
mPushbackCount++;
1998-04-14 00:24:54 +04:00
}
//printf("Peek => %x\n", mLookAhead);
1998-09-25 05:50:51 +04:00
return PRInt32(mPushback[mPushbackCount - 1]);
1998-04-14 00:24:54 +04:00
}
void nsCSSScanner::Unread()
{
1998-09-25 05:50:51 +04:00
NS_PRECONDITION((mLastRead >= 0), "double pushback");
Pushback(PRUnichar(mLastRead));
1998-04-14 00:24:54 +04:00
mLastRead = -1;
}
1998-09-25 05:50:51 +04:00
void nsCSSScanner::Pushback(PRUnichar aChar)
{
if (mPushbackCount == mPushbackSize) { // grow buffer
PRUnichar* newPushback = new PRUnichar[mPushbackSize + 4];
if (nsnull == newPushback) {
return;
}
mPushbackSize += 4;
nsCRT::memcpy(newPushback, mPushback, sizeof(PRUnichar) * mPushbackCount);
if (mPushback != mLocalPushback) {
delete [] mPushback;
}
mPushback = newPushback;
}
mPushback[mPushbackCount++] = aChar;
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::LookAhead(PRInt32& aErrorCode, PRUnichar aChar)
1998-04-14 00:24:54 +04:00
{
PRInt32 ch = Read(aErrorCode);
if (ch < 0) {
return PR_FALSE;
}
if (ch == aChar) {
return PR_TRUE;
}
Unread();
return PR_FALSE;
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::EatWhiteSpace(PRInt32& aErrorCode)
1998-04-14 00:24:54 +04:00
{
PRBool eaten = PR_FALSE;
for (;;) {
PRInt32 ch = Read(aErrorCode);
if (ch < 0) {
break;
}
if ((ch == ' ') || (ch == '\n') || (ch == '\r') || (ch == '\t')) {
eaten = PR_TRUE;
continue;
}
Unread();
break;
}
return eaten;
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::EatNewline(PRInt32& aErrorCode)
1998-04-14 00:24:54 +04:00
{
PRInt32 ch = Read(aErrorCode);
if (ch < 0) {
return PR_FALSE;
}
PRBool eaten = PR_FALSE;
if (ch == '\r') {
eaten = PR_TRUE;
ch = Peek(aErrorCode);
if (ch == '\n') {
(void) Read(aErrorCode);
}
} else if (ch == '\n') {
eaten = PR_TRUE;
} else {
Unread();
}
return eaten;
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::Next(PRInt32& aErrorCode, nsCSSToken& aToken)
1998-04-14 00:24:54 +04:00
{
PRInt32 ch = Read(aErrorCode);
if (ch < 0) {
return PR_FALSE;
}
if (ch < 256) {
PRUint8* lexTable = gLexTable;
// IDENT
if ((lexTable[ch] & START_IDENT) != 0) {
return ParseIdent(aErrorCode, ch, aToken);
}
if (ch == '-') { // possible ident
PRInt32 nextChar = Peek(aErrorCode);
if ((0 <= nextChar) && (0 != (lexTable[nextChar] & START_IDENT))) {
return ParseIdent(aErrorCode, ch, aToken);
}
}
1998-04-14 00:24:54 +04:00
// AT_KEYWORD
if (ch == '@') {
PRInt32 nextChar = Peek(aErrorCode);
if ((nextChar >= 0) && (nextChar <= 255)) {
if ((lexTable[nextChar] & START_IDENT) != 0) {
return ParseAtKeyword(aErrorCode, ch, aToken);
}
}
}
// NUMBER or DIM
if ((ch == '.') || (ch == '+') || (ch == '-')) {
PRInt32 nextChar = Peek(aErrorCode);
if ((nextChar >= 0) && (nextChar <= 255)) {
if ((lexTable[nextChar] & IS_DIGIT) != 0) {
1998-04-14 00:24:54 +04:00
return ParseNumber(aErrorCode, ch, aToken);
}
else if (('.' == nextChar) && ('.' != ch)) {
PRInt32 holdNext = Read(aErrorCode);
nextChar = Peek(aErrorCode);
if ((0 <= nextChar) && (nextChar <= 255)) {
if ((lexTable[nextChar] & IS_DIGIT) != 0) {
Pushback(holdNext);
return ParseNumber(aErrorCode, ch, aToken);
}
}
Pushback(holdNext);
}
1998-04-14 00:24:54 +04:00
}
}
if ((lexTable[ch] & IS_DIGIT) != 0) {
return ParseNumber(aErrorCode, ch, aToken);
}
// ID
if (ch == '#') {
return ParseID(aErrorCode, ch, aToken);
}
// STRING
if ((ch == '"') || (ch == '\'')) {
return ParseString(aErrorCode, ch, aToken);
}
// WS
if ((lexTable[ch] & IS_WHITESPACE) != 0) {
1998-10-27 02:22:40 +03:00
aToken.mType = eCSSToken_WhiteSpace;
aToken.mIdent.SetLength(0);
aToken.mIdent.Append(PRUnichar(ch));
1998-04-14 00:24:54 +04:00
(void) EatWhiteSpace(aErrorCode);
return PR_TRUE;
}
if (ch == '/') {
PRInt32 nextChar = Peek(aErrorCode);
if (nextChar == '*') {
1998-04-14 00:24:54 +04:00
(void) Read(aErrorCode);
1998-10-27 02:22:40 +03:00
aToken.mIdent.SetLength(0);
aToken.mIdent.Append(PRUnichar(ch));
aToken.mIdent.Append(PRUnichar(nextChar));
1998-04-14 00:24:54 +04:00
return ParseCComment(aErrorCode, aToken);
}
}
if (ch == '<') { // consume HTML comment tags
if (LookAhead(aErrorCode, '!')) {
if (LookAhead(aErrorCode, '-')) {
if (LookAhead(aErrorCode, '-')) {
aToken.mType = eCSSToken_HTMLComment;
aToken.mIdent.SetLength(0);
aToken.mIdent.Append(PRUnichar('<'));
aToken.mIdent.Append(PRUnichar('!'));
aToken.mIdent.Append(PRUnichar('-'));
aToken.mIdent.Append(PRUnichar('-'));
return PR_TRUE;
}
Pushback('-');
1998-09-25 05:50:51 +04:00
}
Pushback('!');
1998-09-25 05:50:51 +04:00
}
}
if (ch == '-') { // check for HTML comment end
if (LookAhead(aErrorCode, '-')) {
if (LookAhead(aErrorCode, '>')) {
aToken.mType = eCSSToken_HTMLComment;
1998-10-27 02:22:40 +03:00
aToken.mIdent.SetLength(0);
aToken.mIdent.AppendWithConversion('-');
aToken.mIdent.AppendWithConversion('-');
2000-04-16 00:15:37 +04:00
aToken.mIdent.AppendWithConversion('>');
1998-09-25 05:50:51 +04:00
return PR_TRUE;
}
Pushback('-');
}
}
// INCLUDES ("~=") and DASHMATCH ("|=")
if (( ch == '|' ) || ( ch == '~' ) || ( ch == '^' ) ||
( ch == '$' ) || ( ch == '*' )) {
PRInt32 nextChar = Read(aErrorCode);
if ( nextChar == '=' ) {
if (ch == '~') {
aToken.mType = eCSSToken_Includes;
}
else if (ch == '|') {
aToken.mType = eCSSToken_Dashmatch;
}
else if (ch == '^') {
aToken.mType = eCSSToken_Beginsmatch;
}
else if (ch == '$') {
aToken.mType = eCSSToken_Endsmatch;
}
else if (ch == '*') {
aToken.mType = eCSSToken_Containsmatch;
}
return PR_TRUE;
} else {
Pushback(nextChar);
1998-09-25 05:50:51 +04:00
}
}
} else {
return ParseIdent(aErrorCode, ch, aToken);
1998-04-14 00:24:54 +04:00
}
1998-10-27 02:22:40 +03:00
aToken.mType = eCSSToken_Symbol;
aToken.mSymbol = ch;
return PR_TRUE;
}
// Scans the next token where the argument of url( ) is expected.
//
// A quoted string, whitespace or a comment is returned as such. Anything
// else is gathered as an unquoted URL up to, but not including, the
// closing ')': the result is a URL token, or an InvalidURL token when the
// text is empty or malformed. Returns PR_FALSE on error or eof.
//
// NOTE(review): when the first character is above 255 this returns PR_TRUE
// without storing anything in aToken; confirm whether callers rely on it.
PRBool nsCSSScanner::NextURL(PRInt32& aErrorCode, nsCSSToken& aToken)
{
  PRInt32 ch = Read(aErrorCode);
  if (ch < 0) {
    return PR_FALSE;
  }
  if (ch < 256) {
    PRUint8* lexTable = gLexTable;

    // STRING
    if ((ch == '"') || (ch == '\'')) {
      return ParseString(aErrorCode, ch, aToken);
    }

    // WS
    if ((lexTable[ch] & IS_WHITESPACE) != 0) {
      aToken.mType = eCSSToken_WhiteSpace;
      aToken.mIdent.SetLength(0);
      aToken.mIdent.Append(PRUnichar(ch));
      (void) EatWhiteSpace(aErrorCode);
      return PR_TRUE;
    }
    if (ch == '/') {
      PRInt32 nextChar = Peek(aErrorCode);
      if (nextChar == '*') {
        (void) Read(aErrorCode);
        aToken.mIdent.SetLength(0);
        aToken.mIdent.Append(PRUnichar(ch));
        aToken.mIdent.Append(PRUnichar(nextChar));
        return ParseCComment(aErrorCode, aToken);
      }
    }

    // Process a url lexical token. A CSS1 url token can contain
    // characters beyond identifier characters (e.g. '/', ':', etc.)
    // Because of this the normal rules for tokenizing the input don't
    // apply very well. To simplify the parser and relax some of the
    // requirements on the scanner we parse url's here. If we find a
    // malformed URL then we emit a token of type "InvalidURL" so that
    // the CSS1 parser can ignore the invalid input. We attempt to eat
    // the right amount of input data when an invalid URL is presented.
    aToken.mType = eCSSToken_InvalidURL;
    nsString& ident = aToken.mIdent;
    ident.SetLength(0);

    if (ch == ')') {
      Pushback(ch);
      // empty url spec: this is invalid
    } else {
      // start of a non-quoted url
      Pushback(ch);
      PRBool ok = PR_TRUE;
      for (;;) {
        ch = Read(aErrorCode);
        if (ch < 0) break;
        if (ch == CSS_ESCAPE) {
          ch = ParseEscape(aErrorCode);
          if (0 < ch) {
            ident.Append(PRUnichar(ch));
          }
        } else if ((ch == '"') || (ch == '\'') || (ch == '(')) {
          // This is an invalid URL spec
          ok = PR_FALSE;
        } else if ((ch < 256) && ((gLexTable[ch] & IS_WHITESPACE) != 0)) {
          // (ch < 256, not <= 256: the table has exactly 256 entries.)
          // Whitespace is allowed at the end of the URL
          (void) EatWhiteSpace(aErrorCode);
          if (LookAhead(aErrorCode, ')')) {
            Pushback(')');  // leave the closing symbol
            // done!
            break;
          }
          // Whitespace is followed by something other than a
          // ")". This is an invalid url spec.
          ok = PR_FALSE;
        } else if (ch == ')') {
          Unread();
          // All done
          break;
        } else {
          // A regular url character.
          ident.Append(PRUnichar(ch));
        }
      }

      // If the result of the above scanning is ok then change the token
      // type to a useful one.
      if (ok) {
        aToken.mType = eCSSToken_URL;
      }
    }
  }
  return PR_TRUE;
}
1998-10-27 02:22:40 +03:00
PRInt32 nsCSSScanner::ParseEscape(PRInt32& aErrorCode)
1998-04-14 00:24:54 +04:00
{
PRUint8* lexTable = gLexTable;
PRInt32 ch = Peek(aErrorCode);
if (ch < 0) {
return CSS_ESCAPE;
}
if ((ch <= 255) && ((lexTable[ch] & IS_HEX_DIGIT) != 0)) {
PRInt32 rv = 0;
int i;
for (i = 0; i < 6; i++) { // up to six digits
1998-04-14 00:24:54 +04:00
ch = Read(aErrorCode);
if (ch < 0) {
// Whoops: error or premature eof
break;
}
if ((lexTable[ch] & IS_HEX_DIGIT) != 0) {
if ((lexTable[ch] & IS_DIGIT) != 0) {
rv = rv * 16 + (ch - '0');
} else {
// Note: c&7 just keeps the low three bits which causes
// upper and lower case alphabetics to both yield their
// "relative to 10" value for computing the hex value.
1999-05-19 03:13:27 +04:00
rv = rv * 16 + ((ch & 0x7) + 9);
1998-04-14 00:24:54 +04:00
}
1999-05-19 03:13:27 +04:00
}
else if ((lexTable[ch] & IS_WHITESPACE) != 0) { // single space ends escape
1999-05-27 03:53:39 +04:00
if (ch == '\r') { // if CR/LF, eat LF too
ch = Peek(aErrorCode);
if (ch == '\n') {
ch = Read(aErrorCode);
}
}
1999-05-19 03:13:27 +04:00
break;
}
else {
1998-04-14 00:24:54 +04:00
Unread();
break;
}
}
1999-05-19 03:13:27 +04:00
if (6 == i) { // look for trailing whitespace and eat it
ch = Peek(aErrorCode);
if ((0 <= ch) && (ch <= 255) &&
((lexTable[ch] & IS_WHITESPACE) != 0)) {
ch = Read(aErrorCode);
// special case: if trailing whitespace is CR/LF, eat both chars (not part of spec, but should be)
if (ch == '\r') {
ch = Peek(aErrorCode);
if (ch == '\n') {
ch = Read(aErrorCode);
}
}
1999-05-19 03:13:27 +04:00
}
}
1998-04-14 00:24:54 +04:00
return rv;
} else {
// "Any character except a hexidecimal digit can be escaped to
// remove its special meaning by putting a backslash in front"
// -- CSS1 spec section 7.1
if (EatNewline(aErrorCode)) { // skip escaped newline
ch = 0;
}
else {
(void) Read(aErrorCode);
}
1998-04-14 00:24:54 +04:00
return ch;
}
}
/**
* Gather up the characters in an identifier. The identfier was
* started by "aChar" which will be appended to aIdent. The result
* will be aIdent with all of the identifier characters appended
* until the first non-identifier character is seen. The termination
* character is unread for the future re-reading.
*/
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::GatherIdent(PRInt32& aErrorCode, PRInt32 aChar,
1998-04-14 00:24:54 +04:00
nsString& aIdent)
{
if (aChar == CSS_ESCAPE) {
aChar = ParseEscape(aErrorCode);
}
1999-05-19 03:13:27 +04:00
if (0 < aChar) {
aIdent.Append(PRUnichar(aChar));
}
1998-04-14 00:24:54 +04:00
for (;;) {
aChar = Read(aErrorCode);
if (aChar < 0) break;
if (aChar == CSS_ESCAPE) {
aChar = ParseEscape(aErrorCode);
if (0 < aChar) {
aIdent.Append(PRUnichar(aChar));
}
} else if ((aChar > 255) || ((gLexTable[aChar] & IS_IDENT) != 0)) {
1998-04-14 00:24:54 +04:00
aIdent.Append(PRUnichar(aChar));
} else {
Unread();
break;
}
}
return PR_TRUE;
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::ParseID(PRInt32& aErrorCode,
1998-04-14 00:24:54 +04:00
PRInt32 aChar,
1998-10-27 02:22:40 +03:00
nsCSSToken& aToken)
1998-04-14 00:24:54 +04:00
{
1998-10-27 02:22:40 +03:00
aToken.mIdent.SetLength(0);
aToken.mType = eCSSToken_ID;
1999-05-19 03:13:27 +04:00
return GatherIdent(aErrorCode, 0, aToken.mIdent);
1998-04-14 00:24:54 +04:00
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::ParseIdent(PRInt32& aErrorCode,
1998-04-14 00:24:54 +04:00
PRInt32 aChar,
1998-10-27 02:22:40 +03:00
nsCSSToken& aToken)
1998-04-14 00:24:54 +04:00
{
1998-10-27 02:22:40 +03:00
nsString& ident = aToken.mIdent;
1998-04-14 00:24:54 +04:00
ident.SetLength(0);
if (!GatherIdent(aErrorCode, aChar, ident)) {
return PR_FALSE;
}
nsCSSTokenType tokenType = eCSSToken_Ident;
1998-10-27 02:22:40 +03:00
// look for functions (ie: "ident(")
if (PRUnichar('(') == PRUnichar(Peek(aErrorCode))) { // this is a function definition
tokenType = eCSSToken_Function;
1998-04-14 00:24:54 +04:00
}
1998-10-27 02:22:40 +03:00
aToken.mType = tokenType;
1998-04-14 00:24:54 +04:00
return PR_TRUE;
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::ParseAtKeyword(PRInt32& aErrorCode, PRInt32 aChar,
nsCSSToken& aToken)
1998-04-14 00:24:54 +04:00
{
1998-10-27 02:22:40 +03:00
aToken.mIdent.SetLength(0);
aToken.mType = eCSSToken_AtKeyword;
1999-05-19 03:13:27 +04:00
return GatherIdent(aErrorCode, 0, aToken.mIdent);
1998-04-14 00:24:54 +04:00
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::ParseNumber(PRInt32& aErrorCode, PRInt32 c,
nsCSSToken& aToken)
1998-04-14 00:24:54 +04:00
{
1998-10-27 02:22:40 +03:00
nsString& ident = aToken.mIdent;
1998-04-14 00:24:54 +04:00
ident.SetLength(0);
PRBool gotDot = (c == '.') ? PR_TRUE : PR_FALSE;
if (c != '+') {
ident.Append(PRUnichar(c));
}
// Gather up characters that make up the number
PRUint8* lexTable = gLexTable;
for (;;) {
c = Read(aErrorCode);
if (c < 0) break;
if (!gotDot && (c == '.')) {
gotDot = PR_TRUE;
} else if ((c > 255) || ((lexTable[c] & IS_DIGIT) == 0)) {
break;
}
ident.Append(PRUnichar(c));
}
// Convert number to floating point
nsCSSTokenType type = eCSSToken_Number;
PRInt32 ec;
float value = ident.ToFloat(&ec);
// Look at character that terminated the number
1998-10-27 02:22:40 +03:00
aToken.mIntegerValid = PR_FALSE;
1998-04-14 00:24:54 +04:00
if (c >= 0) {
if ((c <= 255) && ((lexTable[c] & START_IDENT) != 0)) {
ident.SetLength(0);
if (!GatherIdent(aErrorCode, c, ident)) {
return PR_FALSE;
}
type = eCSSToken_Dimension;
} else if ('%' == c) {
type = eCSSToken_Percentage;
value = value / 100.0f;
ident.SetLength(0);
1998-04-14 00:24:54 +04:00
} else {
// Put back character that stopped numeric scan
Unread();
if (!gotDot) {
1998-10-27 02:22:40 +03:00
aToken.mInteger = ident.ToInteger(&ec);
aToken.mIntegerValid = PR_TRUE;
1998-04-14 00:24:54 +04:00
}
ident.SetLength(0);
}
}
else { // stream ended
if (!gotDot) {
aToken.mInteger = ident.ToInteger(&ec);
aToken.mIntegerValid = PR_TRUE;
}
ident.SetLength(0);
}
1998-10-27 02:22:40 +03:00
aToken.mNumber = value;
aToken.mType = type;
1998-04-14 00:24:54 +04:00
return PR_TRUE;
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::ParseCComment(PRInt32& aErrorCode, nsCSSToken& aToken)
1998-04-14 00:24:54 +04:00
{
1998-10-27 02:22:40 +03:00
nsString& ident = aToken.mIdent;
1998-04-14 00:24:54 +04:00
for (;;) {
PRInt32 ch = Read(aErrorCode);
if (ch < 0) break;
if (ch == '*') {
if (LookAhead(aErrorCode, '/')) {
2000-04-16 00:15:37 +04:00
ident.Append(PRUnichar(ch)); // STRING USE WARNING: technically, this should be |AppendWithConversion|
ident.AppendWithConversion('/');
1998-04-14 00:24:54 +04:00
break;
}
}
#ifdef COLLECT_WHITESPACE
ident.Append(PRUnichar(ch));
#endif
}
1998-10-27 02:22:40 +03:00
aToken.mType = eCSSToken_WhiteSpace;
1998-04-14 00:24:54 +04:00
return PR_TRUE;
}
#if 0
// Disabled: consumes input up to and including the next line break (or
// eof) and returns it as a whitespace token.
PRBool nsCSSScanner::ParseEOLComment(PRInt32& aErrorCode, nsCSSToken& aToken)
{
  nsString& ident = aToken.mIdent;
  ident.SetLength(0);
  for (;;) {
    if (EatNewline(aErrorCode)) {
      break;
    }
    PRInt32 ch = Read(aErrorCode);
    if (ch < 0) {
      break;
    }
#ifdef COLLECT_WHITESPACE
    ident.Append(PRUnichar(ch));
#endif
  }
  aToken.mType = eCSSToken_WhiteSpace;
  return PR_TRUE;
}
#endif // 0
1998-04-14 00:24:54 +04:00
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::GatherString(PRInt32& aErrorCode, PRInt32 aStop,
1998-04-14 00:24:54 +04:00
nsString& aBuffer)
{
for (;;) {
if (EatNewline(aErrorCode)) {
break;
}
1998-04-14 00:24:54 +04:00
PRInt32 ch = Read(aErrorCode);
if (ch < 0) {
return PR_FALSE;
}
if (ch == aStop) {
break;
}
if (ch == CSS_ESCAPE) {
ch = ParseEscape(aErrorCode);
if (ch < 0) {
return PR_FALSE;
}
}
if (0 < ch) {
aBuffer.Append(PRUnichar(ch));
}
1998-04-14 00:24:54 +04:00
}
return PR_TRUE;
}
1998-10-27 02:22:40 +03:00
PRBool nsCSSScanner::ParseString(PRInt32& aErrorCode, PRInt32 aStop,
nsCSSToken& aToken)
1998-04-14 00:24:54 +04:00
{
1998-10-27 02:22:40 +03:00
aToken.mIdent.SetLength(0);
aToken.mType = eCSSToken_String;
aToken.mSymbol = PRUnichar(aStop); // remember how it's quoted
return GatherString(aErrorCode, aStop, aToken.mIdent);
1998-04-14 00:24:54 +04:00
}