gecko-dev/layout/generic/nsTextTransformer.cpp

/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
 *
 * The contents of this file are subject to the Netscape Public License
 * Version 1.0 (the "License"); you may not use this file except in
 * compliance with the License.  You may obtain a copy of the License at
 * http://www.mozilla.org/NPL/
 *
 * Software distributed under the License is distributed on an "AS IS"
 * basis, WITHOUT WARRANTY OF ANY KIND, either express or implied.  See
 * the License for the specific language governing rights and limitations
 * under the License.
 *
 * The Original Code is Mozilla Communicator client code.
 *
 * The Initial Developer of the Original Code is Netscape Communications
 * Corporation.  Portions created by Netscape are Copyright (C) 1998
 * Netscape Communications Corporation.  All Rights Reserved.
 */
#include "nsTextTransformer.h"
#include "nsIContent.h"
#include "nsIFrame.h"
#include "nsIStyleContext.h"
#include "nsITextContent.h"
#include "nsStyleConsts.h"
#include "nsILineBreaker.h"


#include "nsIServiceManager.h"
#include "nsUnicharUtilCIID.h"
#include "nsICaseConversion.h"

// Class ID and interface ID handed to nsServiceManager::GetService() in
// Init() to look up the Unicode case-conversion service.
static NS_DEFINE_IID(kUnicharUtilCID, NS_UNICHARUTIL_CID);
static NS_DEFINE_IID(kICaseConversionIID, NS_ICASECONVERSION_IID);
// Case-conversion service shared by every transformer in this file. It is
// fetched by Init() the first time a frame with a text-transform other than
// NS_STYLE_TEXT_TRANSFORM_NONE is seen, and is used by GetNextWord() and
// GetPrevWord() for ToTitle/ToLower/ToUpper.
static nsICaseConversion* gCaseConv =  nsnull;

// XXX put a copy in nsHTMLIIDs
// Interface ID used by Init() to query the frame's content for its text.
static NS_DEFINE_IID(kITextContentIID, NS_ITEXT_CONTENT_IID);

// XXX I'm sure there are other special characters
// Non-breaking space. The word scanners do not treat it as whitespace but
// store it in the output buffer as a plain ' '.
#define CH_NBSP 160

// Any character with a value above this sets mHasMultibyte.
#define MAX_UNIBYTE 127

// Construct a transformer that initially writes its output into the
// caller-supplied buffer.
//
//   aBuffer      - storage provided by the caller; it is never freed by
//                  this class (see the destructor). May be null.
//   aBufLen      - number of PRUnichars available in aBuffer. A negative
//                  value, or any value paired with a null aBuffer, is
//                  treated as zero so that the first GrowBuffer() call
//                  allocates fresh storage instead of copying from (or
//                  writing through) a null pointer.
//   aLineBreaker - line breaker used by GetNextWord() for 2-byte text; a
//                  reference is held for the lifetime of this object.
//                  May be null.
nsTextTransformer::nsTextTransformer(PRUnichar* aBuffer, PRInt32 aBufLen, 
                                     nsILineBreaker* aLineBreaker)
  : mAutoBuffer(aBuffer),
    mBuffer(aBuffer),
    mBufferLength(((nsnull == aBuffer) || (aBufLen < 0)) ? 0 : aBufLen),
    mHasMultibyte(PR_FALSE),
    mLineBreaker(aLineBreaker)
{
  NS_IF_ADDREF(mLineBreaker);
}

// Free the output buffer if it was replaced by GrowBuffer(), and drop the
// reference taken on the line breaker in the constructor.
nsTextTransformer::~nsTextTransformer()
{
  // The caller-supplied buffer (mAutoBuffer) is not ours to free; only a
  // buffer that differs from it was allocated by this class.
  PRBool usingCallerBuffer = (mAutoBuffer == mBuffer);
  if (!usingCallerBuffer) {
    delete [] mBuffer;
  }

  NS_IF_RELEASE(mLineBreaker);
}

// Prepare the transformer to scan the text content of aFrame, starting at
// content offset aStartingOffset.
//
// Returns NS_ERROR_OUT_OF_MEMORY if a minimal output buffer cannot be
// allocated, NS_OK otherwise. When the frame has no content, or its content
// does not implement nsITextContent, NS_OK is still returned but the
// transformer is left describing empty content, so GetNextWord() and
// GetPrevWord() immediately report exhaustion.
nsresult
nsTextTransformer::Init(/*nsTextRun& aTextRun, XXX*/
                        nsIFrame* aFrame,
                        PRInt32 aStartingOffset)
{
  // Make sure we have *some* space in case arguments to the ctor were
  // bizarre.
  if (mBufferLength < 100) {
    if (!GrowBuffer()) {
      return NS_ERROR_OUT_OF_MEMORY;
    }
  }

  // Start from a self-consistent "no text" state so that the early
  // returns below never leave the scanning members uninitialized.
  mFrags = nsnull;
  mNumFrags = 0;
  mCurrentFrag = nsnull;
  mCurrentFragOffset = 0;
  mContentLength = 0;
  mStartingOffset = 0;
  mOffset = 0;

  // Get the frames text content
  nsIContent* content = nsnull;
  aFrame->GetContent(&content);
  if (nsnull == content) {
    // Nothing to scan; treated the same as non-text content.
    return NS_OK;
  }
  nsITextContent* tc = nsnull;
  if (NS_OK != content->QueryInterface(kITextContentIID, (void**) &tc)) {
    NS_RELEASE(content);
    return NS_OK;
  }
  tc->GetText(mFrags, mNumFrags);
  NS_RELEASE(tc);
  NS_RELEASE(content);
  mStartingOffset = aStartingOffset;
  mOffset = mStartingOffset;

  // Compute the total length of the text content.
  PRInt32 sum = 0;
  PRInt32 n = mNumFrags;
  const nsTextFragment* frag = mFrags;
  for (; --n >= 0; frag++) {
    sum += frag->GetLength();
  }
  mContentLength = sum;

  // Set current fragment and current fragment offset: find the fragment
  // that contains aStartingOffset and the offset within that fragment.
  mCurrentFrag = mFrags;
  mCurrentFragOffset = 0;
  PRInt32 offset = 0;
  n = mNumFrags;
  for (frag = mFrags; --n >= 0; frag++) {
    if (aStartingOffset < offset + frag->GetLength()) {
      mCurrentFrag = frag;
      mCurrentFragOffset = aStartingOffset - offset;
      break;
    }
    offset += frag->GetLength();
  }
  // A starting offset at the very end of the content is not inside any
  // fragment; position just past the last character of the last fragment
  // so that GetPrevWord() can scan backward from there.
  if (mNumFrags && aStartingOffset == mContentLength){
    mCurrentFrag = mFrags + (mNumFrags -1);
    mCurrentFragOffset = mCurrentFrag->GetLength();
  }

  // Get the frames style and choose a transform proc
  const nsStyleText* styleText;
  aFrame->GetStyleData(eStyleStruct_Text, (const nsStyleStruct*&) styleText);
  mWhiteSpace = styleText->mWhiteSpace;
  mTextTransform = styleText->mTextTransform;

  if (NS_STYLE_TEXT_TRANSFORM_NONE != mTextTransform) {
    if (nsnull == gCaseConv) {
      nsresult res;
      res = nsServiceManager::GetService(kUnicharUtilCID, kICaseConversionIID,
                                         (nsISupports**)&gCaseConv);
      NS_ASSERTION( NS_SUCCEEDED(res), "cannot get UnicharUtil");
      NS_ASSERTION( gCaseConv != NULL, "cannot get UnicharUtil");
      if (NS_FAILED(res)) {
        gCaseConv = nsnull;
      }
    }
    if (nsnull == gCaseConv) {
      // The word scanners call through gCaseConv unconditionally whenever
      // a transform is selected; without the service, fall back to no
      // transform rather than dereferencing a null pointer later.
      mTextTransform = NS_STYLE_TEXT_TRANSFORM_NONE;
    }
  }
  return NS_OK;
}

// Replace the output buffer with one twice as large (but at least 100
// characters), preserving the current contents. Returns PR_FALSE and leaves
// the existing buffer untouched when the allocation yields null; returns
// PR_TRUE otherwise.
PRBool
nsTextTransformer::GrowBuffer()
{
  PRInt32 doubled = mBufferLength * 2;
  PRInt32 grownLength = (doubled <= 100) ? 100 : doubled;

  PRUnichar* grown = new PRUnichar[grownLength];
  if (nsnull != grown) {
    if (mBufferLength != 0) {
      // Carry the existing characters over, then release the old storage
      // unless it is the caller-supplied buffer.
      nsCRT::memcpy(grown, mBuffer, sizeof(PRUnichar) * mBufferLength);
      if (mAutoBuffer != mBuffer) {
        delete [] mBuffer;
      }
    }
    mBuffer = grown;
    mBufferLength = grownLength;
    return PR_TRUE;
  }
  return PR_FALSE;
}

// Scan forward from the current position and return the next "word": either
// a run of whitespace or a run of non-whitespace characters.
//
//   aInWord             - its negation is passed as the last argument of
//                         gCaseConv->ToTitle() when the capitalize
//                         transform is active; not used otherwise.
//   aWordLenResult      - receives the number of characters of the word
//                         (0 for a newline under NS_STYLE_WHITESPACE_PRE).
//   aContentLenResult   - receives the number of content characters
//                         consumed; mOffset advances by this amount.
//   aIsWhitespaceResult - receives whether the first character was
//                         whitespace. NOT written when nsnull is returned.
//
// Returns mBuffer, or nsnull (with both lengths set to 0) when the content
// is exhausted.
//
// Whitespace runs are collapsed: only the first character (normalized to
// ' ', except tab/newline under PRE) is stored in the buffer. Under PRE each
// whitespace character is returned on its own. Non-breaking spaces are
// stored as ' '. For 2-byte fragments the end of a non-whitespace word is
// decided by mLineBreaker; for 1-byte fragments it is the next whitespace
// character.
PRUnichar*
nsTextTransformer::GetNextWord(PRBool aInWord,
                               PRInt32& aWordLenResult,
                               PRInt32& aContentLenResult,
                               PRBool& aIsWhitespaceResult)
{
  NS_PRECONDITION(mOffset <= mContentLength, "bad offset");

  // See if the content has been exhausted
  if (mOffset == mContentLength) {
    aWordLenResult = 0;
    aContentLenResult = 0;
    return nsnull;
  }

  PRUnichar* bp = mBuffer;
  PRUnichar* bufEnd = mBuffer + mBufferLength;
  const nsTextFragment* frag = mCurrentFrag;
  const nsTextFragment* lastFrag = mFrags + mNumFrags;
  PRInt32 wordLen = 1;
  PRInt32 contentLen = 1;

  // Set the isWhitespace flag by examining the next character in the
  // text fragment.
  PRInt32 offset = mCurrentFragOffset;
  PRUnichar firstChar;
  if (frag->Is2b()) {
    const PRUnichar* up = frag->Get2b();
    firstChar = up[offset];
  }
  else {
    const unsigned char* cp = (const unsigned char*) frag->Get1b();
    firstChar = PRUnichar(cp[offset]);
  }
  PRBool isWhitespace = XP_IS_SPACE(firstChar);
  offset++;
  if (isWhitespace) {
    if (NS_STYLE_WHITESPACE_PRE == mWhiteSpace) {
      if ('\t' == firstChar) {
        // Leave tab alone so that caller can expand it
      }
      else if ('\n' == firstChar) {
        // Advance content past newline but do not allow newline to
        // remain in the word.
        wordLen--;
      }
      else {
        firstChar = ' ';
      }
    }
    else {
      firstChar = ' ';
    }
  }
  else if (CH_NBSP == firstChar) {
    firstChar = ' ';
  }
  if (firstChar > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;
  *bp++ = firstChar;
  if (offset == frag->GetLength()) {
    // The first character was the last one of its fragment.
    mCurrentFrag = ++frag;
    offset = 0;
  }
  mCurrentFragOffset = offset;
  if (isWhitespace && (NS_STYLE_WHITESPACE_PRE == mWhiteSpace)) {
    // Preformatted whitespace is returned one character at a time and is
    // never case-transformed.
    goto really_done;
  }

  PRInt32 numChars;
  while (frag < lastFrag) {
    PRInt32 fragLen = frag->GetLength();

    // Scan characters in this fragment that are the same kind as the
    // isWhitespace flag indicates.
    if (frag->Is2b()) {
      const PRUnichar* cp0 = frag->Get2b();
      const PRUnichar* end = cp0 + fragLen;
      const PRUnichar* cp = cp0 + offset;
      if (isWhitespace) {
        while (cp < end) {
          PRUnichar ch = *cp;
          if (XP_IS_SPACE(ch)) {
            cp++;
            continue;
          }
          numChars = (cp - offset) - cp0;
          contentLen += numChars;
          mCurrentFragOffset += numChars;
          goto done;
        }
        numChars = (cp - offset) - cp0;
        contentLen += numChars;
      }
      else {
        if (wordLen > 0) {
          // The constructor accepts a null line breaker. Without one there
          // is no way to find the next break position, so end the word
          // here instead of dereferencing a null pointer.
          if (nsnull == mLineBreaker) {
            goto done;
          }

          nsresult res = NS_OK;
          PRBool breakBetween = PR_FALSE;
          res = mLineBreaker->BreakInBetween(mBuffer, wordLen,
                                             cp, (fragLen-offset),
                                             &breakBetween);
          if (breakBetween) {
            goto done;
          }

          PRBool tryNextFrag = PR_FALSE;
          PRUint32 next;

          // Find next position
          res = mLineBreaker->Next(cp0, fragLen, offset, &next, &tryNextFrag);
          if (NS_FAILED(res)) {
            // "next" was not produced; using it would copy an arbitrary
            // number of characters.
            goto done;
          }

          numChars = (next - offset);
          // Check buffer size before copy. GrowBuffer() only doubles the
          // buffer, so keep growing until the whole run fits.
          while (numChars > (bufEnd - bp)) {
            PRInt32 delta = bp - mBuffer;
            if (!GrowBuffer()) {
              goto done;
            }
            bp = mBuffer + delta;
            bufEnd = mBuffer + mBufferLength;
          }

          wordLen += numChars;
          mCurrentFragOffset += numChars;
          contentLen += numChars;
          end = cp + numChars;

          // 1. convert nbsp into space
          // 2. check mHasMultibyte flag
          // 3. copy buffer

          while (cp < end) {
            PRUnichar ch = *cp++;
            if (CH_NBSP == ch) ch = ' ';
            if (ch > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;
            *bp++ = ch;
          }
          if (!tryNextFrag) {
            // can decide break position inside this TextFrag
            goto done;
          }
        }
      }
    }
    else {
      const unsigned char* cp0 = (const unsigned char*) frag->Get1b();
      const unsigned char* end = cp0 + fragLen;
      const unsigned char* cp = cp0 + offset;
      if (isWhitespace) {
        while (cp < end) {
          PRUnichar ch = PRUnichar(*cp);
          if (XP_IS_SPACE(ch)) {
            cp++;
            continue;
          }
          numChars = (cp - offset) - cp0;
          contentLen += numChars;
          mCurrentFragOffset += numChars;
          goto done;
        }
        numChars = (cp - offset) - cp0;
        contentLen += numChars;
      }
      else {
        while (cp < end) {
          PRUnichar ch = PRUnichar(*cp);
          if (!XP_IS_SPACE(ch)) {
            if (CH_NBSP == ch) ch = ' ';
            if (ch > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;
            cp++;

            // Store character in buffer; grow buffer if we have to
            NS_ASSERTION(bp < bufEnd, "whoops");
            *bp++ = ch;
            if (bp == bufEnd) {
              PRInt32 delta = bp - mBuffer;
              if (!GrowBuffer()) {
                goto done;
              }
              bp = mBuffer + delta;
              bufEnd = mBuffer + mBufferLength;
            }
            continue;
          }
          numChars = (cp - offset) - cp0;
          wordLen += numChars;
          contentLen += numChars;
          mCurrentFragOffset += numChars;
          goto done;
        }
        numChars = (cp - offset) - cp0;
        wordLen += numChars;
        contentLen += numChars;
      }
    }

    // Advance to next text fragment
    frag++;
    mCurrentFrag = frag;
    mCurrentFragOffset = 0;
    offset = 0;
  }

 done:;

  // Apply the CSS text-transform in place; whitespace is left untouched.
  if (!isWhitespace)
  {
     switch(mTextTransform)
     {
       case NS_STYLE_TEXT_TRANSFORM_CAPITALIZE:
           gCaseConv->ToTitle(mBuffer, mBuffer, wordLen, !aInWord);
         break;
       case NS_STYLE_TEXT_TRANSFORM_LOWERCASE:
           gCaseConv->ToLower(mBuffer, mBuffer, wordLen );
         break;
       case NS_STYLE_TEXT_TRANSFORM_UPPERCASE:
           gCaseConv->ToUpper(mBuffer, mBuffer, wordLen );
         break;
       default:
         break;
     }
  }

 really_done:;
  mOffset += contentLen;
  NS_ASSERTION(mOffset <= mContentLength, "whoops");
  aWordLenResult = wordLen;
  aContentLenResult = contentLen;
  aIsWhitespaceResult = isWhitespace;

  return mBuffer;
}

// Scan backward from the current position and return the previous "word":
// either a run of whitespace or a run of non-whitespace characters.
//
//   aInWord             - its negation is passed as the last argument of
//                         gCaseConv->ToTitle() when the capitalize
//                         transform is active; not used otherwise.
//   aWordLenResult      - receives the number of characters of the word
//                         (0 for a newline under NS_STYLE_WHITESPACE_PRE).
//   aContentLenResult   - receives the number of content characters
//                         consumed; mOffset moves back by this amount.
//   aIsWhitespaceResult - receives whether the first character examined
//                         was whitespace. NOT written when nsnull is
//                         returned.
//
// Returns mBuffer, or nsnull (with both lengths set to 0) when mOffset is
// already 0.
//
// NOTE(review): characters are appended to mBuffer in the order they are
// scanned, i.e. the last character of the word comes first. Unlike
// GetNextWord(), word boundaries here are always decided by whitespace;
// mLineBreaker is not consulted.
PRUnichar*
nsTextTransformer::GetPrevWord(PRBool aInWord,
                               PRInt32& aWordLenResult,
                               PRInt32& aContentLenResult,
                               PRBool& aIsWhitespaceResult)
{
  NS_PRECONDITION(mOffset <= mContentLength, "bad offset");

  // See if the content has been exhausted
  if (mOffset == 0) {
    aWordLenResult = 0;
    aContentLenResult = 0;
    return nsnull;
  }

  PRUnichar* bp = mBuffer;
  PRUnichar* bufEnd = mBuffer + mBufferLength;
  const nsTextFragment* frag = mCurrentFrag;
  const nsTextFragment* lastFrag = mFrags;//1st is the last
  PRInt32 wordLen = 1;
  PRInt32 contentLen = 1;

  // Set the isWhitespace flag by examining the character just before the
  // current position in the text fragment.
  PRInt32 offset = mCurrentFragOffset-1;
  PRUnichar firstChar;
  if (frag->Is2b()) {
    const PRUnichar* up = frag->Get2b();
    // mCurrentFragOffset may be 0, which makes offset -1. Clamp to the
    // first character exactly as the 1-byte branch below does, so the
    // fragment is never indexed before its start.
    if (offset > 0)
      firstChar = up[offset];
    else
      firstChar = up[0];
  }
  else {
    const unsigned char* cp = (const unsigned char*) frag->Get1b();
    if (offset > 0)
      firstChar = PRUnichar(cp[offset]);
    else
      firstChar = PRUnichar(cp[0]);
  }
  PRBool isWhitespace = XP_IS_SPACE(firstChar);
  offset--;
  if (isWhitespace) {
    if (NS_STYLE_WHITESPACE_PRE == mWhiteSpace) {
      if ('\t' == firstChar) {
        // Leave tab alone so that caller can expand it
      }
      else if ('\n' == firstChar) {
        // Advance content past newline but do not allow newline to
        // remain in the word.
        wordLen--;
      }
      else {
        firstChar = ' ';
      }
    }
    else {
      firstChar = ' ';
    }
  }
  else if (CH_NBSP == firstChar) {
    firstChar = ' ';
  }
  // Keep the multibyte hint in step with GetNextWord(), which also checks
  // the first character of the word.
  if (firstChar > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;
  *bp++ = firstChar;
  mCurrentFragOffset = offset +1;
  if (offset < 0) {
    // The character just consumed was the first one of its fragment.
    if (mCurrentFrag == mFrags){
      goto really_done;
    }
    mCurrentFrag = --frag;
    offset = mCurrentFrag->GetLength()-1;
  }
  if (isWhitespace && (NS_STYLE_WHITESPACE_PRE == mWhiteSpace)) {
    // Preformatted whitespace is returned one character at a time and is
    // never case-transformed.
    goto really_done;
  }

  PRInt32 numChars;
  do {
    // Scan characters in this fragment that are the same kind as the
    // isWhitespace flag indicates.
    if (frag->Is2b()) {
      const PRUnichar* cp0 = frag->Get2b();
      const PRUnichar* end = cp0;
      const PRUnichar* cp = cp0 + offset;
      if (isWhitespace) {
        // NOTE(review): "cp > end" stops before index 0, whereas the
        // non-whitespace loop below uses "cp >= end".
        while (cp > end) {
          PRUnichar ch = *cp;
          if (XP_IS_SPACE(ch)) {
            cp--;
            continue;
          }
          numChars = (cp0 + offset) - cp;
          contentLen += numChars;
          mCurrentFragOffset -= numChars;
          goto done;
        }
        numChars = (cp0 + offset) - cp;
        contentLen += numChars;
      }
      else {
        while (cp >= end) {
          PRUnichar ch = *cp;
          if (!XP_IS_SPACE(ch)) {
            if (CH_NBSP == ch) ch = ' ';
            if (ch > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;
            cp--;

            // Store character in buffer; grow buffer if we have to
            NS_ASSERTION(bp < bufEnd, "whoops");
            *bp++ = ch;
            if (bp == bufEnd) {
              PRInt32 delta = bp - mBuffer;
              if (!GrowBuffer()) {
                goto done;
              }
              bp = mBuffer + delta;
              bufEnd = mBuffer + mBufferLength;
            }
            continue;
          }
          numChars = (cp0 + offset) - cp;
          wordLen += numChars;
          contentLen += numChars;
          mCurrentFragOffset -= numChars;
          goto done;
        }
        numChars = (cp0 + offset) - cp;
        wordLen += numChars;
        contentLen += numChars;
      }
    }
    else {
      const unsigned char* cp0 = (const unsigned char*) frag->Get1b();
      const unsigned char* end = cp0;
      const unsigned char* cp = cp0 + offset;
      if (isWhitespace) {
        while (cp > end) {
          PRUnichar ch = PRUnichar(*cp);
          if (XP_IS_SPACE(ch)) {
            cp--;
            continue;
          }
          numChars = (cp0 + offset) - cp;
          contentLen += numChars;
          mCurrentFragOffset -= numChars;
          goto done;
        }
        numChars = (cp0 + offset) - cp;
        contentLen += numChars;
      }
      else {
        while (cp >= end) {
          PRUnichar ch = PRUnichar(*cp);
          if (!XP_IS_SPACE(ch)) {
            if (CH_NBSP == ch) ch = ' ';
            if (ch > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;
            cp--;

            // Store character in buffer; grow buffer if we have to
            NS_ASSERTION(bp < bufEnd, "whoops");
            *bp++ = ch;
            if (bp == bufEnd) {
              PRInt32 delta = bp - mBuffer;
              if (!GrowBuffer()) {
                goto done;
              }
              bp = mBuffer + delta;
              bufEnd = mBuffer + mBufferLength;
            }
            continue;
          }
          numChars = (cp0 + offset) - cp;
          wordLen += numChars;
          contentLen += numChars;
          mCurrentFragOffset -= numChars;
          goto done;
        }
        numChars = (cp0 + offset) - cp;
        wordLen += numChars;
        contentLen += numChars;
      }
    }

    // Step back to the preceding text fragment, or pin the position to the
    // start of the first fragment when there is none.
    if (frag != lastFrag)
    {
      frag--;
      mCurrentFrag = frag;
      mCurrentFragOffset = mCurrentFrag->GetLength()-1;
      offset = mCurrentFragOffset;
    }
    else
      mCurrentFragOffset = 0;
  }
  while (frag > lastFrag);

 done:;

  // Apply the CSS text-transform in place; whitespace is left untouched.
  if (!isWhitespace)
  {
     switch(mTextTransform)
     {
       case NS_STYLE_TEXT_TRANSFORM_CAPITALIZE:
           gCaseConv->ToTitle(mBuffer, mBuffer, wordLen, !aInWord);
         break;
       case NS_STYLE_TEXT_TRANSFORM_LOWERCASE:
           gCaseConv->ToLower(mBuffer, mBuffer, wordLen );
         break;
       case NS_STYLE_TEXT_TRANSFORM_UPPERCASE:
           gCaseConv->ToUpper(mBuffer, mBuffer, wordLen );
         break;
       default:
         break;
     }
  }


 really_done:;
  mOffset -= contentLen;
  NS_ASSERTION(mOffset >= 0, "whoops");
  aWordLenResult = wordLen;
  aContentLenResult = contentLen;
  aIsWhitespaceResult = isWhitespace;

  return mBuffer;
}

// Return a pointer to the character at index aOffset of the output buffer.
// No bounds checking is performed.
PRUnichar*
nsTextTransformer::GetTextAt(PRInt32 aOffset)
{
  // XXX
  return &mBuffer[aOffset];
}
new 1998-10-20 04:17:17 +04:00			`/* -- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 --`
			`*`
			`* The contents of this file are subject to the Netscape Public License`
			`* Version 1.0 (the "License"); you may not use this file except in`
			`* compliance with the License. You may obtain a copy of the License at`
			`* http://www.mozilla.org/NPL/`
			`*`
			`* Software distributed under the License is distributed on an "AS IS"`
			`* basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See`
			`* the License for the specific language governing rights and limitations`
			`* under the License.`
			`*`
			`* The Original Code is Mozilla Communicator client code.`
			`*`
			`* The Initial Developer of the Original Code is Netscape Communications`
			`* Corporation. Portions created by Netscape are Copyright (C) 1998`
			`* Netscape Communications Corporation. All Rights Reserved.`
			`*/`
			`#include "nsTextTransformer.h"`
			`#include "nsIContent.h"`
			`#include "nsIFrame.h"`
			`#include "nsIStyleContext.h"`
			`#include "nsITextContent.h"`
			`#include "nsStyleConsts.h"`
change nsTextTransformer to break line by calling nsILineBreak and make nsTextFrame pass the nsILineBreaker to nsTextTransformer 1999-02-24 21:21:23 +03:00			`#include "nsILineBreaker.h"`
new 1998-10-20 04:17:17 +04:00
Make Case conversion work for non-Latin1 Unicode. Reviewed by kipp. Perofrmance is the same after changing this. 1999-02-23 05:27:54 +03:00
			`#include "nsIServiceManager.h"`
			`#include "nsUnicharUtilCIID.h"`
			`#include "nsICaseConversion.h"`

			`static NS_DEFINE_IID(kUnicharUtilCID, NS_UNICHARUTIL_CID);`
			`static NS_DEFINE_IID(kICaseConversionIID, NS_ICASECONVERSION_IID);`
			`static nsICaseConversion* gCaseConv = nsnull;`

new 1998-10-20 04:17:17 +04:00			`// XXX put a copy in nsHTMLIIDs`
			`static NS_DEFINE_IID(kITextContentIID, NS_ITEXT_CONTENT_IID);`

Added support for capitalization transform 1998-10-20 20:45:14 +04:00			`// XXX I'm sure there are other special characters`
new 1998-10-20 04:17:17 +04:00			`#define CH_NBSP 160`

			`#define MAX_UNIBYTE 127`

change nsTextTransformer to break line by calling nsILineBreak and make nsTextFrame pass the nsILineBreaker to nsTextTransformer 1999-02-24 21:21:23 +03:00			`nsTextTransformer::nsTextTransformer(PRUnichar* aBuffer, PRInt32 aBufLen,`
			`nsILineBreaker* aLineBreaker)`
new 1998-10-20 04:17:17 +04:00			`: mAutoBuffer(aBuffer),`
			`mBuffer(aBuffer),`
			`mBufferLength(aBufLen < 0 ? 0 : aBufLen),`
Eliminate some compiler warnings 1999-03-05 07:28:54 +03:00			`mHasMultibyte(PR_FALSE),`
			`mLineBreaker(aLineBreaker)`
new 1998-10-20 04:17:17 +04:00			`{`
change nsTextTransformer to break line by calling nsILineBreak and make nsTextFrame pass the nsILineBreaker to nsTextTransformer 1999-02-24 21:21:23 +03:00			`NS_IF_ADDREF(mLineBreaker);`
new 1998-10-20 04:17:17 +04:00			`}`

			`nsTextTransformer::~nsTextTransformer()`
			`{`
			`if (mBuffer != mAutoBuffer) {`
			`delete [] mBuffer;`
			`}`
change nsTextTransformer to break line by calling nsILineBreak and make nsTextFrame pass the nsILineBreaker to nsTextTransformer 1999-02-24 21:21:23 +03:00			`NS_IF_RELEASE(mLineBreaker);`
new 1998-10-20 04:17:17 +04:00			`}`

			`nsresult`
			`nsTextTransformer::Init(/nsTextRun& aTextRun, XXX/`
			`nsIFrame* aFrame,`
			`PRInt32 aStartingOffset)`
			`{`
			`// Make sure we have some space in case arguments to the ctor were`
			`// bizzare.`
			`if (mBufferLength < 100) {`
			`if (!GrowBuffer()) {`
			`return NS_ERROR_OUT_OF_MEMORY;`
			`}`
			`}`

			`// Get the frames text content`
			`nsIContent* content;`
Changed some nsIFrame member functions to use ** instead of *& for OUT paremeters 1999-02-10 03:42:56 +03:00			`aFrame->GetContent(&content);`
new 1998-10-20 04:17:17 +04:00			`nsITextContent* tc;`
			`if (NS_OK != content->QueryInterface(kITextContentIID, (void**) &tc)) {`
			`NS_RELEASE(content);`
			`return NS_OK;`
			`}`
			`tc->GetText(mFrags, mNumFrags);`
			`NS_RELEASE(tc);`
			`NS_RELEASE(content);`
			`mStartingOffset = aStartingOffset;`
			`mOffset = mStartingOffset;`

			`// Compute the total length of the text content.`
			`PRInt32 sum = 0;`
			`PRInt32 n = mNumFrags;`
			`const nsTextFragment* frag = mFrags;`
			`for (; --n >= 0; frag++) {`
			`sum += frag->GetLength();`
			`}`
			`mContentLength = sum;`

			`// Set current fragment and current fragment offset`
			`mCurrentFrag = mFrags;`
			`mCurrentFragOffset = 0;`
			`PRInt32 offset = 0;`
			`n = mNumFrags;`
			`for (frag = mFrags; --n >= 0; frag++) {`
			`if (aStartingOffset < offset + frag->GetLength()) {`
			`mCurrentFrag = frag;`
			`mCurrentFragOffset = aStartingOffset - offset;`
			`break;`
			`}`
			`offset += frag->GetLength();`
			`}`
Added, jump to prev word, modified INIT of nsTextTransformer to better prepare for a start offset at the end of the mFrags list. added implementation of extra parameter to nsIFrame::PeekOffset to keep state for the next word problem of eating ws. nsTextFrame should be all set on implementation of jumping words. 1999-02-22 07:59:52 +03:00			`if (mNumFrags && aStartingOffset == mContentLength){`
			`mCurrentFrag = mFrags + (mNumFrags -1);`
			`mCurrentFragOffset = mCurrentFrag->GetLength();`
			`}`
new 1998-10-20 04:17:17 +04:00
			`// Get the frames style and choose a transform proc`
			`const nsStyleText* styleText;`
			`aFrame->GetStyleData(eStyleStruct_Text, (const nsStyleStruct*&) styleText);`
Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`mWhiteSpace = styleText->mWhiteSpace;`
Added support for capitalization transform 1998-10-20 20:45:14 +04:00			`mTextTransform = styleText->mTextTransform;`
new 1998-10-20 04:17:17 +04:00
Make Case conversion work for non-Latin1 Unicode. Reviewed by kipp. Perofrmance is the same after changing this. 1999-02-23 05:27:54 +03:00			`if(NS_STYLE_TEXT_TRANSFORM_NONE != mTextTransform)`
			`{`
			`if(nsnull == gCaseConv) {`
			`nsresult res;`
			`res = nsServiceManager::GetService(kUnicharUtilCID, kICaseConversionIID,`
			`(nsISupports**)&gCaseConv);`
			`NS_ASSERTION( NS_SUCCEEDED(res), "cannot get UnicharUtil");`
			`NS_ASSERTION( gCaseConv != NULL, "cannot get UnicharUtil");`
			`}`
			`}`
new 1998-10-20 04:17:17 +04:00			`return NS_OK;`
			`}`

			`PRBool`
			`nsTextTransformer::GrowBuffer()`
			`{`
			`PRInt32 newLen = mBufferLength * 2;`
			`if (newLen <= 100) {`
			`newLen = 100;`
			`}`
			`PRUnichar* newBuffer = new PRUnichar[newLen];`
			`if (nsnull == newBuffer) {`
			`return PR_FALSE;`
			`}`
			`if (0 != mBufferLength) {`
			`nsCRT::memcpy(newBuffer, mBuffer, sizeof(PRUnichar) * mBufferLength);`
			`if (mBuffer != mAutoBuffer) {`
			`delete [] mBuffer;`
			`}`
			`}`
			`mBuffer = newBuffer;`
Fixed bug #1257: the bug was that we were overrunning the transformers malloc'd buffer because the mBufferLength was never being updated 1998-11-15 01:27:50 +03:00			`mBufferLength = newLen;`
new 1998-10-20 04:17:17 +04:00			`return PR_TRUE;`
			`}`

			`PRUnichar*`
Added support for capitalization transform 1998-10-20 20:45:14 +04:00			`nsTextTransformer::GetNextWord(PRBool aInWord,`
			`PRInt32& aWordLenResult,`
new 1998-10-20 04:17:17 +04:00			`PRInt32& aContentLenResult,`
			`PRBool& aIsWhitespaceResult)`
			`{`
			`NS_PRECONDITION(mOffset <= mContentLength, "bad offset");`

			`// See if the content has been exhausted`
			`if (mOffset == mContentLength) {`
			`aWordLenResult = 0;`
			`aContentLenResult = 0;`
			`return nsnull;`
			`}`

			`PRUnichar* bp = mBuffer;`
			`PRUnichar* bufEnd = mBuffer + mBufferLength;`
			`const nsTextFragment* frag = mCurrentFrag;`
Fixed lastFrag computation 1998-10-21 07:07:37 +04:00			`const nsTextFragment* lastFrag = mFrags + mNumFrags;`
Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`PRInt32 wordLen = 1;`
			`PRInt32 contentLen = 1;`
new 1998-10-20 04:17:17 +04:00
			`// Set the isWhitespace flag by examining the next character in the`
			`// text fragment.`
			`PRInt32 offset = mCurrentFragOffset;`
			`PRUnichar firstChar;`
			`if (frag->Is2b()) {`
			`const PRUnichar* up = frag->Get2b();`
			`firstChar = up[offset];`
			`}`
			`else {`
			`const unsigned char* cp = (const unsigned char*) frag->Get1b();`
			`firstChar = PRUnichar(cp[offset]);`
			`}`
			`PRBool isWhitespace = XP_IS_SPACE(firstChar);`
			`offset++;`
Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`if (isWhitespace) {`
			`if (NS_STYLE_WHITESPACE_PRE == mWhiteSpace) {`
			`if ('\t' == firstChar) {`
			`// Leave tab alone so that caller can expand it`
			`}`
			`else if ('\n' == firstChar) {`
			`// Advance content past newline but do not allow newline to`
			`// remain in the word.`
			`wordLen--;`
			`}`
			`else {`
			`firstChar = ' ';`
			`}`
			`}`
			`else {`
			`firstChar = ' ';`
			`}`
			`}`
			`else if (CH_NBSP == firstChar) {`
			`firstChar = ' ';`
new 1998-10-20 04:17:17 +04:00			`}`
fix mHasMultibyte hint problem when the first character of the word is not ASCII 1999-03-11 06:00:33 +03:00			`if (firstChar > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;`
Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`*bp++ = firstChar;`
new 1998-10-20 04:17:17 +04:00			`if (offset == frag->GetLength()) {`
			`mCurrentFrag = ++frag;`
			`offset = 0;`
			`}`
			`mCurrentFragOffset = offset;`
Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`if (isWhitespace && (NS_STYLE_WHITESPACE_PRE == mWhiteSpace)) {`
			`goto really_done;`
Added support for capitalization transform 1998-10-20 20:45:14 +04:00			`}`
new 1998-10-20 04:17:17 +04:00
			`PRInt32 numChars;`
			`while (frag < lastFrag) {`
			`PRInt32 fragLen = frag->GetLength();`

			`// Scan characters in this fragment that are the same kind as the`
			`// isWhitespace flag indicates.`
			`if (frag->Is2b()) {`
			`const PRUnichar* cp0 = frag->Get2b();`
			`const PRUnichar* end = cp0 + fragLen;`
			`const PRUnichar* cp = cp0 + offset;`
Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`if (isWhitespace) {`
Added support for capitalization transform 1998-10-20 20:45:14 +04:00			`while (cp < end) {`
			`PRUnichar ch = *cp;`
			`if (XP_IS_SPACE(ch)) {`
			`cp++;`
			`continue;`
			`}`
			`numChars = (cp - offset) - cp0;`
			`contentLen += numChars;`
			`mCurrentFragOffset += numChars;`
			`goto done;`
			`}`
			`numChars = (cp - offset) - cp0;`
			`contentLen += numChars;`
			`}`
			`else {`
change nsTextTransformer to break line by calling nsILineBreak and make nsTextFrame pass the nsILineBreaker to nsTextTransformer 1999-02-24 21:21:23 +03:00			`if(wordLen > 0) {`
			`nsresult res = NS_OK;`
			`PRBool breakBetween = PR_FALSE;`
			`res = mLineBreaker->BreakInBetween(mBuffer, wordLen,`
			`cp, (fragLen-offset), &breakBetween);`
			`if ( breakBetween )`
			`goto done;`
Added support for capitalization transform 1998-10-20 20:45:14 +04:00
change nsTextTransformer to break line by calling nsILineBreak and make nsTextFrame pass the nsILineBreaker to nsTextTransformer 1999-02-24 21:21:23 +03:00			`PRBool tryNextFrag = PR_FALSE;`
			`PRUint32 next;`

			`// Find next position`
			`res = mLineBreaker->Next(cp0, fragLen, offset, &next, &tryNextFrag);`

			`numChars = (next - offset);`
			`// check buffer size before copy`
			`if((bp + numChars ) > bufEnd) {`
			`PRInt32 delta = bp - mBuffer;`
			`if(!GrowBuffer()) {`
			`goto done;`
			`}`
			`bp = mBuffer + delta;`
			`bufEnd = mBuffer + mBufferLength;`
			`}`

			`wordLen += numChars;`
			`mCurrentFragOffset += numChars;`
			`contentLen += numChars;`
			`end = cp + numChars;`

			`// 1. convert nbsp into space`
			`// 2. check mHasMultibyte flag`
			`// 3. copy buffer`

			`while(cp < end) {`
			`PRUnichar ch = *cp++;`
			`if (CH_NBSP == ch) ch = ' ';`
			`if (ch > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;`
			`*bp++ = ch;`
			`}`
			`if(! tryNextFrag) {`
			`// can decide break position inside this TextFrag`
			`goto done;`
			`}`
			`}`
Added support for capitalization transform 1998-10-20 20:45:14 +04:00			`}`
			`}`
			`else {`
			`const unsigned char* cp0 = (const unsigned char*) frag->Get1b();`
			`const unsigned char* end = cp0 + fragLen;`
			`const unsigned char* cp = cp0 + offset;`
Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`if (isWhitespace) {`
Added support for capitalization transform 1998-10-20 20:45:14 +04:00			`while (cp < end) {`
			`PRUnichar ch = PRUnichar(*cp);`
			`if (XP_IS_SPACE(ch)) {`
			`cp++;`
			`continue;`
			`}`
			`numChars = (cp - offset) - cp0;`
			`contentLen += numChars;`
			`mCurrentFragOffset += numChars;`
			`goto done;`
			`}`
			`numChars = (cp - offset) - cp0;`
			`contentLen += numChars;`
			`}`
			`else {`
			`while (cp < end) {`
			`PRUnichar ch = PRUnichar(*cp);`
			`if (!XP_IS_SPACE(ch)) {`
			`if (CH_NBSP == ch) ch = ' ';`
			`if (ch > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;`
			`cp++;`

			`// Store character in buffer; grow buffer if we have to`
Fixed bug #1257: the bug was that we were overrunning the transformers malloc'd buffer because the mBufferLength was never being updated 1998-11-15 01:27:50 +03:00			`NS_ASSERTION(bp < bufEnd, "whoops");`
Added support for capitalization transform 1998-10-20 20:45:14 +04:00			`*bp++ = ch;`
			`if (bp == bufEnd) {`
			`PRInt32 delta = bp - mBuffer;`
			`if (!GrowBuffer()) {`
			`goto done;`
			`}`
			`bp = mBuffer + delta;`
			`bufEnd = mBuffer + mBufferLength;`
			`}`
			`continue;`
			`}`
			`numChars = (cp - offset) - cp0;`
			`wordLen += numChars;`
			`contentLen += numChars;`
			`mCurrentFragOffset += numChars;`
			`goto done;`
			`}`
			`numChars = (cp - offset) - cp0;`
			`wordLen += numChars;`
			`contentLen += numChars;`
			`}`
			`}`

			`// Advance to next text fragment`
			`frag++;`
			`mCurrentFrag = frag;`
			`mCurrentFragOffset = 0;`
			`offset = 0;`
			`}`

			`done:;`
new 1998-10-20 04:17:17 +04:00
Make Case conversion work for non-Latin1 Unicode. Reviewed by kipp. Perofrmance is the same after changing this. 1999-02-23 05:27:54 +03:00			`if (!isWhitespace)`
			`{`
			`switch(mTextTransform)`
			`{`
			`case NS_STYLE_TEXT_TRANSFORM_CAPITALIZE:`
			`gCaseConv->ToTitle(mBuffer, mBuffer, wordLen, !aInWord);`
			`break;`
			`case NS_STYLE_TEXT_TRANSFORM_LOWERCASE:`
			`gCaseConv->ToLower(mBuffer, mBuffer, wordLen );`
			`break;`
			`case NS_STYLE_TEXT_TRANSFORM_UPPERCASE:`
			`gCaseConv->ToUpper(mBuffer, mBuffer, wordLen );`
			`break;`
			`default:`
			`break;`
			`}`
new 1998-10-20 04:17:17 +04:00			`}`

Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`really_done:;`
new 1998-10-20 04:17:17 +04:00			`mOffset += contentLen;`
			`NS_ASSERTION(mOffset <= mContentLength, "whoops");`
Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`aWordLenResult = wordLen;`
new 1998-10-20 04:17:17 +04:00			`aContentLenResult = contentLen;`
Slimmed down the implementation 1998-10-22 00:05:31 +04:00			`aIsWhitespaceResult = isWhitespace;`

new 1998-10-20 04:17:17 +04:00			`return mBuffer;`
			`}`

gettig word jumping to work, adding GetPrevWord to texttransformer 1999-02-22 06:20:59 +03:00			`PRUnichar*`
			`nsTextTransformer::GetPrevWord(PRBool aInWord,`
			`PRInt32& aWordLenResult,`
			`PRInt32& aContentLenResult,`
			`PRBool& aIsWhitespaceResult)`
			`{`
			`NS_PRECONDITION(mOffset <= mContentLength, "bad offset");`

			`// See if the content has been exhausted`
			`if (mOffset == 0) {`
			`aWordLenResult = 0;`
			`aContentLenResult = 0;`
			`return nsnull;`
			`}`

			`PRUnichar* bp = mBuffer;`
			`PRUnichar* bufEnd = mBuffer + mBufferLength;`
			`const nsTextFragment* frag = mCurrentFrag;`
			`const nsTextFragment* lastFrag = mFrags;//1st is the last`
			`PRInt32 wordLen = 1;`
			`PRInt32 contentLen = 1;`

			`// Set the isWhitespace flag by examining the next character in the`
			`// text fragment.`
			`PRInt32 offset = mCurrentFragOffset-1;`
			`PRUnichar firstChar;`
			`if (frag->Is2b()) {`
			`const PRUnichar* up = frag->Get2b();`
			`firstChar = up[offset];`
			`}`
			`else {`
			`const unsigned char* cp = (const unsigned char*) frag->Get1b();`
			`if (offset > 0)`
			`firstChar = PRUnichar(cp[offset]);`
			`else`
			`firstChar = PRUnichar(cp[0]);`
			`}`
			`PRBool isWhitespace = XP_IS_SPACE(firstChar);`
			`offset--;`
			`if (isWhitespace) {`
			`if (NS_STYLE_WHITESPACE_PRE == mWhiteSpace) {`
			`if ('\t' == firstChar) {`
			`// Leave tab alone so that caller can expand it`
			`}`
			`else if ('\n' == firstChar) {`
			`// Advance content past newline but do not allow newline to`
			`// remain in the word.`
			`wordLen--;`
			`}`
			`else {`
			`firstChar = ' ';`
			`}`
			`}`
			`else {`
			`firstChar = ' ';`
			`}`
			`}`
			`else if (CH_NBSP == firstChar) {`
			`firstChar = ' ';`
			`}`
			`*bp++ = firstChar;`
			`mCurrentFragOffset = offset +1;`
			`if (offset < 0) {`
			`if (mCurrentFrag == mFrags){`
			`goto really_done;`
			`}`
			`mCurrentFrag = --frag;`
			`offset = mCurrentFrag->GetLength()-1;`
			`}`
			`if (isWhitespace && (NS_STYLE_WHITESPACE_PRE == mWhiteSpace)) {`
			`goto really_done;`
			`}`

			`PRInt32 numChars;`
			`do {`
			`// Scan characters in this fragment that are the same kind as the`
			`// isWhitespace flag indicates.`
			`if (frag->Is2b()) {`
			`const PRUnichar* cp0 = frag->Get2b();`
			`const PRUnichar* end = cp0;`
			`const PRUnichar* cp = cp0 + offset;`
			`if (isWhitespace) {`
			`while (cp > end) {`
			`PRUnichar ch = *cp;`
			`if (XP_IS_SPACE(ch)) {`
			`cp--;`
			`continue;`
			`}`
			`numChars = (cp0 + offset) - cp;`
			`contentLen += numChars;`
			`mCurrentFragOffset -= numChars;`
			`goto done;`
			`}`
			`numChars = (cp0 + offset) - cp;`
			`contentLen += numChars;`
			`}`
			`else {`
Added, jump to prev word, modified INIT of nsTextTransformer to better prepare for a start offset at the end of the mFrags list. added implementation of extra parameter to nsIFrame::PeekOffset to keep state for the next word problem of eating ws. nsTextFrame should be all set on implementation of jumping words. 1999-02-22 07:59:52 +03:00			`while (cp >= end) {`
gettig word jumping to work, adding GetPrevWord to texttransformer 1999-02-22 06:20:59 +03:00			`PRUnichar ch = *cp;`
			`if (!XP_IS_SPACE(ch)) {`
			`if (CH_NBSP == ch) ch = ' ';`
			`if (ch > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;`
			`cp--;`

			`// Store character in buffer; grow buffer if we have to`
			`NS_ASSERTION(bp < bufEnd, "whoops");`
			`*bp++ = ch;`
			`if (bp == bufEnd) {`
			`PRInt32 delta = bp - mBuffer;`
			`if (!GrowBuffer()) {`
			`goto done;`
			`}`
			`bp = mBuffer + delta;`
			`bufEnd = mBuffer + mBufferLength;`
			`}`
			`continue;`
			`}`
			`numChars = (cp0 + offset) - cp;`
			`wordLen += numChars;`
			`contentLen += numChars;`
			`mCurrentFragOffset -= numChars;`
			`goto done;`
			`}`
			`numChars = (cp0 + offset) - cp;`
			`wordLen += numChars;`
			`contentLen += numChars;`
			`}`
			`}`
			`else {`
			`const unsigned char* cp0 = (const unsigned char*) frag->Get1b();`
			`const unsigned char* end = cp0;`
			`const unsigned char* cp = cp0 + offset;`
			`if (isWhitespace) {`
			`while (cp > end) {`
			`PRUnichar ch = PRUnichar(*cp);`
			`if (XP_IS_SPACE(ch)) {`
			`cp--;`
			`continue;`
			`}`
			`numChars = (cp0 + offset) - cp;`
			`contentLen += numChars;`
			`mCurrentFragOffset -= numChars;`
			`goto done;`
			`}`
			`numChars = (cp0 + offset) - cp;`
			`contentLen += numChars;`
			`}`
			`else {`
Added, jump to prev word, modified INIT of nsTextTransformer to better prepare for a start offset at the end of the mFrags list. added implementation of extra parameter to nsIFrame::PeekOffset to keep state for the next word problem of eating ws. nsTextFrame should be all set on implementation of jumping words. 1999-02-22 07:59:52 +03:00			`while (cp >= end) {`
gettig word jumping to work, adding GetPrevWord to texttransformer 1999-02-22 06:20:59 +03:00			`PRUnichar ch = PRUnichar(*cp);`
			`if (!XP_IS_SPACE(ch)) {`
			`if (CH_NBSP == ch) ch = ' ';`
			`if (ch > MAX_UNIBYTE) mHasMultibyte = PR_TRUE;`
			`cp--;`

			`// Store character in buffer; grow buffer if we have to`
			`NS_ASSERTION(bp < bufEnd, "whoops");`
			`*bp++ = ch;`
			`if (bp == bufEnd) {`
			`PRInt32 delta = bp - mBuffer;`
			`if (!GrowBuffer()) {`
			`goto done;`
			`}`
			`bp = mBuffer + delta;`
			`bufEnd = mBuffer + mBufferLength;`
			`}`
			`continue;`
			`}`
			`numChars = (cp0 + offset) - cp;`
			`wordLen += numChars;`
			`contentLen += numChars;`
			`mCurrentFragOffset -= numChars;`
			`goto done;`
			`}`
			`numChars = (cp0 + offset) - cp;`
			`wordLen += numChars;`
			`contentLen += numChars;`
			`}`
			`}`

			`// Advance to next text fragment`
			`if (frag != lastFrag)`
			`{`
			`frag--;`
			`mCurrentFrag = frag;`
			`mCurrentFragOffset = mCurrentFrag->GetLength()-1;`
			`offset = mCurrentFragOffset;`
			`}`
			`else`
			`mCurrentFragOffset = 0;`
			`}`
			`while (frag > lastFrag);`

			`done:;`

Make Case conversion work for non-Latin1 Unicode. Reviewed by kipp. Perofrmance is the same after changing this. 1999-02-23 05:27:54 +03:00			`if (!isWhitespace)`
			`{`
			`switch(mTextTransform)`
			`{`
			`case NS_STYLE_TEXT_TRANSFORM_CAPITALIZE:`
			`gCaseConv->ToTitle(mBuffer, mBuffer, wordLen, !aInWord);`
			`break;`
			`case NS_STYLE_TEXT_TRANSFORM_LOWERCASE:`
			`gCaseConv->ToLower(mBuffer, mBuffer, wordLen );`
			`break;`
			`case NS_STYLE_TEXT_TRANSFORM_UPPERCASE:`
			`gCaseConv->ToUpper(mBuffer, mBuffer, wordLen );`
			`break;`
			`default:`
			`break;`
			`}`
gettig word jumping to work, adding GetPrevWord to texttransformer 1999-02-22 06:20:59 +03:00			`}`

Make Case conversion work for non-Latin1 Unicode. Reviewed by kipp. Perofrmance is the same after changing this. 1999-02-23 05:27:54 +03:00
gettig word jumping to work, adding GetPrevWord to texttransformer 1999-02-22 06:20:59 +03:00			`really_done:;`
			`mOffset -= contentLen;`
			`NS_ASSERTION(mOffset >= 0, "whoops");`
			`aWordLenResult = wordLen;`
			`aContentLenResult = contentLen;`
			`aIsWhitespaceResult = isWhitespace;`

			`return mBuffer;`
			`}`

new 1998-10-20 04:17:17 +04:00			`PRUnichar*`
			`nsTextTransformer::GetTextAt(PRInt32 aOffset)`
			`{`
			`// XXX`
			`return mBuffer + aOffset;`
			`}`