pjs/layout/generic/nsTextTransformer.h

/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
 *
 * The contents of this file are subject to the Netscape Public
 * License Version 1.1 (the "License"); you may not use this file
 * except in compliance with the License. You may obtain a copy of
 * the License at http://www.mozilla.org/NPL/
 *
 * Software distributed under the License is distributed on an "AS
 * IS" basis, WITHOUT WARRANTY OF ANY KIND, either express or
 * implied. See the License for the specific language governing
 * rights and limitations under the License.
 *
 * The Original Code is Mozilla Communicator client code.
 *
 * The Initial Developer of the Original Code is Netscape Communications
 * Corporation.  Portions created by Netscape are
 * Copyright (C) 1998 Netscape Communications Corporation. All
 * Rights Reserved.
 *
 * Contributor(s): 
 */
#ifndef nsTextTransformer_h___
#define nsTextTransformer_h___

#include "nsTextFragment.h"
#include "nsISupports.h"
#include "nsIPresContext.h"

class nsIContent;
class nsIFrame;
class nsILineBreaker;
class nsIWordBreaker;

// Code points (decimal) of the non-ASCII characters that get special
// handling. The quoted text after each value is the matching HTML entity
// declaration.
// XXX I'm sure there are other special characters
#define CH_NBSP   160   // no-break space, U+00A0
#define CH_ENSP   8194  //<!ENTITY ensp    CDATA "&#8194;" -- en space, U+2002 ISOpub -->
#define CH_EMSP   8195  //<!ENTITY emsp    CDATA "&#8195;" -- em space, U+2003 ISOpub -->
// Thin space is U+2009 == 8201. This used to be defined as 8291 (U+2063),
// which contradicted the entity declaration quoted here and meant a real
// thin space never compared equal to CH_THINSP.
#define CH_THINSP 8201  //<!ENTITY thinsp  CDATA "&#8201;" -- thin space, U+2009 ISOpub -->
#define CH_ZWNJ   8204  //<!ENTITY zwnj    CDATA "&#8204;" -- zero width non-joiner, U+200C NEW RFC 2070 -->
#define CH_SHY    173   // soft hyphen, U+00AD

// Number of PRUnichar slots in nsAutoTextBuffer's built-in storage.
#define NS_TEXT_TRANSFORMER_AUTO_WORD_BUF_SIZE 128 // used to be 256

// Bit values stored in nsTextTransformer::mFlags.

// Caller asked for the transformed text to be left as ascii
#define NS_TEXT_TRANSFORMER_LEAVE_AS_ASCII            0x01

// Set when GetNextWord or GetPrevWord runs across a multibyte (> 127)
// unicode character at any point.
#define NS_TEXT_TRANSFORMER_HAS_MULTIBYTE             0x02

// The text currently held in the transform buffer is ascii
#define NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII 0x04

// Growable buffer of PRUnichar that carries a fixed-size built-in array
// (mAutoBuffer) so that it can try to avoid malloc. Ideally declared as an
// automatic (stack) variable.
class nsAutoTextBuffer {
public:
  nsAutoTextBuffer();
  ~nsAutoTextBuffer();

  // Enlarge the buffer by at least aAtLeast.
  // NOTE(review): aCopyToHead presumably selects where the existing
  // contents end up after growing -- confirm against the implementation.
  nsresult GrowBy(PRInt32 aAtLeast, PRBool aCopyToHead = PR_TRUE);

  // Enlarge the buffer to aNewSize.
  // NOTE(review): same caveat about aCopyToHead as for GrowBy.
  nsresult GrowTo(PRInt32 aNewSize, PRBool aCopyToHead = PR_TRUE);

  // Pointer to the first element of the current storage.
  PRUnichar* GetBuffer()
  {
    return mBuffer;
  }

  // Pointer mBufferLen elements past the start of the current storage.
  PRUnichar* GetBufferEnd()
  {
    return mBuffer + mBufferLen;
  }

  // Current value of mBufferLen.
  PRInt32 GetBufferLength() const
  {
    return mBufferLen;
  }

  // Current storage.
  // NOTE(review): presumably points at mAutoBuffer until the buffer has to
  // grow beyond it -- confirm in the constructor / GrowTo.
  PRUnichar* mBuffer;

  // Length of the storage at mBuffer, counted in PRUnichar elements.
  PRInt32 mBufferLen;

  // Built-in storage.
  PRUnichar mAutoBuffer[NS_TEXT_TRANSFORMER_AUTO_WORD_BUF_SIZE];
};

//----------------------------------------

/**
 * This object manages the transformation of text:
 *
 * <UL>
 * <LI>whitespace compression
 * <LI>capitalization
 * <LI>lowercasing
 * <LI>uppercasing
 * <LI>ascii to Unicode (if requested)
 * <LI>discarded characters
 * <LI>conversion of &nbsp; that is not part of whitespace into a space
 * <LI>tab and newline characters to space (normal text only)
 * </UL>
 *
 * Note that no transformations are applied that would impact word
 * breaking (like mapping &nbsp; into space, for example). In
 * addition, this logic will not strip leading or trailing whitespace
 * (across the entire run of text; leading whitespace can be skipped
 * for a frame's text because of whitespace compression).
 */
class nsTextTransformer {
public:
  // Note: the text transformer does not take a reference on the line
  // breaker or the word breaker; both are kept as weak pointers.
  nsTextTransformer(nsILineBreaker* aLineBreaker,
                    nsIWordBreaker* aWordBreaker,
                    nsIPresContext* aPresContext);

  ~nsTextTransformer();

  /**
   * Prepare the transformer for a piece of text. After this call, iterate
   * the text with GetNextWord() and GetPrevWord().
   *
   * By default all text is transformed to Unicode. Passing PR_TRUE for
   * aLeaveAsAscii asks for the text to stay ascii when possible. Text is
   * never stepped down from Unicode to ascii (even when it contains no
   * multibyte characters), so this only takes effect for text fragments
   * that hold 1-byte text.
   * XXX This is currently not implemented for GetPrevWord()
   * @see TransformedTextIsAscii()
   */
  nsresult Init(nsIFrame* aFrame,
                nsIContent* aContent,
                PRInt32 aStartingOffset,
                PRBool aLeaveAsAscii = PR_FALSE);

  // Length of the text fragment being processed, or 0 when there is none.
  PRInt32 GetContentLength() const {
    if (!mFrag) {
      return 0;
    }
    return mFrag->GetLength();
  }

  /**
   * Advance to the next word in the text fragment.
   *
   * The return value points at the word. The out parameters receive the
   * number of characters in the word, the content length of the word,
   * whether the word is whitespace, and whether the text was transformed
   * (any of the transformations this class performs). The content length
   * can exceed the word length when whitespace was compressed or
   * characters were discarded.
   *
   * By default the transform buffer is reset to its beginning on every
   * call; pass PR_FALSE for aResetTransformBuf to keep buffering across
   * multiple words.
   */
  PRUnichar* GetNextWord(PRBool aInWord,
                         PRInt32* aWordLenResult,
                         PRInt32* aContentLenResult,
                         PRBool* aIsWhitespaceResult,
                         PRBool* aWasTransformed,
                         PRBool aResetTransformBuf = PR_TRUE,
                         PRBool aForLineBreak = PR_TRUE);

  // Counterpart of GetNextWord() for iterating backwards. It has no
  // aWasTransformed or aResetTransformBuf parameters.
  PRUnichar* GetPrevWord(PRBool aInWord,
                         PRInt32* aWordLenResult,
                         PRInt32* aContentLenResult,
                         PRBool* aIsWhitespaceResult,
                         PRBool aForLineBreak = PR_TRUE);


  // PR_TRUE when the LEAVE_AS_ASCII bit of mFlags is set
  PRBool LeaveAsAscii() const {
    if (mFlags & NS_TEXT_TRANSFORMER_LEAVE_AS_ASCII) {
      return PR_TRUE;
    }
    return PR_FALSE;
  }

  // PR_TRUE when any of the characters are multibyte (greater than 127)
  PRBool HasMultibyte() const {
    if (mFlags & NS_TEXT_TRANSFORMER_HAS_MULTIBYTE) {
      return PR_TRUE;
    }
    return PR_FALSE;
  }

  // PR_TRUE when the text in the transform buffer is ascii (i.e., it
  // contains no multibyte characters)
  PRBool TransformedTextIsAscii() const {
    if (mFlags & NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII) {
      return PR_TRUE;
    }
    return PR_FALSE;
  }

  // Sets (aValue non-zero) or clears the LEAVE_AS_ASCII bit
  void SetLeaveAsAscii(PRBool aValue) {
    if (aValue) {
      mFlags |= NS_TEXT_TRANSFORMER_LEAVE_AS_ASCII;
    } else {
      mFlags &= (~NS_TEXT_TRANSFORMER_LEAVE_AS_ASCII);
    }
  }

  // Sets (aValue non-zero) or clears the NS_TEXT_TRANSFORMER_HAS_MULTIBYTE bit
  void SetHasMultibyte(PRBool aValue) {
    if (aValue) {
      mFlags |= NS_TEXT_TRANSFORMER_HAS_MULTIBYTE;
    } else {
      mFlags &= (~NS_TEXT_TRANSFORMER_HAS_MULTIBYTE);
    }
  }

  // Sets (aValue non-zero) or clears the
  // NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII bit
  void SetTransformedTextIsAscii(PRBool aValue) {
    if (aValue) {
      mFlags |= NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII;
    } else {
      mFlags &= (~NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII);
    }
  }

  // Start of the buffer that holds the transformed words
  PRUnichar* GetWordBuffer() {
    return mTransformBuf.GetBuffer();
  }

  // Length of the buffer that holds the transformed words
  PRInt32 GetWordBufferLength() const {
    return mTransformBuf.GetBufferLength();
  }


  // Class-wide setup and teardown.
  // NOTE(review): what these set up is not visible from this header.
  static nsresult Initialize();
  static void Shutdown();

protected:
  // Scanning helpers used by GetNextWord (F == forwards)
  PRInt32 ScanNormalWhiteSpace_F();
  PRInt32 ScanNormalAsciiText_F(PRInt32* aWordLen,
                                PRBool*  aWasTransformed);
  PRInt32 ScanNormalAsciiText_F_ForWordBreak(PRInt32* aWordLen,
                                             PRBool*  aWasTransformed);
  PRInt32 ScanNormalUnicodeText_F(PRBool aForLineBreak,
                                  PRInt32* aWordLen,
                                  PRBool*  aWasTransformed);
  PRInt32 ScanPreWrapWhiteSpace_F(PRInt32* aWordLen);
  PRInt32 ScanPreAsciiData_F(PRInt32* aWordLen,
                             PRBool*  aWasTransformed);
  PRInt32 ScanPreData_F(PRInt32* aWordLen,
                        PRBool*  aWasTransformed);

  // Scanning helpers used by GetPrevWord (B == backwards)
  PRInt32 ScanNormalWhiteSpace_B();
  PRInt32 ScanNormalAsciiText_B(PRInt32* aWordLen);
  PRInt32 ScanNormalUnicodeText_B(PRBool aForLineBreak, PRInt32* aWordLen);
  PRInt32 ScanPreWrapWhiteSpace_B(PRInt32* aWordLen);
  PRInt32 ScanPreData_B(PRInt32* aWordLen);

  // Converts the text currently held in the transform buffer from ascii
  // to Unicode
  void ConvertTransformedTextToUnicode();

  // Applies the transform selected by mLanguageSpecificTransformType.
  // NOTE(review): presumably rewrites aText in place and reports any change
  // through aWasTransformed -- confirm in the implementation.
  void LanguageSpecificTransform(PRUnichar* aText, PRInt32 aLen,
                                 PRBool* aWasTransformed);

  // Text fragment currently being processed
  const nsTextFragment* mFrag;

  // Current offset into the text fragment
  PRInt32 mOffset;

  // White-space mode of the frame, used to decide how text is processed
  enum {
    eNormal,
    ePreformatted,
    ePreWrap
  } mMode;

  nsILineBreaker* mLineBreaker;  // [WEAK]

  nsIWordBreaker* mWordBreaker;  // [WEAK]

  nsLanguageSpecificTransformType mLanguageSpecificTransformType;

  // Holds the transformed words produced by GetNextWord or GetPrevWord
  nsAutoTextBuffer mTransformBuf;

  // Current position inside the buffer. Needed while iterating forwards,
  // because the caller may ask to buffer across multiple words
  PRInt32 mBufferPos;

  // Text-transform state of the frame
  PRUint8 mTextTransform;

  // Bit set of NS_TEXT_TRANSFORMER_* flags: leave-as-ascii, has-multibyte
  // and transformed-text-is-ascii
  PRUint8 mFlags;

#ifdef DEBUG
  // Debug-only self test.
  static void SelfTest(nsILineBreaker* aLineBreaker,
                       nsIWordBreaker* aWordBreaker,
                       nsIPresContext* aPresContext);

  // Debug-only initializer that takes the text fragment and the style
  // values directly.
  nsresult Init2(const nsTextFragment* aFrag,
                 PRInt32 aStartingOffset,
                 PRUint8 aWhiteSpace,
                 PRUint8 aTextTransform);
#endif
};

#endif /* nsTextTransformer_h___ */
new 1998-10-20 04:17:17 +04:00			`/* -- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 --`
			`*`
updated license boilerplate to xPL 1.1, a=chofmann@netscape.com,r=endico@mozilla.org 1999-11-06 06:40:37 +03:00			`* The contents of this file are subject to the Netscape Public`
			`* License Version 1.1 (the "License"); you may not use this file`
			`* except in compliance with the License. You may obtain a copy of`
			`* the License at http://www.mozilla.org/NPL/`
new 1998-10-20 04:17:17 +04:00			`*`
updated license boilerplate to xPL 1.1, a=chofmann@netscape.com,r=endico@mozilla.org 1999-11-06 06:40:37 +03:00			`* Software distributed under the License is distributed on an "AS`
			`* IS" basis, WITHOUT WARRANTY OF ANY KIND, either express or`
			`* implied. See the License for the specific language governing`
			`* rights and limitations under the License.`
new 1998-10-20 04:17:17 +04:00			`*`
			`* The Original Code is Mozilla Communicator client code.`
			`*`
			`* The Initial Developer of the Original Code is Netscape Communications`
updated license boilerplate to xPL 1.1, a=chofmann@netscape.com,r=endico@mozilla.org 1999-11-06 06:40:37 +03:00			`* Corporation. Portions created by Netscape are`
			`* Copyright (C) 1998 Netscape Communications Corporation. All`
			`* Rights Reserved.`
			`*`
			`* Contributor(s):`
new 1998-10-20 04:17:17 +04:00			`*/`
			`#ifndef nsTextTransformer_h___`
			`#define nsTextTransformer_h___`

			`#include "nsTextFragment.h"`
			`#include "nsISupports.h"`
bug 4238; r/a=ftang,buster,waterson; added language specific transforms so that we can do things like U+005C -> U+00A5 (backslash -> yen sign for ja) 2000-09-21 03:00:32 +04:00			`#include "nsIPresContext.h"`
new 1998-10-20 04:17:17 +04:00
Minor changes to reduce the amount of unnecessary ref counting and speed things up a little 1999-09-17 03:31:59 +04:00			`class nsIContent;`
new 1998-10-20 04:17:17 +04:00			`class nsIFrame;`
change nsTextTransformer to break line by calling nsILineBreak and make nsTextFrame pass the nsILineBreaker to nsTextTransformer 1999-02-24 21:21:23 +03:00			`class nsILineBreaker;`
add one boolean to indicate word break or line break 1999-04-07 02:41:44 +04:00			`class nsIWordBreaker;`
new 1998-10-20 04:17:17 +04:00
r=ftang (someday); fixed 17559 regression - there were a few cases where characters > 127 were leaking out without setting the mHasMultibyte flag that were triggering painting bugs on macs... 1999-11-01 18:32:37 +03:00			`// XXX I'm sure there are other special characters`
			`#define CH_NBSP 160`
#14588 Ctrl+right arrow skips over nbsp (nbsp should be word break) ra=ftang a new fix which changes only apply to word jump. 2000-08-25 01:13:18 +04:00			`#define CH_ENSP 8194 //<!ENTITY ensp CDATA " " -- en space, U+2002 ISOpub -->`
			`#define CH_EMSP 8195 //<!ENTITY emsp CDATA " " -- em space, U+2003 ISOpub -->`
			`#define CH_THINSP 8291 //<!ENTITY thinsp CDATA " " -- thin space, U+2009 ISOpub -->`
			`#define CH_ZWNJ 8204 //<!ENTITY zwnj CDATA "‌" -- zero width non-joiner, U+200C NEW RFC 2070#define CH_SHY 173`
r=ftang (someday); fixed 17559 regression - there were a few cases where characters > 127 were leaking out without setting the mHasMultibyte flag that were triggering painting bugs on macs... 1999-11-01 18:32:37 +03:00			`#define CH_SHY 173`

fix for bug 50432. PRPackedBools compressed to one flag. mAutoBuffer size reduced to 128. r=buster 2000-09-12 04:00:58 +04:00			`#define NS_TEXT_TRANSFORMER_AUTO_WORD_BUF_SIZE 128 // used to be 256`

			`// Indicates whether the transformed text should be left as ascii`
			`#define NS_TEXT_TRANSFORMER_LEAVE_AS_ASCII 1`

			`// If at any point during GetNextWord or GetPrevWord we`
			`// run across a multibyte (> 127) unicode character.`
			`#define NS_TEXT_TRANSFORMER_HAS_MULTIBYTE 2`

			`// The text in the transform buffer is ascii`
			`#define NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII 4`
Changed to have the stack buffer embedded in the xformer 1999-09-22 04:40:16 +04:00
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`// A growable text buffer that tries to avoid using malloc by having a`
			`// builtin buffer. Ideally used as an automatic variable.`
			`class nsAutoTextBuffer {`
			`public:`
			`nsAutoTextBuffer();`
			`~nsAutoTextBuffer();`

			`nsresult GrowBy(PRInt32 aAtLeast, PRBool aCopyToHead = PR_TRUE);`

			`nsresult GrowTo(PRInt32 aNewSize, PRBool aCopyToHead = PR_TRUE);`

			`PRUnichar* GetBuffer() { return mBuffer; }`
			`PRUnichar* GetBufferEnd() { return mBuffer + mBufferLen; }`
			`PRInt32 GetBufferLength() const { return mBufferLen; }`

			`PRUnichar* mBuffer;`
			`PRInt32 mBufferLen;`
			`PRUnichar mAutoBuffer[NS_TEXT_TRANSFORMER_AUTO_WORD_BUF_SIZE];`
			`};`

			`//----------------------------------------`

new 1998-10-20 04:17:17 +04:00			`/**`
			`* This object manages the transformation of text:`
			`*`
			`* <UL>`
			`* <LI>whitespace compression`
			`* <LI>capitalization`
			`* <LI>lowercasing`
			`* <LI>uppercasing`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`* <LI>ascii to Unicode (if requested)`
Eliminated buffering that the text frame was doing when measuring text in runs and changed the text transformer code to do the buffering instead. It was already copying the transformed text into its internal buffer anyway, so this saves the extra copy 2000-04-04 18:14:47 +04:00			`* <LI>discarded characters`
			`* <LI>conversion of &nbsp that is not part of whitespace into a space`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`* <LI>tab and newline characters to space (normal text only)`
new 1998-10-20 04:17:17 +04:00			`* </UL>`
			`*`
			`* Note that no transformations are applied that would impact word`
			`* breaking (like mapping   into space, for example). In`
			`* addition, this logic will not strip leading or trailing whitespace`
			`* (across the entire run of text; leading whitespace can be skipped`
			`* for a frames text because of whitespace compression).`
			`*/`
			`class nsTextTransformer {`
			`public:`
Changed to have the stack buffer embedded in the xformer 1999-09-22 04:40:16 +04:00			`// Note: The text transformer does not hold a reference to the line`
			`// breaker and work breaker objects`
			`nsTextTransformer(nsILineBreaker* aLineBreaker,`
bug 4238; r/a=ftang,buster,waterson; added language specific transforms so that we can do things like U+005C -> U+00A5 (backslash -> yen sign for ja) 2000-09-21 03:00:32 +04:00			`nsIWordBreaker* aWordBreaker,`
			`nsIPresContext* aPresContext);`
change nsTextTransformer to break line by calling nsILineBreak and make nsTextFrame pass the nsILineBreaker to nsTextTransformer 1999-02-24 21:21:23 +03:00
new 1998-10-20 04:17:17 +04:00			`~nsTextTransformer();`

			`/**`
Eliminated buffering that the text frame was doing when measuring text in runs and changed the text transformer code to do the buffering instead. It was already copying the transformed text into its internal buffer anyway, so this saves the extra copy 2000-04-04 18:14:47 +04:00			`* Initialize the text transform. Use GetNextWord() and GetPrevWord()`
			`* to iterate the text`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`*`
			`* The default is to transform all text to Unicode; however, you can`
			`* specify that the text should be left as ascii if possible. Note that`
			`* we don't step the text down from Unicode to ascii (even if it doesn't`
			`* contain multibyte characters) so this only happens for text fragments`
			`* that contain 1-byte text.`
			`* XXX This is currently not implemented for GetPreviousWord()`
			`* @see TransformedTextIsAscii()`
new 1998-10-20 04:17:17 +04:00			`*/`
Minor changes to reduce the amount of unnecessary ref counting and speed things up a little 1999-09-17 03:31:59 +04:00			`nsresult Init(nsIFrame* aFrame,`
			`nsIContent* aContent,`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`PRInt32 aStartingOffset,`
			`PRBool aLeaveAsAscii = PR_FALSE);`
new 1998-10-20 04:17:17 +04:00
			`PRInt32 GetContentLength() const {`
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`return mFrag ? mFrag->GetLength() : 0;`
new 1998-10-20 04:17:17 +04:00			`}`

Eliminated buffering that the text frame was doing when measuring text in runs and changed the text transformer code to do the buffering instead. It was already copying the transformed text into its internal buffer anyway, so this saves the extra copy 2000-04-04 18:14:47 +04:00			`/**`
			`* Iterates the next word in the text fragment.`
			`*`
			`* Returns a pointer to the word, the number of characters in the word, the`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`* content length of the word, whether it is whitespace, and whether the`
			`* text was transformed (any of the transformations listed above). The content`
			`* length can be greater than the word length if whitespace compression occured`
			`* or if characters were discarded`
Eliminated buffering that the text frame was doing when measuring text in runs and changed the text transformer code to do the buffering instead. It was already copying the transformed text into its internal buffer anyway, so this saves the extra copy 2000-04-04 18:14:47 +04:00			`*`
			`* The default behavior is to reset the transform buffer to the beginning,`
			`* but you can choose to not reste it and buffer across multiple words`
			`*/`
Added support for capitalization transform 1998-10-20 20:45:14 +04:00			`PRUnichar* GetNextWord(PRBool aInWord,`
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`PRInt32* aWordLenResult,`
			`PRInt32* aContentLenResult,`
			`PRBool* aIsWhitespaceResult,`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`PRBool* aWasTransformed,`
Eliminated buffering that the text frame was doing when measuring text in runs and changed the text transformer code to do the buffering instead. It was already copying the transformed text into its internal buffer anyway, so this saves the extra copy 2000-04-04 18:14:47 +04:00			`PRBool aResetTransformBuf = PR_TRUE,`
add one boolean to indicate word break or line break 1999-04-07 02:41:44 +04:00			`PRBool aForLineBreak = PR_TRUE);`
new 1998-10-20 04:17:17 +04:00
gettig word jumping to work, adding GetPrevWord to texttransformer 1999-02-22 06:20:59 +03:00			`PRUnichar* GetPrevWord(PRBool aInWord,`
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`PRInt32* aWordLenResult,`
			`PRInt32* aContentLenResult,`
			`PRBool* aIsWhitespaceResult,`
			`PRBool aForLineBreak = PR_TRUE);`

fix for bug 50432. PRPackedBools compressed to one flag. mAutoBuffer size reduced to 128. r=buster 2000-09-12 04:00:58 +04:00
			`// Returns PR_TRUE if the LEAVE_AS_ASCII flag is set`
			`PRBool LeaveAsAscii() const {`
			`return (mFlags & NS_TEXT_TRANSFORMER_LEAVE_AS_ASCII) ? PR_TRUE : PR_FALSE;`
			`}`

			`// Returns PR_TRUE if any of the characters are multibyte (greater than 127)`
new 1998-10-20 04:17:17 +04:00			`PRBool HasMultibyte() const {`
fix for bug 50432. PRPackedBools compressed to one flag. mAutoBuffer size reduced to 128. r=buster 2000-09-12 04:00:58 +04:00			`return (mFlags & NS_TEXT_TRANSFORMER_HAS_MULTIBYTE) ? PR_TRUE : PR_FALSE;`
new 1998-10-20 04:17:17 +04:00			`}`

fix for bug 50432. PRPackedBools compressed to one flag. mAutoBuffer size reduced to 128. r=buster 2000-09-12 04:00:58 +04:00			`// Returns PR_TRUE if the text in the transform bufer is ascii (i.e., it`
			`// doesn't contain any multibyte characters)`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`PRBool TransformedTextIsAscii() const {`
fix for bug 50432. PRPackedBools compressed to one flag. mAutoBuffer size reduced to 128. r=buster 2000-09-12 04:00:58 +04:00			`return (mFlags & NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII) ? PR_TRUE : PR_FALSE;`
			`}`

			`// Set or clears the LEAVE_AS_ASCII bit`
			`void SetLeaveAsAscii(PRBool aValue) {`
			`aValue ? mFlags \|= NS_TEXT_TRANSFORMER_LEAVE_AS_ASCII :`
			`mFlags &= (~NS_TEXT_TRANSFORMER_LEAVE_AS_ASCII);`
			`}`

			`// Set or clears the NS_TEXT_TRANSFORMER_HAS_MULTIBYTE bit`
			`void SetHasMultibyte(PRBool aValue) {`
			`aValue ? mFlags \|= NS_TEXT_TRANSFORMER_HAS_MULTIBYTE :`
			`mFlags &= (~NS_TEXT_TRANSFORMER_HAS_MULTIBYTE);`
			`}`

			`// Set or clears the NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII bit`
			`void SetTransformedTextIsAscii(PRBool aValue) {`
			`aValue ? mFlags \|= NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII :`
			`mFlags &= (~NS_TEXT_TRANSFORMER_TRANSFORMED_TEXT_IS_ASCII);`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`}`

Changed to have the stack buffer embedded in the xformer 1999-09-22 04:40:16 +04:00			`PRUnichar* GetWordBuffer() {`
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`return mTransformBuf.GetBuffer();`
Changed to have the stack buffer embedded in the xformer 1999-09-22 04:40:16 +04:00			`}`

			`PRInt32 GetWordBufferLength() const {`
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`return mTransformBuf.GetBufferLength();`
Changed to have the stack buffer embedded in the xformer 1999-09-22 04:40:16 +04:00			`}`
new 1998-10-20 04:17:17 +04:00
fix for bug 50432. PRPackedBools compressed to one flag. mAutoBuffer size reduced to 128. r=buster 2000-09-12 04:00:58 +04:00
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`static nsresult Initialize();`
			`static void Shutdown();`
new 1998-10-20 04:17:17 +04:00
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`protected:`
			`// Helper methods for GetNextWord (F == forwards)`
			`PRInt32 ScanNormalWhiteSpace_F();`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`PRInt32 ScanNormalAsciiText_F(PRInt32* aWordLen,`
			`PRBool* aWasTransformed);`
#14588 Ctrl+right arrow skips over nbsp (nbsp should be word break) ra=ftang a new fix which changes only apply to word jump. 2000-08-25 01:13:18 +04:00			`PRInt32 ScanNormalAsciiText_F_ForWordBreak(PRInt32* aWordLen,`
			`PRBool* aWasTransformed);`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`PRInt32 ScanNormalUnicodeText_F(PRBool aForLineBreak,`
			`PRInt32* aWordLen,`
			`PRBool* aWasTransformed);`
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`PRInt32 ScanPreWrapWhiteSpace_F(PRInt32* aWordLen);`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`PRInt32 ScanPreAsciiData_F(PRInt32* aWordLen,`
			`PRBool* aWasTransformed);`
			`PRInt32 ScanPreData_F(PRInt32* aWordLen,`
			`PRBool* aWasTransformed);`
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00
			`// Helper methods for GetPrevWord (B == backwards)`
			`PRInt32 ScanNormalWhiteSpace_B();`
			`PRInt32 ScanNormalAsciiText_B(PRInt32* aWordLen);`
			`PRInt32 ScanNormalUnicodeText_B(PRBool aForLineBreak, PRInt32* aWordLen);`
			`PRInt32 ScanPreWrapWhiteSpace_B(PRInt32* aWordLen);`
			`PRInt32 ScanPreData_B(PRInt32* aWordLen);`

Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00			`// Converts the current text in the transform buffer from ascii to`
			`// Unicode`
			`void ConvertTransformedTextToUnicode();`

bug 4238; r/a=ftang,buster,waterson; added language specific transforms so that we can do things like U+005C -> U+00A5 (backslash -> yen sign for ja) 2000-09-21 03:00:32 +04:00			`void LanguageSpecificTransform(PRUnichar* aText, PRInt32 aLen,`
			`PRBool* aWasTransformed);`

r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`// The text fragment that we are looking at`
r=troy; revised nsITextContent api to simplify it and the consumers; this is done as prep work for bug 9101 1999-10-16 03:36:07 +04:00			`const nsTextFragment* mFrag;`
new 1998-10-20 04:17:17 +04:00
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`// Our current offset into the text fragment`
			`PRInt32 mOffset;`

			`// The frame's white-space mode we are using to process text`
			`enum {`
			`eNormal,`
			`ePreformatted,`
			`ePreWrap`
			`} mMode;`
fix for bug 50432. PRPackedBools compressed to one flag. mAutoBuffer size reduced to 128. r=buster 2000-09-12 04:00:58 +04:00
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`nsILineBreaker* mLineBreaker; // [WEAK]`

			`nsIWordBreaker* mWordBreaker; // [WEAK]`

bug 4238; r/a=ftang,buster,waterson; added language specific transforms so that we can do things like U+005C -> U+00A5 (backslash -> yen sign for ja) 2000-09-21 03:00:32 +04:00			`nsLanguageSpecificTransformType mLanguageSpecificTransformType;`

r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`// Buffer used to hold the transformed words from GetNextWord or`
			`// GetPrevWord`
			`nsAutoTextBuffer mTransformBuf;`

Eliminated buffering that the text frame was doing when measuring text in runs and changed the text transformer code to do the buffering instead. It was already copying the transformed text into its internal buffer anyway, so this saves the extra copy 2000-04-04 18:14:47 +04:00			`// Our current position within the buffer. Used when iterating the next`
			`// word, because we may be requested to buffer across multiple words`
			`PRInt32 mBufferPos;`
Added support for measuring text runs in ascii, and changed text transformer to leave the text as ascii if possible 2000-04-12 18:54:43 +04:00
			`// The frame's text-transform state`
			`PRUint8 mTextTransform;`
Eliminated buffering that the text frame was doing when measuring text in runs and changed the text transformer code to do the buffering instead. It was already copying the transformed text into its internal buffer anyway, so this saves the extra copy 2000-04-04 18:14:47 +04:00
fix for bug 50432. PRPackedBools compressed to one flag. mAutoBuffer size reduced to 128. r=buster 2000-09-12 04:00:58 +04:00			`// Flag for controling mLeaveAsAscii, mHasMultibyte, mTransformedTextIsAscii`
			`PRUint8 mFlags;`

r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`#ifdef DEBUG`
			`static void SelfTest(nsILineBreaker* aLineBreaker,`
bug 4238; r/a=ftang,buster,waterson; added language specific transforms so that we can do things like U+005C -> U+00A5 (backslash -> yen sign for ja) 2000-09-21 03:00:32 +04:00			`nsIWordBreaker* aWordBreaker,`
			`nsIPresContext* aPresContext);`
Changed to have the stack buffer embedded in the xformer 1999-09-22 04:40:16 +04:00
r=ftang; rewrite to fix 16656, parts of 7455 1999-10-20 03:01:45 +04:00			`nsresult Init2(const nsTextFragment* aFrag,`
			`PRInt32 aStartingOffset,`
			`PRUint8 aWhiteSpace,`
			`PRUint8 aTextTransform);`
			`#endif`
new 1998-10-20 04:17:17 +04:00			`};`

			`#endif /* nsTextTransformer_h___ */`