gecko-dev/intl/uconv/nsUnicodeToUTF8.cpp

/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
/* This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */

//----------------------------------------------------------------------
// Global functions and data [declaration]
#include "nsUnicodeToUTF8.h"
#include "mozilla/CheckedInt.h"

NS_IMPL_ISUPPORTS(nsUnicodeToUTF8, nsIUnicodeEncoder)

//----------------------------------------------------------------------
// nsUnicodeToUTF8 class [implementation]

/**
 * Reports an upper bound on the number of bytes Convert() may write for
 * aSrcLength UTF-16 code units.
 *
 * @param aSrc         unused by this implementation.
 * @param aSrcLength   number of UTF-16 code units that will be converted.
 * @param aDestLength  [OUT] receives 3 * aSrcLength + 3.
 * @return NS_OK on success, NS_ERROR_OUT_OF_MEMORY when the bound does not
 *         fit in an int32_t.
 */
NS_IMETHODIMP nsUnicodeToUTF8::GetMaxLength(const char16_t* aSrc,
                                            int32_t aSrcLength,
                                            int32_t* aDestLength)
{
  MOZ_ASSERT(aDestLength);

  // Three bytes per UTF-16 code unit is normally sufficient. The extra three
  // bytes cover a high surrogate left pending by the previous buffer: when
  // the first code unit of this buffer does not complete the pair, that
  // leftover surrogate is itself converted to a 3-byte sequence.
  const mozilla::CheckedInt32 maxBytes =
    mozilla::CheckedInt32(aSrcLength) * 3 + 3;

  if (maxBytes.isValid()) {
    *aDestLength = maxBytes.value();
    return NS_OK;
  }

  // The multiplication or the addition overflowed int32_t.
  return NS_ERROR_OUT_OF_MEMORY;
}

/**
 * Encodes a buffer of UTF-16 code units as UTF-8.
 *
 * A high surrogate that is the last code unit of the buffer is remembered in
 * mHighSurrogate and completed at the start of the next call. Unpaired
 * surrogates are written as U+FFFD (EF BF BD).
 *
 * @param aSrc         UTF-16 input.
 * @param aSrcLength   [IN/OUT] on entry, the number of code units in aSrc.
 *                     It is rewritten only when NS_OK_UENC_MOREOUTPUT is
 *                     returned, in which case it holds the number of code
 *                     units consumed; otherwise it is left untouched.
 * @param aDest        output buffer.
 * @param aDestLength  [IN/OUT] on entry, the capacity of aDest in bytes; on
 *                     return, the number of bytes written.
 * @return NS_OK when the whole input was converted,
 *         NS_OK_UENC_MOREINPUT when a high surrogate is still waiting for
 *         its second half,
 *         NS_OK_UENC_MOREOUTPUT when aDest is too small for the next
 *         character.
 */
NS_IMETHODIMP nsUnicodeToUTF8::Convert(const char16_t* aSrc,
                                       int32_t* aSrcLength,
                                       char* aDest,
                                       int32_t* aDestLength)
{
  const char16_t* src = aSrc;
  const char16_t* srcEnd = aSrc + *aSrcLength;
  char* dest = aDest;
  int32_t destLen = *aDestLength;
  uint32_t n;

  //complete remaining of last conversion
  if (mHighSurrogate) {
    // Only bail out when there is no input to pair the pending surrogate
    // with. The test used to be inverted (src < srcEnd), which dropped every
    // non-empty buffer that followed a split pair and dereferenced *src on
    // an empty one.
    if (src >= srcEnd) {
      *aDestLength = 0;
      return NS_OK_UENC_MOREINPUT;
    }
    // Reserve room for the worst case (a 4-byte sequence) before writing.
    if (*aDestLength < 4) {
      *aSrcLength = 0;
      *aDestLength = 0;
      return NS_OK_UENC_MOREOUTPUT;
    }
    if (*src < (char16_t)0xdc00 || *src > (char16_t)0xdfff) { //not a pair
      // The pending high surrogate is unpaired; *src is not consumed here
      // and is handled by the main loop below.
      *dest++ = (char)0xef; //replacement character
      *dest++ = (char)0xbf;
      *dest++ = (char)0xbd;
      destLen -= 3;
    } else {
      // Combine the stored high surrogate with the low surrogate in *src.
      n = ((mHighSurrogate - (char16_t)0xd800) << 10) +
              (*src - (char16_t)0xdc00) + 0x10000;
      *dest++ = (char)0xf0 | (n >> 18);
      *dest++ = (char)0x80 | ((n >> 12) & 0x3f);
      *dest++ = (char)0x80 | ((n >> 6) & 0x3f);
      *dest++ = (char)0x80 | (n & 0x3f);
      ++src;
      destLen -= 4;
    }
    mHighSurrogate = 0;
  }

  while (src < srcEnd) {
    if ( *src <= 0x007f) {
      // U+0000..U+007F: one byte.
      if (destLen < 1)
        goto error_more_output;
      *dest++ = (char)*src;
      --destLen;
    } else if (*src <= 0x07ff) {
      // U+0080..U+07FF: two bytes.
      if (destLen < 2)
        goto error_more_output;
      *dest++ = (char)0xc0 | (*src >> 6);
      *dest++ = (char)0x80 | (*src & 0x003f);
      destLen -= 2;
    } else if (*src >= (char16_t)0xd800 && *src <= (char16_t)0xdfff) {
      if (*src >= (char16_t)0xdc00) { //not a pair
        // A low surrogate with no preceding high surrogate.
        if (destLen < 3)
          goto error_more_output;
        *dest++ = (char)0xef; //replacement character
        *dest++ = (char)0xbf;
        *dest++ = (char)0xbd;
        destLen -= 3;
        ++src;
        continue;
      }
      if ((src+1) >= srcEnd) {
        //we need another surrogate to complete this unicode char
        mHighSurrogate = *src;
        *aDestLength = dest - aDest;
        return NS_OK_UENC_MOREINPUT;
      }
      //handle surrogate
      if (destLen < 4)
        goto error_more_output;
      if (*(src+1) < (char16_t)0xdc00 || *(src+1) > 0xdfff) { //not a pair
        // Only the high surrogate is consumed (by the ++src at the bottom of
        // the loop); the following code unit is processed on its own.
        *dest++ = (char)0xef; //replacement character
        *dest++ = (char)0xbf;
        *dest++ = (char)0xbd;
        destLen -= 3;
      } else {
        n = ((*src - (char16_t)0xd800) << 10) + (*(src+1) - (char16_t)0xdc00) + (uint32_t)0x10000;
        *dest++ = (char)0xf0 | (n >> 18);
        *dest++ = (char)0x80 | ((n >> 12) & 0x3f);
        *dest++ = (char)0x80 | ((n >> 6) & 0x3f);
        *dest++ = (char)0x80 | (n & 0x3f);
        destLen -= 4;
        // Skip the low surrogate; the high one is skipped below.
        ++src;
      }
    } else {
      if (destLen < 3)
        goto error_more_output;
      //treat rest of the character as BMP
      *dest++ = (char)0xe0 | (*src >> 12);
      *dest++ = (char)0x80 | ((*src >> 6) & 0x003f);
      *dest++ = (char)0x80 | (*src & 0x003f);
      destLen -= 3;
    }
    ++src;
  }

  *aDestLength = dest - aDest;
  return NS_OK;

error_more_output:
  // Report how far we got so the caller can resume from src.
  *aSrcLength = src - aSrc;
  *aDestLength = dest - aDest;
  return NS_OK_UENC_MOREOUTPUT;
}

/**
 * Flushes encoder state at the end of the input.
 *
 * If a high surrogate is still pending it is written as U+FFFD (EF BF BD)
 * and the pending state is cleared.
 *
 * @param aDest        output buffer.
 * @param aDestLength  [IN/OUT] on entry, the capacity of aDest in bytes; on
 *                     return, the number of bytes written (0 or 3).
 * @return NS_OK on success, NS_OK_UENC_MOREOUTPUT when a surrogate is
 *         pending and aDest holds fewer than 3 bytes.
 */
NS_IMETHODIMP nsUnicodeToUTF8::Finish(char * aDest, int32_t * aDestLength)
{
  // Nothing buffered: nothing to emit.
  if (!mHighSurrogate) {
    *aDestLength = 0;
    return NS_OK;
  }

  // The pending surrogate stays buffered until the caller supplies room.
  if (*aDestLength < 3) {
    *aDestLength = 0;
    return NS_OK_UENC_MOREOUTPUT;
  }

  // replacement character
  aDest[0] = (char)0xef;
  aDest[1] = (char)0xbf;
  aDest[2] = (char)0xbd;

  mHighSurrogate = 0;
  *aDestLength = 3;
  return NS_OK;
}
License changes, take 2. Bug 98089. mozilla/include/, /mozilla/htmlparser/, /mozilla/intl/ (part 1). 2001-09-26 04:40:45 +04:00			`/* -- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -- */`
Bug 716478 - update licence to MPL 2. 2012-05-21 15:12:37 +04:00			`/* This Source Code Form is subject to the terms of the Mozilla Public`
			`* License, v. 2.0. If a copy of the MPL was not distributed with this`
			`* file, You can obtain one at http://mozilla.org/MPL/2.0/. */`
Fix for 65685; /r=valeski, /sr=ftang 2001-02-07 02:54:12 +03:00
			`//----------------------------------------------------------------------`
			`// Global functions and data [declaration]`
			`#include "nsUnicodeToUTF8.h"`
Bug 1170794 - Improve the length check of the input in nsUnicode*::GetMaxLength, r=dveditz 2015-06-17 14:21:39 +03:00			`#include "mozilla/CheckedInt.h"`
Fix for 65685; /r=valeski, /sr=ftang 2001-02-07 02:54:12 +03:00
Bug 900908 - Part 3: Change uses of numbered macros in nsIClassInfoImpl.h/nsISupportsImpl.h to the variadic variants. r=froydnj 2014-04-27 11:06:00 +04:00			`NS_IMPL_ISUPPORTS(nsUnicodeToUTF8, nsIUnicodeEncoder)`
Fix for 65685; /r=valeski, /sr=ftang 2001-02-07 02:54:12 +03:00
			`//----------------------------------------------------------------------`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`// nsUnicodeToUTF8 class [implementation]`
Fix for 65685; /r=valeski, /sr=ftang 2001-02-07 02:54:12 +03:00
Bug 1170794 - Improve the length check of the input in nsUnicode*::GetMaxLength, r=dveditz 2015-06-17 14:21:39 +03:00			`NS_IMETHODIMP nsUnicodeToUTF8::GetMaxLength(const char16_t* aSrc,`
			`int32_t aSrcLength,`
			`int32_t* aDestLength)`
Fix for 65685; /r=valeski, /sr=ftang 2001-02-07 02:54:12 +03:00			`{`
Bug 1170794 - Improve the length check of the input in nsUnicode*::GetMaxLength, r=dveditz 2015-06-17 14:21:39 +03:00			`MOZ_ASSERT(aDestLength);`

#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`// aSrc is interpreted as UTF16, 3 is normally enough.`
Bug 1170794 - Improve the length check of the input in nsUnicode*::GetMaxLength, r=dveditz 2015-06-17 14:21:39 +03:00			`// But when previous buffer only contains part of the surrogate pair, we`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`// need to complete it here. If the first word in following buffer is not`
Bug 577266 - Correct misspellings in source code 2011-09-07 04:20:35 +04:00			`// in valid surrogate range, we need to convert the remaining of last buffer`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`// to 3 bytes.`
Bug 1170794 - Improve the length check of the input in nsUnicode*::GetMaxLength, r=dveditz 2015-06-17 14:21:39 +03:00			`mozilla::CheckedInt32 length = aSrcLength;`
			`length *= 3;`
			`length += 3;`

			`if (!length.isValid()) {`
Bug 1170794 - patch 2 - Improve the length check of the input in nsUnicode*::GetMaxLength, r=dveditz 2015-06-17 14:38:29 +03:00			`return NS_ERROR_OUT_OF_MEMORY;`
Bug 1170794 - Improve the length check of the input in nsUnicode*::GetMaxLength, r=dveditz 2015-06-17 14:21:39 +03:00			`}`

			`*aDestLength = length.value();`
Fix for 65685; /r=valeski, /sr=ftang 2001-02-07 02:54:12 +03:00			`return NS_OK;`
			`}`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00
Bug 1170794 - patch 2 - Improve the length check of the input in nsUnicode*::GetMaxLength, r=dveditz 2015-06-17 14:38:29 +03:00			`NS_IMETHODIMP nsUnicodeToUTF8::Convert(const char16_t* aSrc,`
			`int32_t* aSrcLength,`
			`char* aDest,`
			`int32_t* aDestLength)`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`{`
Bug 1170794 - patch 2 - Improve the length check of the input in nsUnicode*::GetMaxLength, r=dveditz 2015-06-17 14:38:29 +03:00			`const char16_t* src = aSrc;`
			`const char16_t* srcEnd = aSrc + *aSrcLength;`
			`char* dest = aDest;`
Bug 579517 - Part 1: Automated conversion of NSPR numeric types to stdint types in Gecko; r=bsmedberg This patch was generated by a script. Here's the source of the script for future reference: function convert() { echo "Converting $1 to $2..." find . ! -wholename "nsprpub" \ ! -wholename "security/nss" \ ! -wholename "/.hg" \ ! -wholename "obj-ff-dbg" \ ! -name nsXPCOMCID.h \ ! -name prtypes.h \ -type f \ \( -iname ".cpp" \ -o -iname ".h" \ -o -iname ".c" \ -o -iname ".cc" \ -o -iname ".idl" \ -o -iname ".ipdl" \ -o -iname ".ipdlh" \ -o -iname "*.mm" \) \| \ xargs -n 1 sed -i -e "s/\b$1\b/$2/g" } convert PRInt8 int8_t convert PRUint8 uint8_t convert PRInt16 int16_t convert PRUint16 uint16_t convert PRInt32 int32_t convert PRUint32 uint32_t convert PRInt64 int64_t convert PRUint64 uint64_t convert PRIntn int convert PRUintn unsigned convert PRSize size_t convert PROffset32 int32_t convert PROffset64 int64_t convert PRPtrdiff ptrdiff_t convert PRFloat64 double 2012-08-22 19:56:38 +04:00			`int32_t destLen = *aDestLength;`
			`uint32_t n;`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00
			`//complete remaining of last conversion`
			`if (mHighSurrogate) {`
			`if (src < srcEnd) {`
			`*aDestLength = 0;`
			`return NS_OK_UENC_MOREINPUT;`
			`}`
			`if (*aDestLength < 4) {`
			`*aSrcLength = 0;`
			`*aDestLength = 0;`
			`return NS_OK_UENC_MOREOUTPUT;`
			`}`
Bug 927728 - Part 1: Replace PRUnichar with char16_t; r=roc This patch was automatically generated by the following script: #!/bin/bash # Command to convert PRUnichar to char16_t function convert() { echo "Converting $1 to $2..." find . ! -wholename "nsprpub" \ ! -wholename "security/nss" \ ! -wholename "modules/libmar" \ ! -wholename "/.hg" \ ! -wholename "obj-ff-dbg" \ ! -name prtypes.h \ ! -name Char16.h \ -type f \ \( -iname ".cpp" \ -o -iname ".h" \ -o -iname ".c" \ -o -iname ".cc" \ -o -iname ".idl" \ -o -iname ".ipdl" \ -o -iname ".ipdlh" \ -o -iname "*.mm" \) \| \ xargs -n 1 sed -i -e "s/\b$1\b/$2/g" } convert PRUnichar char16_t 2014-01-04 19:02:17 +04:00			`if (src < (char16_t)0xdc00 \|\| src > (char16_t)0xdfff) { //not a pair`
Bug 746900 - Implement "Best Practices for Using U+FFFD" from the Unicode standard. r=smontagu 2012-11-27 05:38:19 +04:00			`*dest++ = (char)0xef; //replacement character`
			`*dest++ = (char)0xbf;`
			`*dest++ = (char)0xbd;`
#128825 Browser crash if I view an image Adjust destLen (remaining buffer length) as buffer is consumed. This way we will know when we will run out of buffer. r=ftang, sr=jst, a=shaver 2002-03-14 03:36:55 +03:00			`destLen -= 3;`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`} else {`
Bug 927728 - Part 1: Replace PRUnichar with char16_t; r=roc This patch was automatically generated by the following script: #!/bin/bash # Command to convert PRUnichar to char16_t function convert() { echo "Converting $1 to $2..." find . ! -wholename "nsprpub" \ ! -wholename "security/nss" \ ! -wholename "modules/libmar" \ ! -wholename "/.hg" \ ! -wholename "obj-ff-dbg" \ ! -name prtypes.h \ ! -name Char16.h \ -type f \ \( -iname ".cpp" \ -o -iname ".h" \ -o -iname ".c" \ -o -iname ".cc" \ -o -iname ".idl" \ -o -iname ".ipdl" \ -o -iname ".ipdlh" \ -o -iname "*.mm" \) \| \ xargs -n 1 sed -i -e "s/\b$1\b/$2/g" } convert PRUnichar char16_t 2014-01-04 19:02:17 +04:00			`n = ((mHighSurrogate - (char16_t)0xd800) << 10) +`
			`(*src - (char16_t)0xdc00) + 0x10000;`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`*dest++ = (char)0xf0 \| (n >> 18);`
			`*dest++ = (char)0x80 \| ((n >> 12) & 0x3f);`
			`*dest++ = (char)0x80 \| ((n >> 6) & 0x3f);`
			`*dest++ = (char)0x80 \| (n & 0x3f);`
			`++src;`
#128825 Browser crash if I view an image Adjust destLen (remaining buffer length) as buffer is consumed. This way we will know when we will run out of buffer. r=ftang, sr=jst, a=shaver 2002-03-14 03:36:55 +03:00			`destLen -= 4;`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`}`
			`mHighSurrogate = 0;`
			`}`

			`while (src < srcEnd) {`
Bugs in intl/uconv/src/nsUnicodeToUTF8.cpp. Bug 191483, Author=hsivonen@iki.fi, r=smontagu, sr=rbs 2003-05-30 05:16:20 +04:00			`if ( *src <= 0x007f) {`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`if (destLen < 1)`
			`goto error_more_output;`
			`dest++ = (char)src;`
			`--destLen;`
Bugs in intl/uconv/src/nsUnicodeToUTF8.cpp. Bug 191483, Author=hsivonen@iki.fi, r=smontagu, sr=rbs 2003-05-30 05:16:20 +04:00			`} else if (*src <= 0x07ff) {`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`if (destLen < 2)`
			`goto error_more_output;`
			`dest++ = (char)0xc0 \| (src >> 6);`
			`dest++ = (char)0x80 \| (src & 0x003f);`
#128825 Browser crash if I view an image Adjust destLen (remaining buffer length) as buffer is consumed. This way we will know when we will run out of buffer. r=ftang, sr=jst, a=shaver 2002-03-14 03:36:55 +03:00			`destLen -= 2;`
Bug 927728 - Part 1: Replace PRUnichar with char16_t; r=roc This patch was automatically generated by the following script: #!/bin/bash # Command to convert PRUnichar to char16_t function convert() { echo "Converting $1 to $2..." find . ! -wholename "nsprpub" \ ! -wholename "security/nss" \ ! -wholename "modules/libmar" \ ! -wholename "/.hg" \ ! -wholename "obj-ff-dbg" \ ! -name prtypes.h \ ! -name Char16.h \ -type f \ \( -iname ".cpp" \ -o -iname ".h" \ -o -iname ".c" \ -o -iname ".cc" \ -o -iname ".idl" \ -o -iname ".ipdl" \ -o -iname ".ipdlh" \ -o -iname "*.mm" \) \| \ xargs -n 1 sed -i -e "s/\b$1\b/$2/g" } convert PRUnichar char16_t 2014-01-04 19:02:17 +04:00			`} else if (src >= (char16_t)0xd800 && src <= (char16_t)0xdfff) {`
			`if (*src >= (char16_t)0xdc00) { //not a pair`
Bug 746900 - Implement "Best Practices for Using U+FFFD" from the Unicode standard. r=smontagu 2012-11-27 05:38:19 +04:00			`if (destLen < 3)`
			`goto error_more_output;`
			`*dest++ = (char)0xef; //replacement character`
			`*dest++ = (char)0xbf;`
			`*dest++ = (char)0xbd;`
			`destLen -= 3;`
			`++src;`
			`continue;`
			`}`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`if ((src+1) >= srcEnd) {`
			`//we need another surrogate to complete this unicode char`
			`mHighSurrogate = *src;`
			`*aDestLength = dest - aDest;`
			`return NS_OK_UENC_MOREINPUT;`
			`}`
			`//handle surrogate`
			`if (destLen < 4)`
			`goto error_more_output;`
Bug 927728 - Part 1: Replace PRUnichar with char16_t; r=roc This patch was automatically generated by the following script: #!/bin/bash # Command to convert PRUnichar to char16_t function convert() { echo "Converting $1 to $2..." find . ! -wholename "nsprpub" \ ! -wholename "security/nss" \ ! -wholename "modules/libmar" \ ! -wholename "/.hg" \ ! -wholename "obj-ff-dbg" \ ! -name prtypes.h \ ! -name Char16.h \ -type f \ \( -iname ".cpp" \ -o -iname ".h" \ -o -iname ".c" \ -o -iname ".cc" \ -o -iname ".idl" \ -o -iname ".ipdl" \ -o -iname ".ipdlh" \ -o -iname "*.mm" \) \| \ xargs -n 1 sed -i -e "s/\b$1\b/$2/g" } convert PRUnichar char16_t 2014-01-04 19:02:17 +04:00			`if ((src+1) < (char16_t)0xdc00 \|\| (src+1) > 0xdfff) { //not a pair`
Bug 746900 - Implement "Best Practices for Using U+FFFD" from the Unicode standard. r=smontagu 2012-11-27 05:38:19 +04:00			`*dest++ = (char)0xef; //replacement character`
			`*dest++ = (char)0xbf;`
			`*dest++ = (char)0xbd;`
#128825 Browser crash if I view an image Adjust destLen (remaining buffer length) as buffer is consumed. This way we will know when we will run out of buffer. r=ftang, sr=jst, a=shaver 2002-03-14 03:36:55 +03:00			`destLen -= 3;`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`} else {`
Bug 927728 - Part 1: Replace PRUnichar with char16_t; r=roc This patch was automatically generated by the following script: #!/bin/bash # Command to convert PRUnichar to char16_t function convert() { echo "Converting $1 to $2..." find . ! -wholename "nsprpub" \ ! -wholename "security/nss" \ ! -wholename "modules/libmar" \ ! -wholename "/.hg" \ ! -wholename "obj-ff-dbg" \ ! -name prtypes.h \ ! -name Char16.h \ -type f \ \( -iname ".cpp" \ -o -iname ".h" \ -o -iname ".c" \ -o -iname ".cc" \ -o -iname ".idl" \ -o -iname ".ipdl" \ -o -iname ".ipdlh" \ -o -iname "*.mm" \) \| \ xargs -n 1 sed -i -e "s/\b$1\b/$2/g" } convert PRUnichar char16_t 2014-01-04 19:02:17 +04:00			`n = ((src - (char16_t)0xd800) << 10) + ((src+1) - (char16_t)0xdc00) + (uint32_t)0x10000;`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`*dest++ = (char)0xf0 \| (n >> 18);`
			`*dest++ = (char)0x80 \| ((n >> 12) & 0x3f);`
			`*dest++ = (char)0x80 \| ((n >> 6) & 0x3f);`
			`*dest++ = (char)0x80 \| (n & 0x3f);`
#128825 Browser crash if I view an image Adjust destLen (remaining buffer length) as buffer is consumed. This way we will know when we will run out of buffer. r=ftang, sr=jst, a=shaver 2002-03-14 03:36:55 +03:00			`destLen -= 4;`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`++src;`
			`}`
			`} else {`
			`if (destLen < 3)`
			`goto error_more_output;`
			`//treat rest of the character as BMP`
			`dest++ = (char)0xe0 \| (src >> 12);`
			`dest++ = (char)0x80 \| ((src >> 6) & 0x003f);`
			`dest++ = (char)0x80 \| (src & 0x003f);`
#128825 Browser crash if I view an image Adjust destLen (remaining buffer length) as buffer is consumed. This way we will know when we will run out of buffer. r=ftang, sr=jst, a=shaver 2002-03-14 03:36:55 +03:00			`destLen -= 3;`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`}`
			`++src;`
			`}`

			`*aDestLength = dest - aDest;`
			`return NS_OK;`

			`error_more_output:`
			`*aSrcLength = src - aSrc;`
			`*aDestLength = dest - aDest;`
			`return NS_OK_UENC_MOREOUTPUT;`
			`}`

Bug 579517 - Part 1: Automated conversion of NSPR numeric types to stdint types in Gecko; r=bsmedberg This patch was generated by a script. Here's the source of the script for future reference: function convert() { echo "Converting $1 to $2..." find . ! -wholename "nsprpub" \ ! -wholename "security/nss" \ ! -wholename "/.hg" \ ! -wholename "obj-ff-dbg" \ ! -name nsXPCOMCID.h \ ! -name prtypes.h \ -type f \ \( -iname ".cpp" \ -o -iname ".h" \ -o -iname ".c" \ -o -iname ".cc" \ -o -iname ".idl" \ -o -iname ".ipdl" \ -o -iname ".ipdlh" \ -o -iname "*.mm" \) \| \ xargs -n 1 sed -i -e "s/\b$1\b/$2/g" } convert PRInt8 int8_t convert PRUint8 uint8_t convert PRInt16 int16_t convert PRUint16 uint16_t convert PRInt32 int32_t convert PRUint32 uint32_t convert PRInt64 int64_t convert PRUint64 uint64_t convert PRIntn int convert PRUintn unsigned convert PRSize size_t convert PROffset32 int32_t convert PROffset64 int64_t convert PRPtrdiff ptrdiff_t convert PRFloat64 double 2012-08-22 19:56:38 +04:00			`NS_IMETHODIMP nsUnicodeToUTF8::Finish(char * aDest, int32_t * aDestLength)`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`{`
			`char * dest = aDest;`

			`if (mHighSurrogate) {`
			`if (*aDestLength < 3) {`
			`*aDestLength = 0;`
			`return NS_OK_UENC_MOREOUTPUT;`
			`}`
Bug 746900 - Implement "Best Practices for Using U+FFFD" from the Unicode standard. r=smontagu 2012-11-27 05:38:19 +04:00			`*dest++ = (char)0xef; //replacement character`
			`*dest++ = (char)0xbf;`
			`*dest++ = (char)0xbd;`
#102595 nsUnicodeToUTF8 does not handle surrogate pair correctly r=bstell, sr=brendan 2002-01-15 04:04:24 +03:00			`mHighSurrogate = 0;`
			`*aDestLength = 3;`
			`return NS_OK;`
			`}`

			`*aDestLength = 0;`
			`return NS_OK;`
			`}`