gecko-dev/intl/uconv/src/nsTextToSubURI.cpp

/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
/* ***** BEGIN LICENSE BLOCK *****
 * Version: NPL 1.1/GPL 2.0/LGPL 2.1
 *
 * The contents of this file are subject to the Netscape Public License
 * Version 1.1 (the "License"); you may not use this file except in
 * compliance with the License. You may obtain a copy of the License at
 * http://www.mozilla.org/NPL/
 *
 * Software distributed under the License is distributed on an "AS IS" basis,
 * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
 * for the specific language governing rights and limitations under the
 * License.
 *
 * The Original Code is mozilla.org code.
 *
 * The Initial Developer of the Original Code is 
 * Netscape Communications Corporation.
 * Portions created by the Initial Developer are Copyright (C) 1998
 * the Initial Developer. All Rights Reserved.
 *
 * Contributor(s):
 *   Pierre Phaneuf <pp@ludusdesign.com>
 *
 *
 * Alternatively, the contents of this file may be used under the terms of
 * either the GNU General Public License Version 2 or later (the "GPL"), or
 * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
 * in which case the provisions of the GPL or the LGPL are applicable instead
 * of those above. If you wish to allow use of your version of this file only
 * under the terms of either the GPL or the LGPL, and not to allow others to
 * use your version of this file under the terms of the NPL, indicate your
 * decision by deleting the provisions above and replace them with the notice
 * and other provisions required by the GPL or the LGPL. If you do not delete
 * the provisions above, a recipient may use your version of this file under
 * the terms of any one of the NPL, the GPL or the LGPL.
 *
 * ***** END LICENSE BLOCK ***** */
#include "nsString.h"
#include "nsIUnicodeEncoder.h"
#include "nsICharsetConverterManager.h"
#include "nsICharsetConverterManager2.h"
#include "nsReadableUtils.h"
#include "nsITextToSubURI.h"
#include "nsIServiceManager.h"
#include "nsUConvDll.h"
#include "nsEscape.h"
#include "prmem.h"
#include "nsTextToSubURI.h"
#include "nsCRT.h"

// XPCOM identifier constants local to this translation unit.
// NOTE(review): kITextToSubURIIID is built from an IID through NS_DEFINE_CID
// and is not referenced in the visible part of this file — confirm whether it
// is still needed.
static NS_DEFINE_CID(kITextToSubURIIID, NS_ITEXTTOSUBURI_IID);
// Identifies the charset converter manager service that ConvertAndEscape and
// UnEscapeAndConvert request.
static NS_DEFINE_CID(kCharsetConverterManagerCID, NS_ICHARSETCONVERTERMANAGER_CID);

// Constructor: the body is intentionally empty, no setup is performed here.
nsTextToSubURI::nsTextToSubURI() {}

// Destructor: the body is intentionally empty, no teardown is performed here.
nsTextToSubURI::~nsTextToSubURI() {}

// Instantiates the NS_IMPL_ISUPPORTS1 boilerplate for nsTextToSubURI with
// nsITextToSubURI as its single listed interface.
// NOTE(review): presumably this supplies AddRef/Release/QueryInterface — the
// macro is defined outside this file, confirm there.
NS_IMPL_ISUPPORTS1(nsTextToSubURI, nsITextToSubURI)

/**
 * Encodes a Unicode string into the given charset and URL-escapes the result.
 *
 * @param charset  name of the target charset; converted to an nsAutoString and
 *                 handed to the converter manager's GetUnicodeEncoder()
 * @param text     null-terminated Unicode text to encode
 * @param _retval  receives the string returned by nsEscape(); left as nsnull
 *                 whenever no escaped string is produced
 * @return NS_ERROR_NULL_POINTER if _retval is null, NS_ERROR_OUT_OF_MEMORY if
 *         nsEscape() returns null, otherwise the status of the last
 *         service/encoder call that was made.
 */
NS_IMETHODIMP  nsTextToSubURI::ConvertAndEscape(
  const char *charset, const PRUnichar *text, char **_retval) 
{
  if (!_retval)
    return NS_ERROR_NULL_POINTER;
  *_retval = nsnull;

  nsAutoString charsetName;
  charsetName.AssignWithConversion(charset);

  // Look up the charset converter manager service.
  nsICharsetConverterManager *manager = nsnull;
  nsresult rv = nsServiceManager::GetService(kCharsetConverterManagerCID,
                                             NS_GET_IID(nsICharsetConverterManager),
                                             (nsISupports**)&manager);
  if (NS_FAILED(rv) || !manager)
    return rv;

  // The manager is only needed long enough to obtain the encoder.
  nsIUnicodeEncoder *encoder = nsnull;
  rv = manager->GetUnicodeEncoder(&charsetName, &encoder);
  nsServiceManager::ReleaseService(kCharsetConverterManagerCID, manager);
  if (NS_FAILED(rv))
    return rv;

  // Ask the encoder to substitute '?' on output errors.
  rv = encoder->SetOutputErrorBehavior(nsIUnicodeEncoder::kOnError_Replace, nsnull, (PRUnichar)'?');
  if (NS_SUCCEEDED(rv)) {
    char stackBuf[256];
    char *out = stackBuf;
    PRInt32 srcLen = nsCRT::strlen(text);
    PRInt32 dstLen = 0;

    rv = encoder->GetMaxLength(text, srcLen, &dstLen);
    if (NS_SUCCEEDED(rv)) {
      // Results that do not fit the stack buffer go to the heap ...
      if (dstLen >= 256)
        out = (char*)PR_Malloc(dstLen + 1);
      // ... and if that allocation fails, fall back to the stack buffer with
      // its reduced capacity.
      if (!out) {
        dstLen = 255;
        out = stackBuf;
      }

      const PRInt32 capacity = dstLen;
      rv = encoder->Convert(text, &srcLen, out, &dstLen);
      if (NS_SUCCEEDED(rv)) {
        // Append termination characters (e.g. ESC(B of ISO-2022-JP) when
        // there is room left after the converted bytes.
        PRInt32 tailLen = capacity - dstLen;
        if (tailLen > 0 &&
            NS_SUCCEEDED(encoder->Finish((char *)(out + dstLen), &tailLen)))
          dstLen += tailLen;

        out[dstLen] = '\0';
        *_retval = nsEscape(out, url_XPAlphas);
        if (!*_retval)
          rv = NS_ERROR_OUT_OF_MEMORY;
      }
    }

    // Only the heap buffer needs freeing.
    if (out != stackBuf)
      PR_Free(out);
  }

  NS_IF_RELEASE(encoder);
  return rv;
}

/**
 * URL-unescapes a string and decodes the result from the given charset into
 * Unicode.
 *
 * @param charset  name of the source charset; converted to an nsAutoString and
 *                 handed to the converter manager's GetUnicodeDecoder()
 * @param text     escaped input; it is duplicated first because nsUnescape()
 *                 modifies its argument
 * @param _retval  on success receives a PR_Malloc'ed, null-terminated
 *                 PRUnichar buffer; left as nsnull on every failure path
 * @return NS_ERROR_NULL_POINTER if _retval is null, NS_ERROR_OUT_OF_MEMORY if
 *         duplicating the input or allocating the output buffer fails,
 *         otherwise the status of the last service/decoder call that was made.
 */
NS_IMETHODIMP  nsTextToSubURI::UnEscapeAndConvert(
  const char *charset, const char *text, PRUnichar **_retval) 
{
  if(nsnull == _retval)
    return NS_ERROR_NULL_POINTER;
  *_retval = nsnull;
  nsresult rv = NS_OK;
  
  // unescape the string, unescape changes the input
  char *unescaped = nsCRT::strdup((char *) text);
  if (nsnull == unescaped)
    return NS_ERROR_OUT_OF_MEMORY;
  unescaped = nsUnescape(unescaped);
  NS_ASSERTION(unescaped, "nsUnescape returned null");

  // Convert from the charset to unicode
  nsCOMPtr<nsICharsetConverterManager> ccm = 
           do_GetService(kCharsetConverterManagerCID, &rv); 
  if (NS_SUCCEEDED(rv)) {
    nsAutoString charsetStr; charsetStr.AssignWithConversion(charset);
    // Start from null so the release below never sees an indeterminate pointer.
    nsIUnicodeDecoder *decoder = nsnull;
    rv = ccm->GetUnicodeDecoder(&charsetStr, &decoder);
    if (NS_SUCCEEDED(rv)) {
      PRUnichar *pBuf = nsnull;
      PRInt32 len = strlen(unescaped);
      PRInt32 outlen = 0;
      if (NS_SUCCEEDED(rv = decoder->GetMaxLength(unescaped, len, &outlen))) {
        // Room for outlen code units plus the terminator. The element size is
        // sizeof(PRUnichar), not the size of a pointer to it.
        pBuf = (PRUnichar *) PR_Malloc((outlen+1)*sizeof(PRUnichar));
        if (nsnull == pBuf)
          rv = NS_ERROR_OUT_OF_MEMORY;
        else {
          if (NS_SUCCEEDED(rv = decoder->Convert(unescaped, &len, pBuf, &outlen))) {
            pBuf[outlen] = 0;
            *_retval = pBuf;  // ownership passes to the caller
          }
          else {
            // Conversion failed: the buffer is not handed out, so free it
            // here instead of leaking it.
            PR_Free(pBuf);
          }
        }
      }
      NS_IF_RELEASE(decoder);
    }
  }
  PR_FREEIF(unescaped);

  return rv;
}

// Returns PR_TRUE when the charset name starts with "ISO-2022-" or equals
// "UTF-7" or "HZ-GB-2312", and PR_FALSE otherwise. The checks go through
// nsCRT::strncasecmp / nsCRT::strcasecmp.
static PRBool statefulCharset(const char *charset)
{
  static const char kIso2022Prefix[] = "ISO-2022-";

  // Prefix match: compare only the characters of the prefix (no terminator).
  if (nsCRT::strncasecmp(charset, kIso2022Prefix, sizeof(kIso2022Prefix) - 1) == 0)
    return PR_TRUE;

  if (nsCRT::strcasecmp(charset, "UTF-7") == 0)
    return PR_TRUE;

  if (nsCRT::strcasecmp(charset, "HZ-GB-2312") == 0)
    return PR_TRUE;

  return PR_FALSE;
}

/**
 * Converts an (already unescaped) URI string to Unicode.
 *
 * For charsets that statefulCharset() does not flag, two shortcuts apply:
 * pure-ASCII input is widened directly, and, when aIRI is set, input that
 * passes IsUTF8() is converted as UTF-8. Everything else is decoded with the
 * decoder registered for aCharset.
 *
 * @param aCharset  charset name used to look up the decoder
 * @param aURI      bytes to convert
 * @param aIRI      enables the UTF-8 shortcut
 * @param _retval   receives the converted text on success
 * @return NS_OK on success, NS_ERROR_INVALID_ARG if a decoder is needed but
 *         aCharset is empty, NS_ERROR_OUT_OF_MEMORY if the output buffer
 *         cannot be allocated, otherwise the failing call's status.
 */
nsresult nsTextToSubURI::convertURItoUnicode(const nsAFlatCString &aCharset,
                                             const nsAFlatCString &aURI, 
                                             PRBool aIRI, 
                                             nsAString &_retval)
{
  // check for 7bit encoding the data may not be ASCII after we decode, so the
  // shortcuts below are skipped for such charsets
  const PRBool stateful = statefulCharset(aCharset.get());

  if (!stateful) {
    if (IsASCII(aURI)) {
      _retval.Assign(NS_ConvertASCIItoUCS2(aURI));
      return NS_OK;
    }
    if (aIRI && IsUTF8(aURI)) {
      _retval.Assign(NS_ConvertUTF8toUCS2(aURI));
      return NS_OK;
    }
  }

  // empty charset could indicate UTF-8, but aURI turns out not to be UTF-8.
  NS_ENSURE_FALSE(aCharset.IsEmpty(), NS_ERROR_INVALID_ARG);

  nsresult rv = NS_OK;
  nsCOMPtr<nsICharsetConverterManager2> converterManager =
    do_GetService(NS_CHARSETCONVERTERMANAGER_CONTRACTID, &rv);
  NS_ENSURE_SUCCESS(rv, rv);

  // Charset name -> atom -> decoder.
  nsCOMPtr<nsIAtom> atom;
  rv = converterManager->GetCharsetAtom2(aCharset.get(), getter_AddRefs(atom));
  NS_ENSURE_SUCCESS(rv, rv);

  nsCOMPtr<nsIUnicodeDecoder> decoder;
  rv = converterManager->GetUnicodeDecoder(atom, getter_AddRefs(decoder));
  NS_ENSURE_SUCCESS(rv, rv);

  // Size the temporary output buffer from the decoder's own estimate.
  PRInt32 inLen = aURI.Length();
  PRInt32 outLen;
  rv = decoder->GetMaxLength(aURI.get(), inLen, &outLen);
  NS_ENSURE_SUCCESS(rv, rv);

  PRUnichar *wide = (PRUnichar *) nsMemory::Alloc(outLen * sizeof(PRUnichar));
  NS_ENSURE_TRUE(wide, NS_ERROR_OUT_OF_MEMORY);

  rv = decoder->Convert(aURI.get(), &inLen, wide, &outLen);
  if (NS_SUCCEEDED(rv)) {
    // outLen now holds the length reported back by Convert().
    _retval.Assign(wide, outLen);
  }

  nsMemory::Free(wide);
  return rv;
}

/**
 * Unescapes a URI fragment and converts it to Unicode via
 * convertURItoUnicode() with the IRI flag set.
 *
 * @param aCharset      charset name forwarded to convertURItoUnicode()
 * @param aURIFragment  escaped URI fragment; copied before being unescaped
 * @param _retval       receives the converted text
 * @return the status returned by convertURItoUnicode()
 */
NS_IMETHODIMP  nsTextToSubURI::UnEscapeURIForUI(const nsACString & aCharset, 
                                                const nsACString &aURIFragment, 
                                                nsAString &_retval)
{
  // Work on a private copy: NS_UnescapeURL() is applied to it in place.
  nsCAutoString fragment(aURIFragment);
  NS_UnescapeURL(fragment);

  const nsresult status =
    convertURItoUnicode(PromiseFlatCString(aCharset), fragment, PR_TRUE, _retval);
  return status;
}

/**
 * Unescapes a URI fragment with the esc_AlwaysCopy | esc_OnlyNonASCII flags
 * and converts the result to Unicode via convertURItoUnicode().
 * NOTE(review): presumably esc_OnlyNonASCII limits unescaping to sequences
 * that yield non-ASCII bytes — confirm against NS_UnescapeURL().
 *
 * @param aCharset      charset name forwarded to convertURItoUnicode()
 * @param aURIFragment  escaped URI fragment
 * @param _retval       receives the converted text
 * @return the status returned by convertURItoUnicode()
 */
NS_IMETHODIMP  nsTextToSubURI::UnEscapeNonAsciiURI(const nsACString & aCharset, 
                                                   const nsACString &aURIFragment, 
                                                   nsAString &_retval)
{
  // The unescaped bytes are written into a separate output string.
  nsCAutoString fragment;
  NS_UnescapeURL(PromiseFlatCString(aURIFragment),
                 esc_AlwaysCopy | esc_OnlyNonASCII,
                 fragment);

  const nsresult status =
    convertURItoUnicode(PromiseFlatCString(aCharset), fragment, PR_TRUE, _retval);
  return status;
}

//----------------------------------------------------------------------
License changes, take 2. Bug 98089. mozilla/include/, /mozilla/htmlparser/, /mozilla/intl/ (part 1). 2001-09-26 04:40:45 +04:00			`/* -- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 2 -- */`
			`/* *** BEGIN LICENSE BLOCK ***`
			`* Version: NPL 1.1/GPL 2.0/LGPL 2.1`
1st check in 1999-09-21 04:30:12 +04:00			`*`
License changes, take 2. Bug 98089. mozilla/include/, /mozilla/htmlparser/, /mozilla/intl/ (part 1). 2001-09-26 04:40:45 +04:00			`* The contents of this file are subject to the Netscape Public License`
			`* Version 1.1 (the "License"); you may not use this file except in`
			`* compliance with the License. You may obtain a copy of the License at`
			`* http://www.mozilla.org/NPL/`
1st check in 1999-09-21 04:30:12 +04:00			`*`
License changes, take 2. Bug 98089. mozilla/include/, /mozilla/htmlparser/, /mozilla/intl/ (part 1). 2001-09-26 04:40:45 +04:00			`* Software distributed under the License is distributed on an "AS IS" basis,`
			`* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License`
			`* for the specific language governing rights and limitations under the`
			`* License.`
1st check in 1999-09-21 04:30:12 +04:00			`*`
updated xPL license boilerplate to v1.1, a=chofmann@netscape.com,r=endico@mozilla.org 1999-11-06 06:43:54 +03:00			`* The Original Code is mozilla.org code.`
			`*`
License changes, take 2. Bug 98089. mozilla/include/, /mozilla/htmlparser/, /mozilla/intl/ (part 1). 2001-09-26 04:40:45 +04:00			`* The Initial Developer of the Original Code is`
			`* Netscape Communications Corporation.`
			`* Portions created by the Initial Developer are Copyright (C) 1998`
			`* the Initial Developer. All Rights Reserved.`
updated xPL license boilerplate to v1.1, a=chofmann@netscape.com,r=endico@mozilla.org 1999-11-06 06:43:54 +03:00			`*`
License changes, take 2. Bug 98089. mozilla/include/, /mozilla/htmlparser/, /mozilla/intl/ (part 1). 2001-09-26 04:40:45 +04:00			`* Contributor(s):`
Converting ::GetIID() into NS_GET_IID(). Bug #20232. r=scc, r=mozbot 2000-02-03 01:24:56 +03:00			`* Pierre Phaneuf <pp@ludusdesign.com>`
License changes, take 2. Bug 98089. mozilla/include/, /mozilla/htmlparser/, /mozilla/intl/ (part 1). 2001-09-26 04:40:45 +04:00			`*`
			`*`
			`* Alternatively, the contents of this file may be used under the terms of`
			`* either the GNU General Public License Version 2 or later (the "GPL"), or`
			`* the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),`
			`* in which case the provisions of the GPL or the LGPL are applicable instead`
			`* of those above. If you wish to allow use of your version of this file only`
			`* under the terms of either the GPL or the LGPL, and not to allow others to`
			`* use your version of this file under the terms of the NPL, indicate your`
			`* decision by deleting the provisions above and replace them with the notice`
			`* and other provisions required by the GPL or the LGPL. If you do not delete`
			`* the provisions above, a recipient may use your version of this file under`
			`* the terms of any one of the NPL, the GPL or the LGPL.`
			`*`
			`* *** END LICENSE BLOCK *** */`
1st check in 1999-09-21 04:30:12 +04:00			`#include "nsString.h"`
			`#include "nsIUnicodeEncoder.h"`
			`#include "nsICharsetConverterManager.h"`
Added unescape function which takes a charset to uconv, changed uriloader to use the uconv unescape to handle unescape non Ascii URI correctly. bug 155569, r=ftang, sr=bzbarsky. 2002-08-12 23:23:22 +04:00			`#include "nsICharsetConverterManager2.h"`
			`#include "nsReadableUtils.h"`
1st check in 1999-09-21 04:30:12 +04:00			`#include "nsITextToSubURI.h"`
			`#include "nsIServiceManager.h"`
			`#include "nsUConvDll.h"`
			`#include "nsEscape.h"`
			`#include "prmem.h"`
Bug 110486 Removing NSGetFactory from UCONV /r=shanjian; /sr=brendan 2001-12-08 03:25:28 +03:00			`#include "nsTextToSubURI.h"`
Fixes mozilla/strings requiring unfrozen nsCRT class. patch by scc, r=dougt, sr=jag, b=136756 2002-05-15 22:55:21 +04:00			`#include "nsCRT.h"`
1st check in 1999-09-21 04:30:12 +04:00
			`static NS_DEFINE_CID(kITextToSubURIIID, NS_ITEXTTOSUBURI_IID);`
			`static NS_DEFINE_CID(kCharsetConverterManagerCID, NS_ICHARSETCONVERTERMANAGER_CID);`

			`nsTextToSubURI::nsTextToSubURI()`
			`{`
			`}`
			`nsTextToSubURI::~nsTextToSubURI()`
			`{`
			`}`

#45797 - fix consumers of NS_IMPL_ISUPPORTS r=dveditz a=self 2000-11-17 11:06:12 +03:00			`NS_IMPL_ISUPPORTS1(nsTextToSubURI, nsITextToSubURI)`
1st check in 1999-09-21 04:30:12 +04:00
			`NS_IMETHODIMP nsTextToSubURI::ConvertAndEscape(`
			`const char *charset, const PRUnichar *text, char **_retval)`
			`{`
Added a function to url unescape and convert to unicode, bug 25034, r=ftang. 2000-02-04 02:18:07 +03:00			`if(nsnull == _retval)`
			`return NS_ERROR_NULL_POINTER;`
1st check in 1999-09-21 04:30:12 +04:00			`*_retval = nsnull;`
making string conversions explicit 2000-04-03 09:52:40 +04:00			`nsAutoString charsetStr; charsetStr.AssignWithConversion(charset);`
1st check in 1999-09-21 04:30:12 +04:00			`nsIUnicodeEncoder *encoder = nsnull;`
			`nsresult rv = NS_OK;`

			`// Get Charset, get the encoder.`
			`nsICharsetConverterManager * ccm = nsnull;`
			`rv = nsServiceManager::GetService(kCharsetConverterManagerCID ,`
Converting ::GetIID() into NS_GET_IID(). Bug #20232. r=scc, r=mozbot 2000-02-03 01:24:56 +03:00			`NS_GET_IID(nsICharsetConverterManager),`
1st check in 1999-09-21 04:30:12 +04:00			`(nsISupports**)&ccm);`
			`if(NS_SUCCEEDED(rv) && (nsnull != ccm)) {`
			`rv = ccm->GetUnicodeEncoder(&charsetStr, &encoder);`
			`nsServiceManager::ReleaseService( kCharsetConverterManagerCID, ccm);`
Added a function to url unescape and convert to unicode, bug 25034, r=ftang. 2000-02-04 02:18:07 +03:00			`if (NS_SUCCEEDED(rv)) {`
			`rv = encoder->SetOutputErrorBehavior(nsIUnicodeEncoder::kOnError_Replace, nsnull, (PRUnichar)'?');`
			`if(NS_SUCCEEDED(rv))`
			`{`
			`char buf[256];`
			`char *pBuf = buf;`
			`PRInt32 ulen = nsCRT::strlen(text);`
			`PRInt32 outlen = 0;`
			`if(NS_SUCCEEDED(rv = encoder->GetMaxLength(text, ulen, &outlen)))`
			`{`
			`if(outlen >= 256) {`
			`pBuf = (char*)PR_Malloc(outlen+1);`
			`}`
			`if(nsnull == pBuf) {`
			`outlen = 255;`
			`pBuf = buf;`
			`}`
Call nsIUnicharEncoder::Finish to ensure the converted string is terminated, bug 179392, r=shanjian, sr=bzbarsky 2002-11-14 00:56:01 +03:00			`PRInt32 bufLen = outlen;`
Added a function to url unescape and convert to unicode, bug 25034, r=ftang. 2000-02-04 02:18:07 +03:00			`if(NS_SUCCEEDED(rv = encoder->Convert(text,&ulen, pBuf, &outlen))) {`
Call nsIUnicharEncoder::Finish to ensure the converted string is terminated, bug 179392, r=shanjian, sr=bzbarsky 2002-11-14 00:56:01 +03:00			`// put termination characters (e.g. ESC(B of ISO-2022-JP) if necessary`
			`PRInt32 finLen = bufLen - outlen;`
			`if (finLen > 0) {`
			`if (NS_SUCCEEDED(encoder->Finish((char *)(pBuf+outlen), &finLen)))`
			`outlen += finLen;`
			`}`
Added a function to url unescape and convert to unicode, bug 25034, r=ftang. 2000-02-04 02:18:07 +03:00			`pBuf[outlen] = '\0';`
			`*_retval = nsEscape(pBuf, url_XPAlphas);`
			`if(nsnull == *_retval)`
			`rv = NS_ERROR_OUT_OF_MEMORY;`
			`}`
			`}`
			`if(pBuf != buf)`
			`PR_Free(pBuf);`
			`}`
			`NS_IF_RELEASE(encoder);`
1st check in 1999-09-21 04:30:12 +04:00			`}`
			`}`

			`return rv;`
			`}`
wired up nsTextToSubURI to the dll, remove unnecessary reghac2.h 1999-09-21 09:13:53 +04:00
Added a function to url unescape and convert to unicode, bug 25034, r=ftang. 2000-02-04 02:18:07 +03:00			`NS_IMETHODIMP nsTextToSubURI::UnEscapeAndConvert(`
			`const char *charset, const char *text, PRUnichar **_retval)`
			`{`
			`if(nsnull == _retval)`
			`return NS_ERROR_NULL_POINTER;`
			`*_retval = nsnull;`
			`nsresult rv = NS_OK;`

			`// unescape the string, unescape changes the input`
			`char *unescaped = nsCRT::strdup((char *) text);`
			`if (nsnull == unescaped)`
			`return NS_ERROR_OUT_OF_MEMORY;`
			`unescaped = nsUnescape(unescaped);`
			`NS_ASSERTION(unescaped, "nsUnescape returned null");`

			`// Convert from the charset to unicode`
Bug 86734: Remove NS_WITH_SERVICE. r=dbaron, rs=scc, a=asa 2001-07-25 11:54:28 +04:00			`nsCOMPtr<nsICharsetConverterManager> ccm =`
			`do_GetService(kCharsetConverterManagerCID, &rv);`
Added a function to url unescape and convert to unicode, bug 25034, r=ftang. 2000-02-04 02:18:07 +03:00			`if (NS_SUCCEEDED(rv)) {`
making string conversions explicit 2000-04-03 09:52:40 +04:00			`nsAutoString charsetStr; charsetStr.AssignWithConversion(charset);`
Added a function to url unescape and convert to unicode, bug 25034, r=ftang. 2000-02-04 02:18:07 +03:00			`nsIUnicodeDecoder *decoder;`
			`rv = ccm->GetUnicodeDecoder(&charsetStr, &decoder);`
			`if (NS_SUCCEEDED(rv)) {`
			`PRUnichar *pBuf = nsnull;`
eliminate nsCRT::strlen for char* strings (part 2), bug 124536 r=dp sr=brendan 2002-02-19 10:43:41 +03:00			`PRInt32 len = strlen(unescaped);`
Added a function to url unescape and convert to unicode, bug 25034, r=ftang. 2000-02-04 02:18:07 +03:00			`PRInt32 outlen = 0;`
			`if (NS_SUCCEEDED(rv = decoder->GetMaxLength(unescaped, len, &outlen))) {`
			`pBuf = (PRUnichar *) PR_Malloc((outlen+1)*sizeof(PRUnichar*));`
			`if (nsnull == pBuf)`
			`rv = NS_ERROR_OUT_OF_MEMORY;`
			`else {`
			`if (NS_SUCCEEDED(rv = decoder->Convert(unescaped, &len, pBuf, &outlen))) {`
			`pBuf[outlen] = 0;`
			`*_retval = pBuf;`
			`}`
			`}`
			`}`
			`NS_IF_RELEASE(decoder);`
			`}`
			`}`
			`PR_FREEIF(unescaped);`

			`return rv;`
			`}`

Added a function to unescape 8bit only, 7bit encoding support. bug 161479, r=shanjian, sr=jst, a=dbaron. 2002-09-08 19:08:21 +04:00			`static PRBool statefulCharset(const char *charset)`
			`{`
			`if (!nsCRT::strncasecmp(charset, "ISO-2022-", sizeof("ISO-2022-")-1) ||`
			`!nsCRT::strcasecmp(charset, "UTF-7") ||`
			`!nsCRT::strcasecmp(charset, "HZ-GB-2312"))`
			`return PR_TRUE;`

			`return PR_FALSE;`
			`}`

Added unescape function which takes a charset to uconv, changed uriloader to use the uconv unescape to handle unescape non Ascii URI correctly. bug 155569, r=ftang, sr=bzbarsky. 2002-08-12 23:23:22 +04:00			`nsresult nsTextToSubURI::convertURItoUnicode(const nsAFlatCString &aCharset,`
			`const nsAFlatCString &aURI,`
			`PRBool aIRI,`
			`nsAString &_retval)`
			`{`
			`nsresult rv = NS_OK;`

Added a function to unescape 8bit only, 7bit encoding support. bug 161479, r=shanjian, sr=jst, a=dbaron. 2002-09-08 19:08:21 +04:00			`// check for 7bit encoding the data may not be ASCII after we decode`
			`PRBool isStatefulCharset = statefulCharset(aCharset.get());`

			`if (!isStatefulCharset && IsASCII(aURI)) {`
Added unescape function which takes a charset to uconv, changed uriloader to use the uconv unescape to handle unescape non Ascii URI correctly. bug 155569, r=ftang, sr=bzbarsky. 2002-08-12 23:23:22 +04:00			`_retval.Assign(NS_ConvertASCIItoUCS2(aURI));`
			`return rv;`
			`}`

Added a function to unescape 8bit only, 7bit encoding support. bug 161479, r=shanjian, sr=jst, a=dbaron. 2002-09-08 19:08:21 +04:00			`if (!isStatefulCharset && aIRI) {`
bug 191542 : Add UTF-8 equivalent of \|IsASCII\|, IsUTF8. r=smontagu, sr=alecf 2003-03-25 11:11:13 +03:00			`if (IsUTF8(aURI)) {`
			`_retval.Assign(NS_ConvertUTF8toUCS2(aURI));`
Added unescape function which takes a charset to uconv, changed uriloader to use the uconv unescape to handle unescape non Ascii URI correctly. bug 155569, r=ftang, sr=bzbarsky. 2002-08-12 23:23:22 +04:00			`return rv;`
			`}`
			`}`

bug 163998: URL-unescape the image URL for rendering in the title bar (r=nhotta,jst, sr=darin, a=asa) 2003-02-19 14:14:35 +03:00			`// empty charset could indicate UTF-8, but aURI turns out not to be UTF-8.`
			`NS_ENSURE_FALSE(aCharset.IsEmpty(), NS_ERROR_INVALID_ARG);`

Added unescape function which takes a charset to uconv, changed uriloader to use the uconv unescape to handle unescape non Ascii URI correctly. bug 155569, r=ftang, sr=bzbarsky. 2002-08-12 23:23:22 +04:00			`nsCOMPtr<nsICharsetConverterManager2> charsetConverterManager;`

			`charsetConverterManager = do_GetService(NS_CHARSETCONVERTERMANAGER_CONTRACTID, &rv);`
			`NS_ENSURE_SUCCESS(rv, rv);`

			`nsCOMPtr<nsIAtom> charsetAtom;`
			`rv = charsetConverterManager->GetCharsetAtom2(aCharset.get(), getter_AddRefs(charsetAtom));`
			`NS_ENSURE_SUCCESS(rv, rv);`

			`nsCOMPtr<nsIUnicodeDecoder> unicodeDecoder;`
			`rv = charsetConverterManager->GetUnicodeDecoder(charsetAtom,`
			`getter_AddRefs(unicodeDecoder));`
			`NS_ENSURE_SUCCESS(rv, rv);`

			`PRInt32 srcLen = aURI.Length();`
			`PRInt32 dstLen;`
			`rv = unicodeDecoder->GetMaxLength(aURI.get(), srcLen, &dstLen);`
			`NS_ENSURE_SUCCESS(rv, rv);`

			`PRUnichar *ustr = (PRUnichar *) nsMemory::Alloc(dstLen * sizeof(PRUnichar));`
			`NS_ENSURE_TRUE(ustr, NS_ERROR_OUT_OF_MEMORY);`

			`rv = unicodeDecoder->Convert(aURI.get(), &srcLen, ustr, &dstLen);`

			`if (NS_SUCCEEDED(rv))`
			`_retval.Assign(ustr, dstLen);`

			`nsMemory::Free(ustr);`

			`return rv;`
			`}`

			`NS_IMETHODIMP nsTextToSubURI::UnEscapeURIForUI(const nsACString & aCharset,`
			`const nsACString &aURIFragment,`
			`nsAString &_retval)`
			`{`
			`nsCAutoString unescapedSpec(aURIFragment);`
			`NS_UnescapeURL(unescapedSpec);`

			`return convertURItoUnicode(PromiseFlatCString(aCharset), unescapedSpec, PR_TRUE, _retval);`
			`}`

Added a function to unescape 8bit only, 7bit encoding support. bug 161479, r=shanjian, sr=jst, a=dbaron. 2002-09-08 19:08:21 +04:00			`NS_IMETHODIMP nsTextToSubURI::UnEscapeNonAsciiURI(const nsACString & aCharset,`
			`const nsACString &aURIFragment,`
			`nsAString &_retval)`
			`{`
			`nsCAutoString unescapedSpec;`
			`NS_UnescapeURL(PromiseFlatCString(aURIFragment),`
			`esc_AlwaysCopy | esc_OnlyNonASCII, unescapedSpec);`

			`return convertURItoUnicode(PromiseFlatCString(aCharset), unescapedSpec, PR_TRUE, _retval);`
			`}`

Convert to module from component 1999-10-01 01:11:05 +04:00			`//----------------------------------------------------------------------`