1998-04-14 00:24:54 +04:00
|
|
|
/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
|
|
|
|
*
|
|
|
|
* The contents of this file are subject to the Netscape Public License
|
|
|
|
* Version 1.0 (the "NPL"); you may not use this file except in
|
|
|
|
* compliance with the NPL. You may obtain a copy of the NPL at
|
|
|
|
* http://www.mozilla.org/NPL/
|
|
|
|
*
|
|
|
|
* Software distributed under the NPL is distributed on an "AS IS" basis,
|
|
|
|
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the NPL
|
|
|
|
* for the specific language governing rights and limitations under the
|
|
|
|
* NPL.
|
|
|
|
*
|
|
|
|
* The Initial Developer of this code under the NPL is Netscape
|
|
|
|
* Communications Corporation. Portions created by Netscape are
|
|
|
|
* Copyright (C) 1998 Netscape Communications Corporation. All Rights
|
|
|
|
* Reserved.
|
|
|
|
*/
|
1999-02-03 21:55:10 +03:00
|
|
|
|
|
|
|
#define NS_IMPL_IDS
|
1998-04-14 00:24:54 +04:00
|
|
|
#include "nsIUnicharInputStream.h"
|
|
|
|
#include "nsIByteBuffer.h"
|
|
|
|
#include "nsIUnicharBuffer.h"
|
1999-02-03 21:55:10 +03:00
|
|
|
#include "nsIServiceManager.h"
|
|
|
|
#include "nsICharsetConverterManager.h"
|
|
|
|
#include "nsIUnicodeDecoder.h"
|
1998-04-14 00:24:54 +04:00
|
|
|
#include "nsString.h"
|
|
|
|
#include "nsCRT.h"
|
|
|
|
#include <fcntl.h>
|
|
|
|
#ifdef NS_WIN32
|
|
|
|
#include <io.h>
|
|
|
|
#else
|
|
|
|
#include <unistd.h>
|
|
|
|
#endif
|
|
|
|
|
1999-07-22 09:25:17 +04:00
|
|
|
static NS_DEFINE_CID(kCharsetConverterManagerCID, NS_ICHARSETCONVERTERMANAGER_CID);
|
1998-04-14 00:24:54 +04:00
|
|
|
|
|
|
|
class StringUnicharInputStream : public nsIUnicharInputStream {
|
|
|
|
public:
|
|
|
|
StringUnicharInputStream(nsString* aString);
|
1999-04-25 08:57:38 +04:00
|
|
|
virtual ~StringUnicharInputStream();
|
1998-04-14 00:24:54 +04:00
|
|
|
|
|
|
|
NS_DECL_ISUPPORTS
|
|
|
|
|
1998-07-24 00:34:01 +04:00
|
|
|
NS_IMETHOD Read(PRUnichar* aBuf,
|
1998-12-16 08:40:20 +03:00
|
|
|
PRUint32 aOffset,
|
|
|
|
PRUint32 aCount,
|
|
|
|
PRUint32 *aReadCount);
|
1998-07-24 00:34:01 +04:00
|
|
|
NS_IMETHOD Close();
|
1998-04-14 00:24:54 +04:00
|
|
|
|
|
|
|
nsString* mString;
|
1998-12-16 08:40:20 +03:00
|
|
|
PRUint32 mPos;
|
|
|
|
PRUint32 mLen;
|
1998-04-14 00:24:54 +04:00
|
|
|
};
|
|
|
|
|
|
|
|
// Wraps aString (which must be non-null) and positions the stream at its
// first character. The string's length is read once, here.
StringUnicharInputStream::StringUnicharInputStream(nsString* aString)
  : mString(aString),
    mPos(0),
    mLen(aString->Length())
{
  NS_INIT_REFCNT();
}
|
|
|
|
|
|
|
|
// Frees the backing string held in mString.
StringUnicharInputStream::~StringUnicharInputStream()
{
  // No explicit null test needed: deleting a null pointer does nothing.
  delete mString;
}
|
|
|
|
|
1998-07-24 00:34:01 +04:00
|
|
|
/**
 * Copy the next run of characters out of the backing string.
 *
 * @param aBuf       destination buffer
 * @param aOffset    index in aBuf at which the first character is stored
 * @param aCount     maximum number of characters to copy
 * @param aReadCount receives the number of characters actually copied
 * @return NS_OK when characters were copied (possibly zero of them if
 *         aCount is zero); (nsresult)-1 with *aReadCount == 0 once the
 *         whole string has been consumed.
 */
nsresult StringUnicharInputStream::Read(PRUnichar* aBuf,
                                        PRUint32 aOffset,
                                        PRUint32 aCount,
                                        PRUint32 *aReadCount)
{
  // Nothing left to hand out.
  if (mLen <= mPos) {
    *aReadCount = 0;
    return (nsresult)-1;
  }

  NS_ASSERTION(mLen >= mPos, "unsigned madness");
  const PRUint32 remaining = mLen - mPos;
  const PRUint32 toCopy = (remaining > aCount) ? aCount : remaining;

  const PRUnichar* src = mString->GetUnicode() + mPos;
  nsCRT::memcpy(aBuf + aOffset, src, sizeof(PRUnichar) * toCopy);

  mPos += toCopy;
  *aReadCount = toCopy;
  return NS_OK;
}
|
|
|
|
|
1998-07-24 00:34:01 +04:00
|
|
|
/**
 * Close the stream: mark it as fully consumed and free the backing string.
 *
 * Safe to call more than once. Always returns NS_OK.
 */
nsresult StringUnicharInputStream::Close()
{
  // With mPos == mLen every later Read() takes its end-of-data path and
  // never touches mString.
  mPos = mLen;

  if (nsnull != mString) {
    delete mString;
    // Clear the pointer so that neither a second Close() nor the
    // destructor deletes the same string again.
    mString = nsnull;
  }
  return NS_OK;
}
|
|
|
|
|
1999-08-23 14:14:16 +04:00
|
|
|
// XPCOM boilerplate: provides the nsISupports methods declared by
// NS_DECL_ISUPPORTS in the class, with nsIUnicharInputStream as the one
// interface the object answers QueryInterface for.
NS_IMPL_ISUPPORTS1(StringUnicharInputStream, nsIUnicharInputStream)
|
1998-04-14 00:24:54 +04:00
|
|
|
|
1999-05-26 05:38:36 +04:00
|
|
|
/**
 * Create a unichar input stream that reads from aString.
 *
 * The new stream deletes aString when it is closed or destroyed.
 *
 * @param aInstancePtrResult receives the new stream (via QueryInterface)
 * @param aString            the string to read from; must be non-null
 * @return NS_ERROR_NULL_POINTER if either argument is null,
 *         NS_ERROR_OUT_OF_MEMORY if the stream cannot be allocated,
 *         otherwise the result of QueryInterface on the new stream.
 */
NS_COM nsresult
NS_NewStringUnicharInputStream(nsIUnicharInputStream** aInstancePtrResult,
                               nsString* aString)
{
  NS_PRECONDITION(nsnull != aString, "null ptr");
  NS_PRECONDITION(nsnull != aInstancePtrResult, "null ptr");

  if (nsnull == aString) {
    return NS_ERROR_NULL_POINTER;
  }
  if (nsnull == aInstancePtrResult) {
    return NS_ERROR_NULL_POINTER;
  }

  StringUnicharInputStream* stream = new StringUnicharInputStream(aString);
  if (nsnull == stream) {
    return NS_ERROR_OUT_OF_MEMORY;
  }

  void** result = (void**) aInstancePtrResult;
  return stream->QueryInterface(NS_GET_IID(nsIUnicharInputStream), result);
}
|
|
|
|
|
|
|
|
//----------------------------------------------------------------------
|
|
|
|
|
1999-02-03 21:55:10 +03:00
|
|
|
/**
|
1999-05-26 05:38:36 +04:00
|
|
|
* This function used to be public, with the NS_COM declaration. I am
|
1999-02-03 21:55:10 +03:00
|
|
|
* changing it right now into a module private visibility because there are
|
|
|
|
* better and more xpcom-like ways to get a Converter.
|
|
|
|
*/
|
1999-02-19 19:13:47 +03:00
|
|
|
|
|
|
|
nsresult NS_NewB2UConverter(nsIUnicodeDecoder** aInstancePtrResult, nsISupports* aOuter, nsString* aCharSet);
|
1999-02-03 21:55:10 +03:00
|
|
|
nsresult
|
|
|
|
NS_NewB2UConverter(nsIUnicodeDecoder** aInstancePtrResult,
|
1998-04-14 00:24:54 +04:00
|
|
|
nsISupports* aOuter,
|
1999-01-25 19:05:04 +03:00
|
|
|
nsString* aCharSet)
|
1998-04-14 00:24:54 +04:00
|
|
|
{
|
|
|
|
if (nsnull != aOuter) {
|
|
|
|
return NS_ERROR_NO_AGGREGATION;
|
|
|
|
}
|
1999-02-03 21:55:10 +03:00
|
|
|
|
|
|
|
// Create converter
|
|
|
|
nsresult res;
|
|
|
|
nsAutoString defaultCharset("ISO-8859-1");
|
|
|
|
|
|
|
|
if (aCharSet == nsnull) aCharSet = &defaultCharset;
|
|
|
|
|
1999-09-26 14:05:06 +04:00
|
|
|
NS_WITH_SERVICE(nsICharsetConverterManager, ccm, kCharsetConverterManagerCID, &res);
|
|
|
|
if (NS_FAILED(res)) return res;
|
1999-02-03 21:55:10 +03:00
|
|
|
|
1999-09-26 14:05:06 +04:00
|
|
|
return ccm->GetUnicodeDecoder(aCharSet, aInstancePtrResult);
|
1998-04-14 00:24:54 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
//----------------------------------------------------------------------
|
|
|
|
|
|
|
|
class ConverterInputStream : public nsIUnicharInputStream {
|
|
|
|
public:
|
|
|
|
ConverterInputStream(nsIInputStream* aStream,
|
1999-02-03 21:55:10 +03:00
|
|
|
nsIUnicodeDecoder* aConverter,
|
1998-12-16 08:40:20 +03:00
|
|
|
PRUint32 aBufSize);
|
1999-04-25 08:57:38 +04:00
|
|
|
virtual ~ConverterInputStream();
|
1998-04-14 00:24:54 +04:00
|
|
|
|
|
|
|
NS_DECL_ISUPPORTS
|
1998-07-24 00:34:01 +04:00
|
|
|
NS_IMETHOD Read(PRUnichar* aBuf,
|
1998-12-16 08:40:20 +03:00
|
|
|
PRUint32 aOffset,
|
|
|
|
PRUint32 aCount,
|
|
|
|
PRUint32 *aReadCount);
|
1998-07-24 00:34:01 +04:00
|
|
|
NS_IMETHOD Close();
|
1998-04-14 00:24:54 +04:00
|
|
|
|
|
|
|
protected:
|
1998-07-24 00:34:01 +04:00
|
|
|
PRInt32 Fill(nsresult * aErrorCode);
|
1998-04-14 00:24:54 +04:00
|
|
|
|
|
|
|
nsIInputStream* mInput;
|
1999-02-03 21:55:10 +03:00
|
|
|
nsIUnicodeDecoder* mConverter;
|
1998-04-14 00:24:54 +04:00
|
|
|
nsIByteBuffer* mByteData;
|
1998-12-16 08:40:20 +03:00
|
|
|
PRUint32 mByteDataOffset;
|
1998-04-14 00:24:54 +04:00
|
|
|
nsIUnicharBuffer* mUnicharData;
|
1998-12-16 08:40:20 +03:00
|
|
|
PRUint32 mUnicharDataOffset;
|
|
|
|
PRUint32 mUnicharDataLength;
|
1998-04-14 00:24:54 +04:00
|
|
|
};
|
|
|
|
|
|
|
|
/**
 * Wrap aStream so that its bytes are decoded by aConverter.
 *
 * Takes a reference on both aStream and aConverter; both must be non-null.
 *
 * @param aStream     the byte stream to read from
 * @param aConverter  the decoder used to turn bytes into PRUnichars
 * @param aBufferSize size passed to both buffer factories; 0 means 8192
 */
ConverterInputStream::ConverterInputStream(nsIInputStream* aStream,
                                           nsIUnicodeDecoder* aConverter,
                                           PRUint32 aBufferSize)
{
  NS_INIT_REFCNT();
  mInput = aStream; aStream->AddRef();
  mConverter = aConverter; aConverter->AddRef();
  if (aBufferSize == 0) {
    aBufferSize = 8192;
  }

  // Start from null so that, should either factory below fail without
  // writing its out-parameter, Close() sees a null pointer instead of
  // calling Release() on an uninitialized one.
  mByteData = nsnull;
  mUnicharData = nsnull;

  // XXX what if these fail? The results are still ignored here; a failed
  // allocation leaves the corresponding member null.
  NS_NewByteBuffer(&mByteData, nsnull, aBufferSize);
  NS_NewUnicharBuffer(&mUnicharData, nsnull, aBufferSize);

  mByteDataOffset = 0;
  mUnicharDataOffset = 0;
  mUnicharDataLength = 0;
}
|
|
|
|
|
1999-08-23 14:14:16 +04:00
|
|
|
// XPCOM boilerplate: provides the nsISupports methods declared by
// NS_DECL_ISUPPORTS in the class, with nsIUnicharInputStream as the one
// interface the object answers QueryInterface for.
NS_IMPL_ISUPPORTS1(ConverterInputStream,nsIUnicharInputStream)
|
1998-04-14 00:24:54 +04:00
|
|
|
|
|
|
|
// Destruction is simply a Close(): that drops every reference this
// object still holds.
ConverterInputStream::~ConverterInputStream()
{
  Close();
}
|
|
|
|
|
1998-07-24 00:34:01 +04:00
|
|
|
/**
 * Release the wrapped stream, the decoder and both buffers, nulling each
 * member as it goes so that repeated calls are harmless.
 *
 * Always returns NS_OK.
 */
nsresult ConverterInputStream::Close()
{
  // Source stream
  if (mInput != nsnull) {
    mInput->Release();
    mInput = nsnull;
  }

  // Decoder
  if (mConverter != nsnull) {
    mConverter->Release();
    mConverter = nsnull;
  }

  // Raw byte buffer
  if (mByteData != nsnull) {
    mByteData->Release();
    mByteData = nsnull;
  }

  // Converted character buffer
  if (mUnicharData != nsnull) {
    mUnicharData->Release();
    mUnicharData = nsnull;
  }

  return NS_OK;
}
|
|
|
|
|
1998-07-24 00:34:01 +04:00
|
|
|
/**
 * Hand out converted characters, refilling the character buffer from the
 * underlying byte stream when it is empty.
 *
 * @param aBuf       destination buffer
 * @param aOffset    index in aBuf at which the first character is stored
 * @param aCount     maximum number of characters to copy
 * @param aReadCount receives the number of characters actually copied
 * @return NS_OK when characters were copied; otherwise the error code
 *         reported by Fill() (e.g. NS_BASE_STREAM_CLOSED after Close()),
 *         with *aReadCount set to 0.
 */
nsresult ConverterInputStream::Read(PRUnichar* aBuf,
                                    PRUint32 aOffset,
                                    PRUint32 aCount,
                                    PRUint32 *aReadCount)
{
  NS_ASSERTION(mUnicharDataLength >= mUnicharDataOffset, "unsigned madness");

  // Characters still waiting in the buffer. If the buffer itself is gone
  // (Close() releases it) nothing is available, whatever the counters say;
  // Fill() below then reports the reason.
  PRUint32 available = 0;
  if (nsnull != mUnicharData) {
    available = mUnicharDataLength - mUnicharDataOffset;
  }

  if (0 == available) {
    // Fill the unichar buffer. Keep the result signed: Fill() returns a
    // negative value on failure, which an unsigned variable would turn
    // into a huge bogus character count.
    nsresult errorCode = NS_OK;
    PRInt32 filled = Fill(&errorCode);
    if (filled <= 0) {
      *aReadCount = 0;
      return errorCode;
    }
    available = (PRUint32) filled;
  }

  if (available > aCount) {
    available = aCount;
  }
  nsCRT::memcpy(aBuf + aOffset, mUnicharData->GetBuffer() + mUnicharDataOffset,
                available * sizeof(PRUnichar));
  mUnicharDataOffset += available;
  *aReadCount = available;
  return NS_OK;
}
|
|
|
|
|
1998-07-24 00:34:01 +04:00
|
|
|
/**
 * Read more bytes from the wrapped stream and convert them to Unicode.
 *
 * Bytes left unconverted by the previous call are carried over and
 * converted together with the newly read ones.
 *
 * @param aErrorCode receives NS_BASE_STREAM_CLOSED if the stream was
 *                   closed, otherwise whatever the byte buffer's Fill()
 *                   or the decoder's Convert() reports
 * @return the number of characters now available in mUnicharData, or a
 *         value <= 0 when no new bytes could be read.
 */
PRInt32 ConverterInputStream::Fill(nsresult * aErrorCode)
{
  if (nsnull == mInput) {
    // We already closed the stream!
    *aErrorCode = NS_BASE_STREAM_CLOSED;
    return -1;
  }

  NS_ASSERTION(mByteData->GetLength() >= mByteDataOffset, "unsigned madness");
  PRUint32 remainder = mByteData->GetLength() - mByteDataOffset;

  // Ask the byte buffer to keep the `remainder` unconverted bytes and read
  // more after them. Setting the offset to `remainder` first means that,
  // if nothing new arrives, those kept bytes count as consumed.
  mByteDataOffset = remainder;
  PRInt32 nb = mByteData->Fill(aErrorCode, mInput, remainder);
  if (nb <= 0) {
    // Because we assume a many to one conversion, the lingering data
    // in the byte buffer must be a partial conversion
    // fragment. Because we know that we have received no more new
    // data to add to it, we can't convert it. Therefore, we discard
    // it.
    return nb;
  }
  NS_ASSERTION(remainder + nb == mByteData->GetLength(), "bad nb");

  // Now convert as much of the byte buffer to unicode as possible
  PRInt32 dstLen = mUnicharData->GetBufferSize();
  PRInt32 srcLen = remainder + nb;
  *aErrorCode = mConverter->Convert(mByteData->GetBuffer(), &srcLen,
                                    mUnicharData->GetBuffer(), &dstLen);
  mUnicharDataOffset = 0;
  mUnicharDataLength = dstLen;

  // Conversion started at the beginning of the byte buffer, so the number
  // of bytes consumed (srcLen, as updated by Convert) IS the new offset.
  // Adding it to the earlier value of `remainder` would count the
  // carried-over bytes twice and push the offset past the data.
  mByteDataOffset = srcLen;
  return dstLen;
}
|
|
|
|
|
|
|
|
// XXX hook up auto-detect here (do we need more info, like the url?)
|
1999-05-26 05:38:36 +04:00
|
|
|
/**
 * Create a unichar input stream that decodes the bytes of aStreamToWrap
 * using the decoder for aCharSet.
 *
 * @param aInstancePtrResult receives the new stream (via QueryInterface)
 * @param aOuter             must be null; aggregation is not supported
 * @param aStreamToWrap      the byte stream to decode; must be non-null
 * @param aBufferSize        buffer size for the new stream; 0 or a
 *                           negative value selects the stream's default
 * @param aCharSet           charset name, passed to NS_NewB2UConverter
 * @return NS_ERROR_NO_AGGREGATION if aOuter is non-null,
 *         NS_ERROR_NULL_POINTER if aInstancePtrResult or aStreamToWrap is
 *         null, the error from NS_NewB2UConverter if no decoder could be
 *         obtained, NS_ERROR_OUT_OF_MEMORY if the stream cannot be
 *         allocated, otherwise the result of QueryInterface.
 */
NS_COM nsresult
NS_NewConverterStream(nsIUnicharInputStream** aInstancePtrResult,
                      nsISupports* aOuter,
                      nsIInputStream* aStreamToWrap,
                      PRInt32 aBufferSize,
                      nsString* aCharSet)
{
  if (nsnull != aOuter) {
    return NS_ERROR_NO_AGGREGATION;
  }

  // Validate before any resource is acquired: the stream constructor
  // dereferences aStreamToWrap unconditionally.
  NS_PRECONDITION(nsnull != aStreamToWrap, "null ptr");
  NS_PRECONDITION(nsnull != aInstancePtrResult, "null ptr");
  if ((nsnull == aStreamToWrap) || (nsnull == aInstancePtrResult)) {
    return NS_ERROR_NULL_POINTER;
  }

  // The stream takes an unsigned size; a negative request would wrap to a
  // huge value, so treat it like 0 (which the stream maps to its default).
  if (aBufferSize < 0) {
    aBufferSize = 0;
  }

  // Create converter
  nsIUnicodeDecoder* converter;
  nsresult rv = NS_NewB2UConverter(&converter, nsnull, aCharSet);
  if (NS_OK != rv) {
    return rv;
  }

  // Create converter input stream
  ConverterInputStream* it =
    new ConverterInputStream(aStreamToWrap, converter, aBufferSize);
  // The stream (if created) holds its own reference on the converter.
  NS_RELEASE(converter);
  if (nsnull == it) {
    return NS_ERROR_OUT_OF_MEMORY;
  }
  return it->QueryInterface(NS_GET_IID(nsIUnicharInputStream),
                            (void **) aInstancePtrResult);
}
|