// Mirror of https://github.com/mozilla/gecko-dev.git (100 lines, 3.2 KiB, C++)
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
|
|
/* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
|
|
|
#include "nsUnicodeNormalizer.h"
|
|
#include "ICUUtils.h"
|
|
#include "unicode/unorm2.h"
|
|
#include "unicode/utext.h"
|
|
|
|
// XPCOM boilerplate: generates the nsISupports methods for
// nsUnicodeNormalizer, with nsIUnicodeNormalizer as its queryable interface.
NS_IMPL_ISUPPORTS(nsUnicodeNormalizer, nsIUnicodeNormalizer)
|
|
|
|
// Construction performs no explicit initialization work.
nsUnicodeNormalizer::nsUnicodeNormalizer() = default;
|
|
|
|
// Destruction performs no explicit cleanup work.
nsUnicodeNormalizer::~nsUnicodeNormalizer() = default;
|
|
|
|
/**
 * Runs the given ICU normalizer over aSrc and stores the result in aDest.
 *
 * The output buffer is sized with an initial guess; if ICU reports that the
 * buffer was too small, it is resized to the length ICU asked for and the
 * normalization is retried.
 *
 * @param aNorm  ICU normalizer instance to apply.
 * @param aSrc   Input text; its buffer is handed to ICU as UChar units.
 * @param aDest  Receives the normalized text on success. On failure it is
 *               truncated to the empty string, so callers never observe the
 *               partially written scratch buffer.
 * @return The final ICU status, translated by ICUUtils::UErrorToNsResult.
 *
 * NOTE(review): the source pointer is captured before aDest is resized, so
 * this presumably expects aSrc and aDest to be distinct strings -- confirm
 * against callers.
 */
static nsresult
DoNormalization(const UNormalizer2* aNorm, const nsAString& aSrc,
                nsAString& aDest)
{
    UErrorCode errorCode = U_ZERO_ERROR;
    const int32_t length = aSrc.Length();
    const UChar* src = reinterpret_cast<const UChar*>(aSrc.BeginReading());
    // Initial guess for a capacity that is likely to be enough for most cases.
    int32_t capacity = length + (length >> 8) + 8;
    while (true) {
        aDest.SetLength(capacity);
        UChar* dest = reinterpret_cast<UChar*>(aDest.BeginWriting());
        // Reuse the cached source length instead of querying aSrc again.
        const int32_t len = unorm2_normalize(aNorm, src, length, dest,
                                             capacity, &errorCode);
        if (U_SUCCESS(errorCode)) {
            // Shrink the buffer down to what ICU actually wrote.
            aDest.SetLength(len);
            break;
        }
        if (errorCode != U_BUFFER_OVERFLOW_ERROR) {
            // Some other error that we don't handle. Don't leave the
            // oversized scratch buffer (with unspecified contents) in the
            // caller's output string.
            aDest.Truncate();
            break;
        }
        // Buffer wasn't big enough; adjust to the reported size and try again.
        capacity = len;
        errorCode = U_ZERO_ERROR;
    }
    return ICUUtils::UErrorToNsResult(errorCode);
}
|
|
|
|
/**
 * Normalizes aSrc to Unicode form NFD, writing the result to aDest.
 *
 * Returns the translated ICU error if the NFD normalizer could not be
 * obtained; otherwise returns whatever DoNormalization reports.
 */
nsresult
nsUnicodeNormalizer::NormalizeUnicodeNFD(const nsAString& aSrc,
                                         nsAString& aDest)
{
    // unorm2_getNFDInstance hands back a static singleton that must not be
    // deleted, so it is looked up on first use and the pointer (together
    // with the status of that lookup) is kept for every later call.
    static UErrorCode sLookupStatus = U_ZERO_ERROR;
    static const UNormalizer2* sNormalizer =
        unorm2_getNFDInstance(&sLookupStatus);

    if (!U_SUCCESS(sLookupStatus)) {
        return ICUUtils::UErrorToNsResult(sLookupStatus);
    }
    return DoNormalization(sNormalizer, aSrc, aDest);
}
|
|
|
|
/**
 * Normalizes aSrc to Unicode form NFC, writing the result to aDest.
 *
 * Returns the translated ICU error if the NFC normalizer could not be
 * obtained; otherwise returns whatever DoNormalization reports.
 */
nsresult
nsUnicodeNormalizer::NormalizeUnicodeNFC(const nsAString& aSrc,
                                         nsAString& aDest)
{
    // unorm2_getNFCInstance hands back a static singleton that must not be
    // deleted, so it is looked up on first use and the pointer (together
    // with the status of that lookup) is kept for every later call.
    static UErrorCode sLookupStatus = U_ZERO_ERROR;
    static const UNormalizer2* sNormalizer =
        unorm2_getNFCInstance(&sLookupStatus);

    if (!U_SUCCESS(sLookupStatus)) {
        return ICUUtils::UErrorToNsResult(sLookupStatus);
    }
    return DoNormalization(sNormalizer, aSrc, aDest);
}
|
|
|
|
/**
 * Normalizes aSrc to Unicode form NFKD, writing the result to aDest.
 *
 * Returns the translated ICU error if the NFKD normalizer could not be
 * obtained; otherwise returns whatever DoNormalization reports.
 */
nsresult
nsUnicodeNormalizer::NormalizeUnicodeNFKD(const nsAString& aSrc,
                                          nsAString& aDest)
{
    // unorm2_getNFKDInstance hands back a static singleton that must not be
    // deleted, so it is looked up on first use and the pointer (together
    // with the status of that lookup) is kept for every later call.
    static UErrorCode sLookupStatus = U_ZERO_ERROR;
    static const UNormalizer2* sNormalizer =
        unorm2_getNFKDInstance(&sLookupStatus);

    if (!U_SUCCESS(sLookupStatus)) {
        return ICUUtils::UErrorToNsResult(sLookupStatus);
    }
    return DoNormalization(sNormalizer, aSrc, aDest);
}
|
|
|
|
/**
 * Normalizes aSrc to Unicode form NFKC, writing the result to aDest.
 *
 * Returns the translated ICU error if the NFKC normalizer could not be
 * obtained; otherwise returns whatever DoNormalization reports.
 */
nsresult
nsUnicodeNormalizer::NormalizeUnicodeNFKC(const nsAString& aSrc,
                                          nsAString& aDest)
{
    // unorm2_getNFKCInstance hands back a static singleton that must not be
    // deleted, so it is looked up on first use and the pointer (together
    // with the status of that lookup) is kept for every later call.
    static UErrorCode sLookupStatus = U_ZERO_ERROR;
    static const UNormalizer2* sNormalizer =
        unorm2_getNFKCInstance(&sLookupStatus);

    if (!U_SUCCESS(sLookupStatus)) {
        return ICUUtils::UErrorToNsResult(sLookupStatus);
    }
    return DoNormalization(sNormalizer, aSrc, aDest);
}
|