2015-05-03 22:32:37 +03:00
|
|
|
/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
|
|
|
|
/* vim: set ts=8 sts=2 et sw=2 tw=80: */
|
2012-05-21 15:12:37 +04:00
|
|
|
/* This Source Code Form is subject to the terms of the Mozilla Public
|
|
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
|
|
|
|
2010-08-10 02:32:18 +04:00
|
|
|
// This file should only be compiled if you're on x86 or x86_64. Additionally,
|
|
|
|
// you'll need to compile this file with -msse2 if you're using gcc.
|
|
|
|
|
|
|
|
#include <emmintrin.h>
|
|
|
|
#include "nscore.h"
|
2011-06-25 18:06:02 +04:00
|
|
|
#include "nsAlgorithm.h"
|
2012-10-02 23:14:50 +04:00
|
|
|
#include "nsTextFragmentImpl.h"
|
2013-01-15 16:22:03 +04:00
|
|
|
#include <algorithm>
|
2010-08-10 02:32:18 +04:00
|
|
|
|
2020-01-18 16:48:34 +03:00
|
|
|
namespace mozilla::SSE2 {
|
2010-08-10 02:32:18 +04:00
|
|
|
|
|
|
|
// Returns true iff all 128 bits of |x| are zero.
static inline bool is_zero(__m128i x) {
  // Compare every byte against zero: matching bytes become 0xff, others 0x00.
  const __m128i zeroBytes = _mm_cmpeq_epi8(x, _mm_setzero_si128());
  // Collect the top bit of each of the 16 bytes; all sixteen bits are set
  // exactly when every byte of |x| compared equal to zero.
  const int byteMask = _mm_movemask_epi8(zeroBytes);
  return byteMask == 0xffff;
}
|
|
|
|
|
2014-01-04 19:02:17 +04:00
|
|
|
int32_t FirstNon8Bit(const char16_t* str, const char16_t* end) {
|
2012-08-22 19:56:38 +04:00
|
|
|
const uint32_t numUnicharsPerVector = 8;
|
2012-10-02 23:14:50 +04:00
|
|
|
typedef Non8BitParameters<sizeof(size_t)> p;
|
|
|
|
const size_t mask = p::mask();
|
|
|
|
const uint32_t numUnicharsPerWord = p::numUnicharsPerWord();
|
2012-08-22 19:56:38 +04:00
|
|
|
const int32_t len = end - str;
|
|
|
|
int32_t i = 0;
|
2010-08-10 02:32:18 +04:00
|
|
|
|
|
|
|
// Align ourselves to a 16-byte boundary, as required by _mm_load_si128
|
|
|
|
// (i.e. MOVDQA).
|
2012-08-22 19:56:38 +04:00
|
|
|
int32_t alignLen = std::min(
|
2014-01-04 19:02:17 +04:00
|
|
|
len, int32_t(((-NS_PTR_TO_INT32(str)) & 0xf) / sizeof(char16_t)));
|
2010-08-10 02:32:18 +04:00
|
|
|
for (; i < alignLen; i++) {
|
|
|
|
if (str[i] > 255) return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Check one XMM register (16 bytes) at a time.
|
2012-08-22 19:56:38 +04:00
|
|
|
const int32_t vectWalkEnd =
|
|
|
|
((len - i) / numUnicharsPerVector) * numUnicharsPerVector;
|
2013-08-05 20:45:50 +04:00
|
|
|
const uint16_t shortMask = 0xff00;
|
|
|
|
__m128i vectmask = _mm_set1_epi16(static_cast<int16_t>(shortMask));
|
2010-08-10 02:32:18 +04:00
|
|
|
for (; i < vectWalkEnd; i += numUnicharsPerVector) {
|
|
|
|
const __m128i vect = *reinterpret_cast<const __m128i*>(str + i);
|
|
|
|
if (!is_zero(_mm_and_si128(vect, vectmask))) return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Check one word at a time.
|
2012-08-22 19:56:38 +04:00
|
|
|
const int32_t wordWalkEnd =
|
|
|
|
((len - i) / numUnicharsPerWord) * numUnicharsPerWord;
|
2010-08-10 02:32:18 +04:00
|
|
|
for (; i < wordWalkEnd; i += numUnicharsPerWord) {
|
|
|
|
const size_t word = *reinterpret_cast<const size_t*>(str + i);
|
|
|
|
if (word & mask) return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Take care of the remainder one character at a time.
|
|
|
|
for (; i < len; i++) {
|
|
|
|
if (str[i] > 255) {
|
2011-09-09 20:27:00 +04:00
|
|
|
return i;
|
2010-08-10 02:32:18 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-09-09 20:27:00 +04:00
|
|
|
return -1;
|
2010-08-10 02:32:18 +04:00
|
|
|
}
|
|
|
|
|
2020-01-18 16:48:34 +03:00
|
|
|
} // namespace mozilla::SSE2
|